| // SPDX-License-Identifier: GPL-2.0-or-later |
| /* |
| * Firmware-Assisted Dump support on POWERVM platform. |
| * |
| * Copyright 2011, Mahesh Salgaonkar, IBM Corporation. |
| * Copyright 2019, Hari Bathini, IBM Corporation. |
| */ |
| |
| #define pr_fmt(fmt) "rtas fadump: " fmt |
| |
| #include <linux/string.h> |
| #include <linux/memblock.h> |
| #include <linux/delay.h> |
| #include <linux/seq_file.h> |
| #include <linux/crash_dump.h> |
| #include <linux/of.h> |
| #include <linux/of_fdt.h> |
| |
| #include <asm/page.h> |
| #include <asm/rtas.h> |
| #include <asm/fadump.h> |
| #include <asm/fadump-internal.h> |
| |
| #include "rtas-fadump.h" |
| |
| static struct rtas_fadump_mem_struct fdm; |
| static const struct rtas_fadump_mem_struct *fdm_active; |
| |
| static void rtas_fadump_update_config(struct fw_dump *fadump_conf, |
| const struct rtas_fadump_mem_struct *fdm) |
| { |
| fadump_conf->boot_mem_dest_addr = |
| be64_to_cpu(fdm->rmr_region.destination_address); |
| |
| fadump_conf->fadumphdr_addr = (fadump_conf->boot_mem_dest_addr + |
| fadump_conf->boot_memory_size); |
| } |
| |
| /* |
| * This function is called in the capture kernel to get configuration details |
| * setup in the first kernel and passed to the f/w. |
| */ |
| static void __init rtas_fadump_get_config(struct fw_dump *fadump_conf, |
| const struct rtas_fadump_mem_struct *fdm) |
| { |
| fadump_conf->boot_mem_addr[0] = |
| be64_to_cpu(fdm->rmr_region.source_address); |
| fadump_conf->boot_mem_sz[0] = be64_to_cpu(fdm->rmr_region.source_len); |
| fadump_conf->boot_memory_size = fadump_conf->boot_mem_sz[0]; |
| |
| fadump_conf->boot_mem_top = fadump_conf->boot_memory_size; |
| fadump_conf->boot_mem_regs_cnt = 1; |
| |
| /* |
| * Start address of reserve dump area (permanent reservation) for |
| * re-registering FADump after dump capture. |
| */ |
| fadump_conf->reserve_dump_area_start = |
| be64_to_cpu(fdm->cpu_state_data.destination_address); |
| |
| rtas_fadump_update_config(fadump_conf, fdm); |
| } |
| |
| static u64 rtas_fadump_init_mem_struct(struct fw_dump *fadump_conf) |
| { |
| u64 addr = fadump_conf->reserve_dump_area_start; |
| |
| memset(&fdm, 0, sizeof(struct rtas_fadump_mem_struct)); |
| addr = addr & PAGE_MASK; |
| |
| fdm.header.dump_format_version = cpu_to_be32(0x00000001); |
| fdm.header.dump_num_sections = cpu_to_be16(3); |
| fdm.header.dump_status_flag = 0; |
| fdm.header.offset_first_dump_section = |
| cpu_to_be32((u32)offsetof(struct rtas_fadump_mem_struct, |
| cpu_state_data)); |
| |
| /* |
| * Fields for disk dump option. |
| * We are not using disk dump option, hence set these fields to 0. |
| */ |
| fdm.header.dd_block_size = 0; |
| fdm.header.dd_block_offset = 0; |
| fdm.header.dd_num_blocks = 0; |
| fdm.header.dd_offset_disk_path = 0; |
| |
| /* set 0 to disable an automatic dump-reboot. */ |
| fdm.header.max_time_auto = 0; |
| |
| /* Kernel dump sections */ |
| /* cpu state data section. */ |
| fdm.cpu_state_data.request_flag = |
| cpu_to_be32(RTAS_FADUMP_REQUEST_FLAG); |
| fdm.cpu_state_data.source_data_type = |
| cpu_to_be16(RTAS_FADUMP_CPU_STATE_DATA); |
| fdm.cpu_state_data.source_address = 0; |
| fdm.cpu_state_data.source_len = |
| cpu_to_be64(fadump_conf->cpu_state_data_size); |
| fdm.cpu_state_data.destination_address = cpu_to_be64(addr); |
| addr += fadump_conf->cpu_state_data_size; |
| |
| /* hpte region section */ |
| fdm.hpte_region.request_flag = cpu_to_be32(RTAS_FADUMP_REQUEST_FLAG); |
| fdm.hpte_region.source_data_type = |
| cpu_to_be16(RTAS_FADUMP_HPTE_REGION); |
| fdm.hpte_region.source_address = 0; |
| fdm.hpte_region.source_len = |
| cpu_to_be64(fadump_conf->hpte_region_size); |
| fdm.hpte_region.destination_address = cpu_to_be64(addr); |
| addr += fadump_conf->hpte_region_size; |
| |
| /* |
| * Align boot memory area destination address to page boundary to |
| * be able to mmap read this area in the vmcore. |
| */ |
| addr = PAGE_ALIGN(addr); |
| |
| /* RMA region section */ |
| fdm.rmr_region.request_flag = cpu_to_be32(RTAS_FADUMP_REQUEST_FLAG); |
| fdm.rmr_region.source_data_type = |
| cpu_to_be16(RTAS_FADUMP_REAL_MODE_REGION); |
| fdm.rmr_region.source_address = cpu_to_be64(0); |
| fdm.rmr_region.source_len = cpu_to_be64(fadump_conf->boot_memory_size); |
| fdm.rmr_region.destination_address = cpu_to_be64(addr); |
| addr += fadump_conf->boot_memory_size; |
| |
| rtas_fadump_update_config(fadump_conf, &fdm); |
| |
| return addr; |
| } |
| |
| static u64 rtas_fadump_get_bootmem_min(void) |
| { |
| return RTAS_FADUMP_MIN_BOOT_MEM; |
| } |
| |
| static int rtas_fadump_register(struct fw_dump *fadump_conf) |
| { |
| unsigned int wait_time; |
| int rc, err = -EIO; |
| |
| /* TODO: Add upper time limit for the delay */ |
| do { |
| rc = rtas_call(fadump_conf->ibm_configure_kernel_dump, 3, 1, |
| NULL, FADUMP_REGISTER, &fdm, |
| sizeof(struct rtas_fadump_mem_struct)); |
| |
| wait_time = rtas_busy_delay_time(rc); |
| if (wait_time) |
| mdelay(wait_time); |
| |
| } while (wait_time); |
| |
| switch (rc) { |
| case 0: |
| pr_info("Registration is successful!\n"); |
| fadump_conf->dump_registered = 1; |
| err = 0; |
| break; |
| case -1: |
| pr_err("Failed to register. Hardware Error(%d).\n", rc); |
| break; |
| case -3: |
| if (!is_fadump_boot_mem_contiguous()) |
| pr_err("Can't have holes in boot memory area.\n"); |
| else if (!is_fadump_reserved_mem_contiguous()) |
| pr_err("Can't have holes in reserved memory area.\n"); |
| |
| pr_err("Failed to register. Parameter Error(%d).\n", rc); |
| err = -EINVAL; |
| break; |
| case -9: |
| pr_err("Already registered!\n"); |
| fadump_conf->dump_registered = 1; |
| err = -EEXIST; |
| break; |
| default: |
| pr_err("Failed to register. Unknown Error(%d).\n", rc); |
| break; |
| } |
| |
| return err; |
| } |
| |
| static int rtas_fadump_unregister(struct fw_dump *fadump_conf) |
| { |
| unsigned int wait_time; |
| int rc; |
| |
| /* TODO: Add upper time limit for the delay */ |
| do { |
| rc = rtas_call(fadump_conf->ibm_configure_kernel_dump, 3, 1, |
| NULL, FADUMP_UNREGISTER, &fdm, |
| sizeof(struct rtas_fadump_mem_struct)); |
| |
| wait_time = rtas_busy_delay_time(rc); |
| if (wait_time) |
| mdelay(wait_time); |
| } while (wait_time); |
| |
| if (rc) { |
| pr_err("Failed to un-register - unexpected error(%d).\n", rc); |
| return -EIO; |
| } |
| |
| fadump_conf->dump_registered = 0; |
| return 0; |
| } |
| |
| static int rtas_fadump_invalidate(struct fw_dump *fadump_conf) |
| { |
| unsigned int wait_time; |
| int rc; |
| |
| /* TODO: Add upper time limit for the delay */ |
| do { |
| rc = rtas_call(fadump_conf->ibm_configure_kernel_dump, 3, 1, |
| NULL, FADUMP_INVALIDATE, fdm_active, |
| sizeof(struct rtas_fadump_mem_struct)); |
| |
| wait_time = rtas_busy_delay_time(rc); |
| if (wait_time) |
| mdelay(wait_time); |
| } while (wait_time); |
| |
| if (rc) { |
| pr_err("Failed to invalidate - unexpected error (%d).\n", rc); |
| return -EIO; |
| } |
| |
| fadump_conf->dump_active = 0; |
| fdm_active = NULL; |
| return 0; |
| } |
| |
| #define RTAS_FADUMP_GPR_MASK 0xffffff0000000000 |
| static inline int rtas_fadump_gpr_index(u64 id) |
| { |
| char str[3]; |
| int i = -1; |
| |
| if ((id & RTAS_FADUMP_GPR_MASK) == fadump_str_to_u64("GPR")) { |
| /* get the digits at the end */ |
| id &= ~RTAS_FADUMP_GPR_MASK; |
| id >>= 24; |
| str[2] = '\0'; |
| str[1] = id & 0xff; |
| str[0] = (id >> 8) & 0xff; |
| if (kstrtoint(str, 10, &i)) |
| i = -EINVAL; |
| if (i > 31) |
| i = -1; |
| } |
| return i; |
| } |
| |
| static void __init rtas_fadump_set_regval(struct pt_regs *regs, u64 reg_id, u64 reg_val) |
| { |
| int i; |
| |
| i = rtas_fadump_gpr_index(reg_id); |
| if (i >= 0) |
| regs->gpr[i] = (unsigned long)reg_val; |
| else if (reg_id == fadump_str_to_u64("NIA")) |
| regs->nip = (unsigned long)reg_val; |
| else if (reg_id == fadump_str_to_u64("MSR")) |
| regs->msr = (unsigned long)reg_val; |
| else if (reg_id == fadump_str_to_u64("CTR")) |
| regs->ctr = (unsigned long)reg_val; |
| else if (reg_id == fadump_str_to_u64("LR")) |
| regs->link = (unsigned long)reg_val; |
| else if (reg_id == fadump_str_to_u64("XER")) |
| regs->xer = (unsigned long)reg_val; |
| else if (reg_id == fadump_str_to_u64("CR")) |
| regs->ccr = (unsigned long)reg_val; |
| else if (reg_id == fadump_str_to_u64("DAR")) |
| regs->dar = (unsigned long)reg_val; |
| else if (reg_id == fadump_str_to_u64("DSISR")) |
| regs->dsisr = (unsigned long)reg_val; |
| } |
| |
| static struct rtas_fadump_reg_entry* __init |
| rtas_fadump_read_regs(struct rtas_fadump_reg_entry *reg_entry, |
| struct pt_regs *regs) |
| { |
| memset(regs, 0, sizeof(struct pt_regs)); |
| |
| while (be64_to_cpu(reg_entry->reg_id) != fadump_str_to_u64("CPUEND")) { |
| rtas_fadump_set_regval(regs, be64_to_cpu(reg_entry->reg_id), |
| be64_to_cpu(reg_entry->reg_value)); |
| reg_entry++; |
| } |
| reg_entry++; |
| return reg_entry; |
| } |
| |
| /* |
| * Read CPU state dump data and convert it into ELF notes. |
| * The CPU dump starts with magic number "REGSAVE". NumCpusOffset should be |
| * used to access the data to allow for additional fields to be added without |
| * affecting compatibility. Each list of registers for a CPU starts with |
| * "CPUSTRT" and ends with "CPUEND". Each register entry is of 16 bytes, |
| * 8 Byte ASCII identifier and 8 Byte register value. The register entry |
| * with identifier "CPUSTRT" and "CPUEND" contains 4 byte cpu id as part |
| * of register value. For more details refer to PAPR document. |
| * |
| * Only for the crashing cpu we ignore the CPU dump data and get exact |
| * state from fadump crash info structure populated by first kernel at the |
| * time of crash. |
| */ |
| static int __init rtas_fadump_build_cpu_notes(struct fw_dump *fadump_conf) |
| { |
| struct rtas_fadump_reg_save_area_header *reg_header; |
| struct fadump_crash_info_header *fdh = NULL; |
| struct rtas_fadump_reg_entry *reg_entry; |
| u32 num_cpus, *note_buf; |
| int i, rc = 0, cpu = 0; |
| struct pt_regs regs; |
| unsigned long addr; |
| void *vaddr; |
| |
| addr = be64_to_cpu(fdm_active->cpu_state_data.destination_address); |
| vaddr = __va(addr); |
| |
| reg_header = vaddr; |
| if (be64_to_cpu(reg_header->magic_number) != |
| fadump_str_to_u64("REGSAVE")) { |
| pr_err("Unable to read register save area.\n"); |
| return -ENOENT; |
| } |
| |
| pr_debug("--------CPU State Data------------\n"); |
| pr_debug("Magic Number: %llx\n", be64_to_cpu(reg_header->magic_number)); |
| pr_debug("NumCpuOffset: %x\n", be32_to_cpu(reg_header->num_cpu_offset)); |
| |
| vaddr += be32_to_cpu(reg_header->num_cpu_offset); |
| num_cpus = be32_to_cpu(*((__be32 *)(vaddr))); |
| pr_debug("NumCpus : %u\n", num_cpus); |
| vaddr += sizeof(u32); |
| reg_entry = (struct rtas_fadump_reg_entry *)vaddr; |
| |
| rc = fadump_setup_cpu_notes_buf(num_cpus); |
| if (rc != 0) |
| return rc; |
| |
| note_buf = (u32 *)fadump_conf->cpu_notes_buf_vaddr; |
| |
| if (fadump_conf->fadumphdr_addr) |
| fdh = __va(fadump_conf->fadumphdr_addr); |
| |
| for (i = 0; i < num_cpus; i++) { |
| if (be64_to_cpu(reg_entry->reg_id) != |
| fadump_str_to_u64("CPUSTRT")) { |
| pr_err("Unable to read CPU state data\n"); |
| rc = -ENOENT; |
| goto error_out; |
| } |
| /* Lower 4 bytes of reg_value contains logical cpu id */ |
| cpu = (be64_to_cpu(reg_entry->reg_value) & |
| RTAS_FADUMP_CPU_ID_MASK); |
| if (fdh && !cpumask_test_cpu(cpu, &fdh->cpu_mask)) { |
| RTAS_FADUMP_SKIP_TO_NEXT_CPU(reg_entry); |
| continue; |
| } |
| pr_debug("Reading register data for cpu %d...\n", cpu); |
| if (fdh && fdh->crashing_cpu == cpu) { |
| regs = fdh->regs; |
| note_buf = fadump_regs_to_elf_notes(note_buf, ®s); |
| RTAS_FADUMP_SKIP_TO_NEXT_CPU(reg_entry); |
| } else { |
| reg_entry++; |
| reg_entry = rtas_fadump_read_regs(reg_entry, ®s); |
| note_buf = fadump_regs_to_elf_notes(note_buf, ®s); |
| } |
| } |
| final_note(note_buf); |
| |
| if (fdh) { |
| pr_debug("Updating elfcore header (%llx) with cpu notes\n", |
| fdh->elfcorehdr_addr); |
| fadump_update_elfcore_header(__va(fdh->elfcorehdr_addr)); |
| } |
| return 0; |
| |
| error_out: |
| fadump_free_cpu_notes_buf(); |
| return rc; |
| |
| } |
| |
| /* |
| * Validate and process the dump data stored by firmware before exporting |
| * it through '/proc/vmcore'. |
| */ |
| static int __init rtas_fadump_process(struct fw_dump *fadump_conf) |
| { |
| struct fadump_crash_info_header *fdh; |
| int rc = 0; |
| |
| if (!fdm_active || !fadump_conf->fadumphdr_addr) |
| return -EINVAL; |
| |
| /* Check if the dump data is valid. */ |
| if ((be16_to_cpu(fdm_active->header.dump_status_flag) == |
| RTAS_FADUMP_ERROR_FLAG) || |
| (fdm_active->cpu_state_data.error_flags != 0) || |
| (fdm_active->rmr_region.error_flags != 0)) { |
| pr_err("Dump taken by platform is not valid\n"); |
| return -EINVAL; |
| } |
| if ((fdm_active->rmr_region.bytes_dumped != |
| fdm_active->rmr_region.source_len) || |
| !fdm_active->cpu_state_data.bytes_dumped) { |
| pr_err("Dump taken by platform is incomplete\n"); |
| return -EINVAL; |
| } |
| |
| /* Validate the fadump crash info header */ |
| fdh = __va(fadump_conf->fadumphdr_addr); |
| if (fdh->magic_number != FADUMP_CRASH_INFO_MAGIC) { |
| pr_err("Crash info header is not valid.\n"); |
| return -EINVAL; |
| } |
| |
| rc = rtas_fadump_build_cpu_notes(fadump_conf); |
| if (rc) |
| return rc; |
| |
| /* |
| * We are done validating dump info and elfcore header is now ready |
| * to be exported. set elfcorehdr_addr so that vmcore module will |
| * export the elfcore header through '/proc/vmcore'. |
| */ |
| elfcorehdr_addr = fdh->elfcorehdr_addr; |
| |
| return 0; |
| } |
| |
| static void rtas_fadump_region_show(struct fw_dump *fadump_conf, |
| struct seq_file *m) |
| { |
| const struct rtas_fadump_section *cpu_data_section; |
| const struct rtas_fadump_mem_struct *fdm_ptr; |
| |
| if (fdm_active) |
| fdm_ptr = fdm_active; |
| else |
| fdm_ptr = &fdm; |
| |
| cpu_data_section = &(fdm_ptr->cpu_state_data); |
| seq_printf(m, "CPU :[%#016llx-%#016llx] %#llx bytes, Dumped: %#llx\n", |
| be64_to_cpu(cpu_data_section->destination_address), |
| be64_to_cpu(cpu_data_section->destination_address) + |
| be64_to_cpu(cpu_data_section->source_len) - 1, |
| be64_to_cpu(cpu_data_section->source_len), |
| be64_to_cpu(cpu_data_section->bytes_dumped)); |
| |
| seq_printf(m, "HPTE:[%#016llx-%#016llx] %#llx bytes, Dumped: %#llx\n", |
| be64_to_cpu(fdm_ptr->hpte_region.destination_address), |
| be64_to_cpu(fdm_ptr->hpte_region.destination_address) + |
| be64_to_cpu(fdm_ptr->hpte_region.source_len) - 1, |
| be64_to_cpu(fdm_ptr->hpte_region.source_len), |
| be64_to_cpu(fdm_ptr->hpte_region.bytes_dumped)); |
| |
| seq_printf(m, "DUMP: Src: %#016llx, Dest: %#016llx, ", |
| be64_to_cpu(fdm_ptr->rmr_region.source_address), |
| be64_to_cpu(fdm_ptr->rmr_region.destination_address)); |
| seq_printf(m, "Size: %#llx, Dumped: %#llx bytes\n", |
| be64_to_cpu(fdm_ptr->rmr_region.source_len), |
| be64_to_cpu(fdm_ptr->rmr_region.bytes_dumped)); |
| |
| /* Dump is active. Show preserved area start address. */ |
| if (fdm_active) { |
| seq_printf(m, "\nMemory above %#016llx is reserved for saving crash dump\n", |
| fadump_conf->boot_mem_top); |
| } |
| } |
| |
| static void rtas_fadump_trigger(struct fadump_crash_info_header *fdh, |
| const char *msg) |
| { |
| /* Call ibm,os-term rtas call to trigger firmware assisted dump */ |
| rtas_os_term((char *)msg); |
| } |
| |
| static struct fadump_ops rtas_fadump_ops = { |
| .fadump_init_mem_struct = rtas_fadump_init_mem_struct, |
| .fadump_get_bootmem_min = rtas_fadump_get_bootmem_min, |
| .fadump_register = rtas_fadump_register, |
| .fadump_unregister = rtas_fadump_unregister, |
| .fadump_invalidate = rtas_fadump_invalidate, |
| .fadump_process = rtas_fadump_process, |
| .fadump_region_show = rtas_fadump_region_show, |
| .fadump_trigger = rtas_fadump_trigger, |
| }; |
| |
| void __init rtas_fadump_dt_scan(struct fw_dump *fadump_conf, u64 node) |
| { |
| int i, size, num_sections; |
| const __be32 *sections; |
| const __be32 *token; |
| |
| /* |
| * Check if Firmware Assisted dump is supported. if yes, check |
| * if dump has been initiated on last reboot. |
| */ |
| token = of_get_flat_dt_prop(node, "ibm,configure-kernel-dump", NULL); |
| if (!token) |
| return; |
| |
| fadump_conf->ibm_configure_kernel_dump = be32_to_cpu(*token); |
| fadump_conf->ops = &rtas_fadump_ops; |
| fadump_conf->fadump_supported = 1; |
| |
| /* Firmware supports 64-bit value for size, align it to pagesize. */ |
| fadump_conf->max_copy_size = ALIGN_DOWN(U64_MAX, PAGE_SIZE); |
| |
| /* |
| * The 'ibm,kernel-dump' rtas node is present only if there is |
| * dump data waiting for us. |
| */ |
| fdm_active = of_get_flat_dt_prop(node, "ibm,kernel-dump", NULL); |
| if (fdm_active) { |
| pr_info("Firmware-assisted dump is active.\n"); |
| fadump_conf->dump_active = 1; |
| rtas_fadump_get_config(fadump_conf, (void *)__pa(fdm_active)); |
| } |
| |
| /* Get the sizes required to store dump data for the firmware provided |
| * dump sections. |
| * For each dump section type supported, a 32bit cell which defines |
| * the ID of a supported section followed by two 32 bit cells which |
| * gives the size of the section in bytes. |
| */ |
| sections = of_get_flat_dt_prop(node, "ibm,configure-kernel-dump-sizes", |
| &size); |
| |
| if (!sections) |
| return; |
| |
| num_sections = size / (3 * sizeof(u32)); |
| |
| for (i = 0; i < num_sections; i++, sections += 3) { |
| u32 type = (u32)of_read_number(sections, 1); |
| |
| switch (type) { |
| case RTAS_FADUMP_CPU_STATE_DATA: |
| fadump_conf->cpu_state_data_size = |
| of_read_ulong(§ions[1], 2); |
| break; |
| case RTAS_FADUMP_HPTE_REGION: |
| fadump_conf->hpte_region_size = |
| of_read_ulong(§ions[1], 2); |
| break; |
| } |
| } |
| } |