141df5928SHari Bathini // SPDX-License-Identifier: GPL-2.0-or-later 241df5928SHari Bathini /* 341df5928SHari Bathini * Firmware-Assisted Dump support on POWER platform (OPAL). 441df5928SHari Bathini * 541df5928SHari Bathini * Copyright 2019, Hari Bathini, IBM Corporation. 641df5928SHari Bathini */ 741df5928SHari Bathini 841df5928SHari Bathini #define pr_fmt(fmt) "opal fadump: " fmt 941df5928SHari Bathini 1041df5928SHari Bathini #include <linux/string.h> 1141df5928SHari Bathini #include <linux/seq_file.h> 127b1b3b48SHari Bathini #include <linux/of.h> 1341df5928SHari Bathini #include <linux/of_fdt.h> 1441df5928SHari Bathini #include <linux/libfdt.h> 15742a265aSHari Bathini #include <linux/mm.h> 162a1b06ddSHari Bathini #include <linux/crash_dump.h> 1741df5928SHari Bathini 18742a265aSHari Bathini #include <asm/page.h> 1941df5928SHari Bathini #include <asm/opal.h> 2041df5928SHari Bathini #include <asm/fadump-internal.h> 2141df5928SHari Bathini 22742a265aSHari Bathini #include "opal-fadump.h" 23742a265aSHari Bathini 24bec53196SHari Bathini 25bec53196SHari Bathini #ifdef CONFIG_PRESERVE_FA_DUMP 26bec53196SHari Bathini /* 27bec53196SHari Bathini * When dump is active but PRESERVE_FA_DUMP is enabled on the kernel, 28bec53196SHari Bathini * ensure crash data is preserved in hope that the subsequent memory 29bec53196SHari Bathini * preserving kernel boot is going to process this crash data. 30bec53196SHari Bathini */ 31bec53196SHari Bathini void __init opal_fadump_dt_scan(struct fw_dump *fadump_conf, u64 node) 32bec53196SHari Bathini { 33bec53196SHari Bathini const struct opal_fadump_mem_struct *opal_fdm_active; 34bec53196SHari Bathini const __be32 *prop; 35bec53196SHari Bathini unsigned long dn; 36bec53196SHari Bathini u64 addr = 0; 37bec53196SHari Bathini s64 ret; 38bec53196SHari Bathini 39bec53196SHari Bathini dn = of_get_flat_dt_subnode_by_name(node, "dump"); 40bec53196SHari Bathini if (dn == -FDT_ERR_NOTFOUND) 41bec53196SHari Bathini return; 42bec53196SHari Bathini 43bec53196SHari Bathini /* 44bec53196SHari Bathini * Check if dump has been initiated on last reboot. 45bec53196SHari Bathini */ 46bec53196SHari Bathini prop = of_get_flat_dt_prop(dn, "mpipl-boot", NULL); 47bec53196SHari Bathini if (!prop) 48bec53196SHari Bathini return; 49bec53196SHari Bathini 50bec53196SHari Bathini ret = opal_mpipl_query_tag(OPAL_MPIPL_TAG_KERNEL, &addr); 51bec53196SHari Bathini if ((ret != OPAL_SUCCESS) || !addr) { 52bec53196SHari Bathini pr_debug("Could not get Kernel metadata (%lld)\n", ret); 53bec53196SHari Bathini return; 54bec53196SHari Bathini } 55bec53196SHari Bathini 56bec53196SHari Bathini /* 57bec53196SHari Bathini * Preserve memory only if kernel memory regions are registered 58bec53196SHari Bathini * with f/w for MPIPL. 59bec53196SHari Bathini */ 60bec53196SHari Bathini addr = be64_to_cpu(addr); 61bec53196SHari Bathini pr_debug("Kernel metadata addr: %llx\n", addr); 62bec53196SHari Bathini opal_fdm_active = (void *)addr; 63bec53196SHari Bathini if (opal_fdm_active->registered_regions == 0) 64bec53196SHari Bathini return; 65bec53196SHari Bathini 66bec53196SHari Bathini ret = opal_mpipl_query_tag(OPAL_MPIPL_TAG_BOOT_MEM, &addr); 67bec53196SHari Bathini if ((ret != OPAL_SUCCESS) || !addr) { 68bec53196SHari Bathini pr_err("Failed to get boot memory tag (%lld)\n", ret); 69bec53196SHari Bathini return; 70bec53196SHari Bathini } 71bec53196SHari Bathini 72bec53196SHari Bathini /* 73bec53196SHari Bathini * Memory below this address can be used for booting a 74bec53196SHari Bathini * capture kernel or petitboot kernel. Preserve everything 75bec53196SHari Bathini * above this address for processing crashdump. 76bec53196SHari Bathini */ 77bec53196SHari Bathini fadump_conf->boot_mem_top = be64_to_cpu(addr); 78bec53196SHari Bathini pr_debug("Preserve everything above %llx\n", fadump_conf->boot_mem_top); 79bec53196SHari Bathini 80bec53196SHari Bathini pr_info("Firmware-assisted dump is active.\n"); 81bec53196SHari Bathini fadump_conf->dump_active = 1; 82bec53196SHari Bathini } 83bec53196SHari Bathini 84bec53196SHari Bathini #else /* CONFIG_PRESERVE_FA_DUMP */ 852a1b06ddSHari Bathini static const struct opal_fadump_mem_struct *opal_fdm_active; 865000a17aSHari Bathini static const struct opal_mpipl_fadump *opal_cpu_metadata; 87742a265aSHari Bathini static struct opal_fadump_mem_struct *opal_fdm; 88742a265aSHari Bathini 896f713d18SHari Bathini #ifdef CONFIG_OPAL_CORE 906f713d18SHari Bathini extern bool kernel_initiated; 916f713d18SHari Bathini #endif 926f713d18SHari Bathini 93a20a8fa4SHari Bathini static int opal_fadump_unregister(struct fw_dump *fadump_conf); 94a20a8fa4SHari Bathini 95a20a8fa4SHari Bathini static void opal_fadump_update_config(struct fw_dump *fadump_conf, 96a20a8fa4SHari Bathini const struct opal_fadump_mem_struct *fdm) 97a20a8fa4SHari Bathini { 9851bba8edSHari Bathini pr_debug("Boot memory regions count: %d\n", fdm->region_cnt); 9951bba8edSHari Bathini 100a20a8fa4SHari Bathini /* 101a20a8fa4SHari Bathini * The destination address of the first boot memory region is the 102a20a8fa4SHari Bathini * destination address of boot memory regions. 103a20a8fa4SHari Bathini */ 104a20a8fa4SHari Bathini fadump_conf->boot_mem_dest_addr = fdm->rgn[0].dest; 105a20a8fa4SHari Bathini pr_debug("Destination address of boot memory regions: %#016llx\n", 106a20a8fa4SHari Bathini fadump_conf->boot_mem_dest_addr); 107a20a8fa4SHari Bathini 108a20a8fa4SHari Bathini fadump_conf->fadumphdr_addr = fdm->fadumphdr_addr; 109a20a8fa4SHari Bathini } 110a20a8fa4SHari Bathini 1112a1b06ddSHari Bathini /* 1122a1b06ddSHari Bathini * This function is called in the capture kernel to get configuration details 1132a1b06ddSHari Bathini * from metadata setup by the first kernel. 1142a1b06ddSHari Bathini */ 1152a1b06ddSHari Bathini static void opal_fadump_get_config(struct fw_dump *fadump_conf, 1162a1b06ddSHari Bathini const struct opal_fadump_mem_struct *fdm) 1172a1b06ddSHari Bathini { 1187dee93a9SHari Bathini unsigned long base, size, last_end, hole_size; 1192a1b06ddSHari Bathini int i; 1202a1b06ddSHari Bathini 1212a1b06ddSHari Bathini if (!fadump_conf->dump_active) 1222a1b06ddSHari Bathini return; 1232a1b06ddSHari Bathini 1247dee93a9SHari Bathini last_end = 0; 1257dee93a9SHari Bathini hole_size = 0; 1262a1b06ddSHari Bathini fadump_conf->boot_memory_size = 0; 1272a1b06ddSHari Bathini 1282a1b06ddSHari Bathini pr_debug("Boot memory regions:\n"); 1292a1b06ddSHari Bathini for (i = 0; i < fdm->region_cnt; i++) { 1307dee93a9SHari Bathini base = fdm->rgn[i].src; 1317dee93a9SHari Bathini size = fdm->rgn[i].size; 1327dee93a9SHari Bathini pr_debug("\t[%03d] base: 0x%lx, size: 0x%lx\n", i, base, size); 1332a1b06ddSHari Bathini 1347dee93a9SHari Bathini fadump_conf->boot_mem_addr[i] = base; 1357dee93a9SHari Bathini fadump_conf->boot_mem_sz[i] = size; 1367dee93a9SHari Bathini fadump_conf->boot_memory_size += size; 1377dee93a9SHari Bathini hole_size += (base - last_end); 1387dee93a9SHari Bathini 1397dee93a9SHari Bathini last_end = base + size; 1402a1b06ddSHari Bathini } 1412a1b06ddSHari Bathini 1422a1b06ddSHari Bathini /* 1432a1b06ddSHari Bathini * Start address of reserve dump area (permanent reservation) for 1442a1b06ddSHari Bathini * re-registering FADump after dump capture. 1452a1b06ddSHari Bathini */ 1462a1b06ddSHari Bathini fadump_conf->reserve_dump_area_start = fdm->rgn[0].dest; 1472a1b06ddSHari Bathini 1486071e8f9SHari Bathini /* 1496071e8f9SHari Bathini * Rarely, but it can so happen that system crashes before all 1506071e8f9SHari Bathini * boot memory regions are registered for MPIPL. In such 1516071e8f9SHari Bathini * cases, warn that the vmcore may not be accurate and proceed 1526071e8f9SHari Bathini * anyway as that is the best bet considering free pages, cache 1536071e8f9SHari Bathini * pages, user pages, etc are usually filtered out. 1546071e8f9SHari Bathini * 1556071e8f9SHari Bathini * Hope the memory that could not be preserved only has pages 1566071e8f9SHari Bathini * that are usually filtered out while saving the vmcore. 1576071e8f9SHari Bathini */ 1586071e8f9SHari Bathini if (fdm->region_cnt > fdm->registered_regions) { 1596071e8f9SHari Bathini pr_warn("Not all memory regions were saved!!!\n"); 1606071e8f9SHari Bathini pr_warn(" Unsaved memory regions:\n"); 1616071e8f9SHari Bathini i = fdm->registered_regions; 1626071e8f9SHari Bathini while (i < fdm->region_cnt) { 1636071e8f9SHari Bathini pr_warn("\t[%03d] base: 0x%llx, size: 0x%llx\n", 1646071e8f9SHari Bathini i, fdm->rgn[i].src, fdm->rgn[i].size); 1656071e8f9SHari Bathini i++; 1666071e8f9SHari Bathini } 1676071e8f9SHari Bathini 1686071e8f9SHari Bathini pr_warn("If the unsaved regions only contain pages that are filtered out (eg. free/user pages), the vmcore should still be usable.\n"); 1696071e8f9SHari Bathini pr_warn("WARNING: If the unsaved regions contain kernel pages, the vmcore will be corrupted.\n"); 1706071e8f9SHari Bathini } 1716071e8f9SHari Bathini 1727dee93a9SHari Bathini fadump_conf->boot_mem_top = (fadump_conf->boot_memory_size + hole_size); 1737dee93a9SHari Bathini fadump_conf->boot_mem_regs_cnt = fdm->region_cnt; 1742a1b06ddSHari Bathini opal_fadump_update_config(fadump_conf, fdm); 1752a1b06ddSHari Bathini } 1762a1b06ddSHari Bathini 177742a265aSHari Bathini /* Initialize kernel metadata */ 178742a265aSHari Bathini static void opal_fadump_init_metadata(struct opal_fadump_mem_struct *fdm) 179742a265aSHari Bathini { 180742a265aSHari Bathini fdm->version = OPAL_FADUMP_VERSION; 181742a265aSHari Bathini fdm->region_cnt = 0; 182742a265aSHari Bathini fdm->registered_regions = 0; 183742a265aSHari Bathini fdm->fadumphdr_addr = 0; 184742a265aSHari Bathini } 185742a265aSHari Bathini 18641df5928SHari Bathini static u64 opal_fadump_init_mem_struct(struct fw_dump *fadump_conf) 18741df5928SHari Bathini { 1887dee93a9SHari Bathini u64 addr = fadump_conf->reserve_dump_area_start; 1897dee93a9SHari Bathini int i; 190742a265aSHari Bathini 191742a265aSHari Bathini opal_fdm = __va(fadump_conf->kernel_metadata); 192742a265aSHari Bathini opal_fadump_init_metadata(opal_fdm); 193742a265aSHari Bathini 19451bba8edSHari Bathini /* Boot memory regions */ 1957dee93a9SHari Bathini for (i = 0; i < fadump_conf->boot_mem_regs_cnt; i++) { 1967dee93a9SHari Bathini opal_fdm->rgn[i].src = fadump_conf->boot_mem_addr[i]; 1977dee93a9SHari Bathini opal_fdm->rgn[i].dest = addr; 1987dee93a9SHari Bathini opal_fdm->rgn[i].size = fadump_conf->boot_mem_sz[i]; 19951bba8edSHari Bathini 20051bba8edSHari Bathini opal_fdm->region_cnt++; 2017dee93a9SHari Bathini addr += fadump_conf->boot_mem_sz[i]; 20251bba8edSHari Bathini } 203742a265aSHari Bathini 204742a265aSHari Bathini /* 205742a265aSHari Bathini * Kernel metadata is passed to f/w and retrieved in capture kerenl. 206742a265aSHari Bathini * So, use it to save fadump header address instead of calculating it. 207742a265aSHari Bathini */ 208742a265aSHari Bathini opal_fdm->fadumphdr_addr = (opal_fdm->rgn[0].dest + 209742a265aSHari Bathini fadump_conf->boot_memory_size); 210742a265aSHari Bathini 211a20a8fa4SHari Bathini opal_fadump_update_config(fadump_conf, opal_fdm); 212a20a8fa4SHari Bathini 2137dee93a9SHari Bathini return addr; 214742a265aSHari Bathini } 215742a265aSHari Bathini 216742a265aSHari Bathini static u64 opal_fadump_get_metadata_size(void) 217742a265aSHari Bathini { 218742a265aSHari Bathini return PAGE_ALIGN(sizeof(struct opal_fadump_mem_struct)); 219742a265aSHari Bathini } 220742a265aSHari Bathini 221742a265aSHari Bathini static int opal_fadump_setup_metadata(struct fw_dump *fadump_conf) 222742a265aSHari Bathini { 223742a265aSHari Bathini int err = 0; 224742a265aSHari Bathini s64 ret; 225742a265aSHari Bathini 226742a265aSHari Bathini /* 227742a265aSHari Bathini * Use the last page(s) in FADump memory reservation for 228742a265aSHari Bathini * kernel metadata. 229742a265aSHari Bathini */ 230742a265aSHari Bathini fadump_conf->kernel_metadata = (fadump_conf->reserve_dump_area_start + 231742a265aSHari Bathini fadump_conf->reserve_dump_area_size - 232742a265aSHari Bathini opal_fadump_get_metadata_size()); 233742a265aSHari Bathini pr_info("Kernel metadata addr: %llx\n", fadump_conf->kernel_metadata); 234742a265aSHari Bathini 235742a265aSHari Bathini /* Initialize kernel metadata before registering the address with f/w */ 236742a265aSHari Bathini opal_fdm = __va(fadump_conf->kernel_metadata); 237742a265aSHari Bathini opal_fadump_init_metadata(opal_fdm); 238742a265aSHari Bathini 239742a265aSHari Bathini /* 240742a265aSHari Bathini * Register metadata address with f/w. Can be retrieved in 241742a265aSHari Bathini * the capture kernel. 242742a265aSHari Bathini */ 243742a265aSHari Bathini ret = opal_mpipl_register_tag(OPAL_MPIPL_TAG_KERNEL, 244742a265aSHari Bathini fadump_conf->kernel_metadata); 245742a265aSHari Bathini if (ret != OPAL_SUCCESS) { 246742a265aSHari Bathini pr_err("Failed to set kernel metadata tag!\n"); 247742a265aSHari Bathini err = -EPERM; 248742a265aSHari Bathini } 249742a265aSHari Bathini 250bec53196SHari Bathini /* 251bec53196SHari Bathini * Register boot memory top address with f/w. Should be retrieved 252bec53196SHari Bathini * by a kernel that intends to preserve crash'ed kernel's memory. 253bec53196SHari Bathini */ 254bec53196SHari Bathini ret = opal_mpipl_register_tag(OPAL_MPIPL_TAG_BOOT_MEM, 2557dee93a9SHari Bathini fadump_conf->boot_mem_top); 256bec53196SHari Bathini if (ret != OPAL_SUCCESS) { 257bec53196SHari Bathini pr_err("Failed to set boot memory tag!\n"); 258bec53196SHari Bathini err = -EPERM; 259bec53196SHari Bathini } 260bec53196SHari Bathini 261742a265aSHari Bathini return err; 26241df5928SHari Bathini } 26341df5928SHari Bathini 2647b1b3b48SHari Bathini static u64 opal_fadump_get_bootmem_min(void) 2657b1b3b48SHari Bathini { 2667b1b3b48SHari Bathini return OPAL_FADUMP_MIN_BOOT_MEM; 2677b1b3b48SHari Bathini } 2687b1b3b48SHari Bathini 26941df5928SHari Bathini static int opal_fadump_register(struct fw_dump *fadump_conf) 27041df5928SHari Bathini { 271a20a8fa4SHari Bathini s64 rc = OPAL_PARAMETER; 272a20a8fa4SHari Bathini int i, err = -EIO; 273a20a8fa4SHari Bathini 274a20a8fa4SHari Bathini for (i = 0; i < opal_fdm->region_cnt; i++) { 275a20a8fa4SHari Bathini rc = opal_mpipl_update(OPAL_MPIPL_ADD_RANGE, 276a20a8fa4SHari Bathini opal_fdm->rgn[i].src, 277a20a8fa4SHari Bathini opal_fdm->rgn[i].dest, 278a20a8fa4SHari Bathini opal_fdm->rgn[i].size); 279a20a8fa4SHari Bathini if (rc != OPAL_SUCCESS) 280a20a8fa4SHari Bathini break; 281a20a8fa4SHari Bathini 282a20a8fa4SHari Bathini opal_fdm->registered_regions++; 283a20a8fa4SHari Bathini } 284a20a8fa4SHari Bathini 285a20a8fa4SHari Bathini switch (rc) { 286a20a8fa4SHari Bathini case OPAL_SUCCESS: 287a20a8fa4SHari Bathini pr_info("Registration is successful!\n"); 288a20a8fa4SHari Bathini fadump_conf->dump_registered = 1; 289a20a8fa4SHari Bathini err = 0; 290a20a8fa4SHari Bathini break; 291a20a8fa4SHari Bathini case OPAL_RESOURCE: 292a20a8fa4SHari Bathini /* If MAX regions limit in f/w is hit, warn and proceed. */ 293a20a8fa4SHari Bathini pr_warn("%d regions could not be registered for MPIPL as MAX limit is reached!\n", 294a20a8fa4SHari Bathini (opal_fdm->region_cnt - opal_fdm->registered_regions)); 295a20a8fa4SHari Bathini fadump_conf->dump_registered = 1; 296a20a8fa4SHari Bathini err = 0; 297a20a8fa4SHari Bathini break; 298a20a8fa4SHari Bathini case OPAL_PARAMETER: 299a20a8fa4SHari Bathini pr_err("Failed to register. Parameter Error(%lld).\n", rc); 300a20a8fa4SHari Bathini break; 301a20a8fa4SHari Bathini case OPAL_HARDWARE: 302a20a8fa4SHari Bathini pr_err("Support not available.\n"); 303a20a8fa4SHari Bathini fadump_conf->fadump_supported = 0; 304a20a8fa4SHari Bathini fadump_conf->fadump_enabled = 0; 305a20a8fa4SHari Bathini break; 306a20a8fa4SHari Bathini default: 307a20a8fa4SHari Bathini pr_err("Failed to register. Unknown Error(%lld).\n", rc); 308a20a8fa4SHari Bathini break; 309a20a8fa4SHari Bathini } 310a20a8fa4SHari Bathini 311a20a8fa4SHari Bathini /* 312a20a8fa4SHari Bathini * If some regions were registered before OPAL_MPIPL_ADD_RANGE 313a20a8fa4SHari Bathini * OPAL call failed, unregister all regions. 314a20a8fa4SHari Bathini */ 315a20a8fa4SHari Bathini if ((err < 0) && (opal_fdm->registered_regions > 0)) 316a20a8fa4SHari Bathini opal_fadump_unregister(fadump_conf); 317a20a8fa4SHari Bathini 318a20a8fa4SHari Bathini return err; 31941df5928SHari Bathini } 32041df5928SHari Bathini 32141df5928SHari Bathini static int opal_fadump_unregister(struct fw_dump *fadump_conf) 32241df5928SHari Bathini { 323a20a8fa4SHari Bathini s64 rc; 324a20a8fa4SHari Bathini 325a20a8fa4SHari Bathini rc = opal_mpipl_update(OPAL_MPIPL_REMOVE_ALL, 0, 0, 0); 326a20a8fa4SHari Bathini if (rc) { 327a20a8fa4SHari Bathini pr_err("Failed to un-register - unexpected Error(%lld).\n", rc); 32841df5928SHari Bathini return -EIO; 32941df5928SHari Bathini } 33041df5928SHari Bathini 331a20a8fa4SHari Bathini opal_fdm->registered_regions = 0; 332a20a8fa4SHari Bathini fadump_conf->dump_registered = 0; 333a20a8fa4SHari Bathini return 0; 334a20a8fa4SHari Bathini } 335a20a8fa4SHari Bathini 33641df5928SHari Bathini static int opal_fadump_invalidate(struct fw_dump *fadump_conf) 33741df5928SHari Bathini { 338a4e2e2caSHari Bathini s64 rc; 339a4e2e2caSHari Bathini 340a4e2e2caSHari Bathini rc = opal_mpipl_update(OPAL_MPIPL_FREE_PRESERVED_MEMORY, 0, 0, 0); 341a4e2e2caSHari Bathini if (rc) { 342a4e2e2caSHari Bathini pr_err("Failed to invalidate - unexpected Error(%lld).\n", rc); 34341df5928SHari Bathini return -EIO; 34441df5928SHari Bathini } 34541df5928SHari Bathini 346a4e2e2caSHari Bathini fadump_conf->dump_active = 0; 347a4e2e2caSHari Bathini opal_fdm_active = NULL; 348a4e2e2caSHari Bathini return 0; 349a4e2e2caSHari Bathini } 350a4e2e2caSHari Bathini 3512790d01dSHari Bathini static void opal_fadump_cleanup(struct fw_dump *fadump_conf) 3522790d01dSHari Bathini { 3532790d01dSHari Bathini s64 ret; 3542790d01dSHari Bathini 3552790d01dSHari Bathini ret = opal_mpipl_register_tag(OPAL_MPIPL_TAG_KERNEL, 0); 3562790d01dSHari Bathini if (ret != OPAL_SUCCESS) 3572790d01dSHari Bathini pr_warn("Could not reset (%llu) kernel metadata tag!\n", ret); 3582790d01dSHari Bathini } 3592790d01dSHari Bathini 3605000a17aSHari Bathini /* 3615000a17aSHari Bathini * Verify if CPU state data is available. If available, do a bit of sanity 3625000a17aSHari Bathini * checking before processing this data. 3635000a17aSHari Bathini */ 3645000a17aSHari Bathini static bool __init is_opal_fadump_cpu_data_valid(struct fw_dump *fadump_conf) 3655000a17aSHari Bathini { 3665000a17aSHari Bathini if (!opal_cpu_metadata) 3675000a17aSHari Bathini return false; 3685000a17aSHari Bathini 3695000a17aSHari Bathini fadump_conf->cpu_state_data_version = 3705000a17aSHari Bathini be32_to_cpu(opal_cpu_metadata->cpu_data_version); 3715000a17aSHari Bathini fadump_conf->cpu_state_entry_size = 3725000a17aSHari Bathini be32_to_cpu(opal_cpu_metadata->cpu_data_size); 3735000a17aSHari Bathini fadump_conf->cpu_state_dest_vaddr = 3745000a17aSHari Bathini (u64)__va(be64_to_cpu(opal_cpu_metadata->region[0].dest)); 3755000a17aSHari Bathini fadump_conf->cpu_state_data_size = 3765000a17aSHari Bathini be64_to_cpu(opal_cpu_metadata->region[0].size); 3775000a17aSHari Bathini 3785000a17aSHari Bathini if (fadump_conf->cpu_state_data_version != HDAT_FADUMP_CPU_DATA_VER) { 3795000a17aSHari Bathini pr_warn("Supported CPU state data version: %u, found: %d!\n", 3805000a17aSHari Bathini HDAT_FADUMP_CPU_DATA_VER, 3815000a17aSHari Bathini fadump_conf->cpu_state_data_version); 3825000a17aSHari Bathini pr_warn("WARNING: F/W using newer CPU state data format!!\n"); 3835000a17aSHari Bathini } 3845000a17aSHari Bathini 3855000a17aSHari Bathini if ((fadump_conf->cpu_state_dest_vaddr == 0) || 3865000a17aSHari Bathini (fadump_conf->cpu_state_entry_size == 0) || 3875000a17aSHari Bathini (fadump_conf->cpu_state_entry_size > 3885000a17aSHari Bathini fadump_conf->cpu_state_data_size)) { 3895000a17aSHari Bathini pr_err("CPU state data is invalid. Ignoring!\n"); 3905000a17aSHari Bathini return false; 3915000a17aSHari Bathini } 3925000a17aSHari Bathini 3935000a17aSHari Bathini return true; 3945000a17aSHari Bathini } 3955000a17aSHari Bathini 3962a1b06ddSHari Bathini /* 3972a1b06ddSHari Bathini * Convert CPU state data saved at the time of crash into ELF notes. 3982a1b06ddSHari Bathini * 3995000a17aSHari Bathini * While the crashing CPU's register data is saved by the kernel, CPU state 4005000a17aSHari Bathini * data for all CPUs is saved by f/w. In CPU state data provided by f/w, 4015000a17aSHari Bathini * each register entry is of 16 bytes, a numerical identifier along with 4025000a17aSHari Bathini * a GPR/SPR flag in the first 8 bytes and the register value in the next 4035000a17aSHari Bathini * 8 bytes. For more details refer to F/W documentation. If this data is 4045000a17aSHari Bathini * missing or in unsupported format, append crashing CPU's register data 4055000a17aSHari Bathini * saved by the kernel in the PT_NOTE, to have something to work with in 4065000a17aSHari Bathini * the vmcore file. 4072a1b06ddSHari Bathini */ 4082a1b06ddSHari Bathini static int __init 4092a1b06ddSHari Bathini opal_fadump_build_cpu_notes(struct fw_dump *fadump_conf, 4102a1b06ddSHari Bathini struct fadump_crash_info_header *fdh) 4112a1b06ddSHari Bathini { 4125000a17aSHari Bathini u32 thread_pir, size_per_thread, regs_offset, regs_cnt, reg_esize; 4135000a17aSHari Bathini struct hdat_fadump_thread_hdr *thdr; 4145000a17aSHari Bathini bool is_cpu_data_valid = false; 4152a1b06ddSHari Bathini u32 num_cpus = 1, *note_buf; 4165000a17aSHari Bathini struct pt_regs regs; 4175000a17aSHari Bathini char *bufp; 4185000a17aSHari Bathini int rc, i; 4192a1b06ddSHari Bathini 4205000a17aSHari Bathini if (is_opal_fadump_cpu_data_valid(fadump_conf)) { 4215000a17aSHari Bathini size_per_thread = fadump_conf->cpu_state_entry_size; 4225000a17aSHari Bathini num_cpus = (fadump_conf->cpu_state_data_size / size_per_thread); 4235000a17aSHari Bathini bufp = __va(fadump_conf->cpu_state_dest_vaddr); 4245000a17aSHari Bathini is_cpu_data_valid = true; 4255000a17aSHari Bathini } 4262a1b06ddSHari Bathini 4272a1b06ddSHari Bathini rc = fadump_setup_cpu_notes_buf(num_cpus); 4282a1b06ddSHari Bathini if (rc != 0) 4292a1b06ddSHari Bathini return rc; 4302a1b06ddSHari Bathini 4312a1b06ddSHari Bathini note_buf = (u32 *)fadump_conf->cpu_notes_buf_vaddr; 4325000a17aSHari Bathini if (!is_cpu_data_valid) 4335000a17aSHari Bathini goto out; 4345000a17aSHari Bathini 4355000a17aSHari Bathini /* 4365000a17aSHari Bathini * Offset for register entries, entry size and registers count is 4375000a17aSHari Bathini * duplicated in every thread header in keeping with HDAT format. 4385000a17aSHari Bathini * Use these values from the first thread header. 4395000a17aSHari Bathini */ 4405000a17aSHari Bathini thdr = (struct hdat_fadump_thread_hdr *)bufp; 4415000a17aSHari Bathini regs_offset = (offsetof(struct hdat_fadump_thread_hdr, offset) + 4425000a17aSHari Bathini be32_to_cpu(thdr->offset)); 4435000a17aSHari Bathini reg_esize = be32_to_cpu(thdr->esize); 4445000a17aSHari Bathini regs_cnt = be32_to_cpu(thdr->ecnt); 4455000a17aSHari Bathini 4465000a17aSHari Bathini pr_debug("--------CPU State Data------------\n"); 4475000a17aSHari Bathini pr_debug("NumCpus : %u\n", num_cpus); 4485000a17aSHari Bathini pr_debug("\tOffset: %u, Entry size: %u, Cnt: %u\n", 4495000a17aSHari Bathini regs_offset, reg_esize, regs_cnt); 4505000a17aSHari Bathini 4515000a17aSHari Bathini for (i = 0; i < num_cpus; i++, bufp += size_per_thread) { 4525000a17aSHari Bathini thdr = (struct hdat_fadump_thread_hdr *)bufp; 4535000a17aSHari Bathini 4545000a17aSHari Bathini thread_pir = be32_to_cpu(thdr->pir); 4555000a17aSHari Bathini pr_debug("[%04d] PIR: 0x%x, core state: 0x%02x\n", 4565000a17aSHari Bathini i, thread_pir, thdr->core_state); 4575000a17aSHari Bathini 4585000a17aSHari Bathini /* 4595000a17aSHari Bathini * If this is kernel initiated crash, crashing_cpu would be set 4605000a17aSHari Bathini * appropriately and register data of the crashing CPU saved by 4615000a17aSHari Bathini * crashing kernel. Add this saved register data of crashing CPU 4625000a17aSHari Bathini * to elf notes and populate the pt_regs for the remaining CPUs 4635000a17aSHari Bathini * from register state data provided by firmware. 4645000a17aSHari Bathini */ 4655000a17aSHari Bathini if (fdh->crashing_cpu == thread_pir) { 4665000a17aSHari Bathini note_buf = fadump_regs_to_elf_notes(note_buf, 4675000a17aSHari Bathini &fdh->regs); 4685000a17aSHari Bathini pr_debug("Crashing CPU PIR: 0x%x - R1 : 0x%lx, NIP : 0x%lx\n", 4695000a17aSHari Bathini fdh->crashing_cpu, fdh->regs.gpr[1], 4705000a17aSHari Bathini fdh->regs.nip); 4715000a17aSHari Bathini continue; 4725000a17aSHari Bathini } 4735000a17aSHari Bathini 4745000a17aSHari Bathini /* 4755000a17aSHari Bathini * Register state data of MAX cores is provided by firmware, 4765000a17aSHari Bathini * but some of this cores may not be active. So, while 4775000a17aSHari Bathini * processing register state data, check core state and 4785000a17aSHari Bathini * skip threads that belong to inactive cores. 4795000a17aSHari Bathini */ 4805000a17aSHari Bathini if (thdr->core_state == HDAT_FADUMP_CORE_INACTIVE) 4815000a17aSHari Bathini continue; 4825000a17aSHari Bathini 4835000a17aSHari Bathini opal_fadump_read_regs((bufp + regs_offset), regs_cnt, 4846f713d18SHari Bathini reg_esize, true, ®s); 4855000a17aSHari Bathini note_buf = fadump_regs_to_elf_notes(note_buf, ®s); 4865000a17aSHari Bathini pr_debug("CPU PIR: 0x%x - R1 : 0x%lx, NIP : 0x%lx\n", 4875000a17aSHari Bathini thread_pir, regs.gpr[1], regs.nip); 4885000a17aSHari Bathini } 4895000a17aSHari Bathini 4905000a17aSHari Bathini out: 4915000a17aSHari Bathini /* 4925000a17aSHari Bathini * CPU state data is invalid/unsupported. Try appending crashing CPU's 4935000a17aSHari Bathini * register data, if it is saved by the kernel. 4945000a17aSHari Bathini */ 4955000a17aSHari Bathini if (fadump_conf->cpu_notes_buf_vaddr == (u64)note_buf) { 4965000a17aSHari Bathini if (fdh->crashing_cpu == FADUMP_CPU_UNKNOWN) { 4975000a17aSHari Bathini fadump_free_cpu_notes_buf(); 4985000a17aSHari Bathini return -ENODEV; 4995000a17aSHari Bathini } 5005000a17aSHari Bathini 5015000a17aSHari Bathini pr_warn("WARNING: appending only crashing CPU's register data\n"); 5022a1b06ddSHari Bathini note_buf = fadump_regs_to_elf_notes(note_buf, &(fdh->regs)); 5035000a17aSHari Bathini } 5045000a17aSHari Bathini 5052a1b06ddSHari Bathini final_note(note_buf); 5062a1b06ddSHari Bathini 5072a1b06ddSHari Bathini pr_debug("Updating elfcore header (%llx) with cpu notes\n", 5082a1b06ddSHari Bathini fdh->elfcorehdr_addr); 5092a1b06ddSHari Bathini fadump_update_elfcore_header(__va(fdh->elfcorehdr_addr)); 5102a1b06ddSHari Bathini return 0; 5112a1b06ddSHari Bathini } 5122a1b06ddSHari Bathini 51341df5928SHari Bathini static int __init opal_fadump_process(struct fw_dump *fadump_conf) 51441df5928SHari Bathini { 5152a1b06ddSHari Bathini struct fadump_crash_info_header *fdh; 5162a1b06ddSHari Bathini int rc = -EINVAL; 5172a1b06ddSHari Bathini 5182a1b06ddSHari Bathini if (!opal_fdm_active || !fadump_conf->fadumphdr_addr) 5192a1b06ddSHari Bathini return rc; 5202a1b06ddSHari Bathini 5212a1b06ddSHari Bathini /* Validate the fadump crash info header */ 5222a1b06ddSHari Bathini fdh = __va(fadump_conf->fadumphdr_addr); 5232a1b06ddSHari Bathini if (fdh->magic_number != FADUMP_CRASH_INFO_MAGIC) { 5242a1b06ddSHari Bathini pr_err("Crash info header is not valid.\n"); 5252a1b06ddSHari Bathini return rc; 5262a1b06ddSHari Bathini } 5272a1b06ddSHari Bathini 5286f713d18SHari Bathini #ifdef CONFIG_OPAL_CORE 5296f713d18SHari Bathini /* 5306f713d18SHari Bathini * If this is a kernel initiated crash, crashing_cpu would be set 5316f713d18SHari Bathini * appropriately and register data of the crashing CPU saved by 5326f713d18SHari Bathini * crashing kernel. Add this saved register data of crashing CPU 5336f713d18SHari Bathini * to elf notes and populate the pt_regs for the remaining CPUs 5346f713d18SHari Bathini * from register state data provided by firmware. 5356f713d18SHari Bathini */ 5366f713d18SHari Bathini if (fdh->crashing_cpu != FADUMP_CPU_UNKNOWN) 5376f713d18SHari Bathini kernel_initiated = true; 5386f713d18SHari Bathini #endif 5396f713d18SHari Bathini 5402a1b06ddSHari Bathini rc = opal_fadump_build_cpu_notes(fadump_conf, fdh); 5412a1b06ddSHari Bathini if (rc) 5422a1b06ddSHari Bathini return rc; 5432a1b06ddSHari Bathini 5442a1b06ddSHari Bathini /* 5452a1b06ddSHari Bathini * We are done validating dump info and elfcore header is now ready 5462a1b06ddSHari Bathini * to be exported. set elfcorehdr_addr so that vmcore module will 5472a1b06ddSHari Bathini * export the elfcore header through '/proc/vmcore'. 5482a1b06ddSHari Bathini */ 5492a1b06ddSHari Bathini elfcorehdr_addr = fdh->elfcorehdr_addr; 5502a1b06ddSHari Bathini 5512a1b06ddSHari Bathini return rc; 55241df5928SHari Bathini } 55341df5928SHari Bathini 55441df5928SHari Bathini static void opal_fadump_region_show(struct fw_dump *fadump_conf, 55541df5928SHari Bathini struct seq_file *m) 55641df5928SHari Bathini { 5572a1b06ddSHari Bathini const struct opal_fadump_mem_struct *fdm_ptr; 558742a265aSHari Bathini u64 dumped_bytes = 0; 559742a265aSHari Bathini int i; 560742a265aSHari Bathini 5612a1b06ddSHari Bathini if (fadump_conf->dump_active) 5622a1b06ddSHari Bathini fdm_ptr = opal_fdm_active; 5632a1b06ddSHari Bathini else 5642a1b06ddSHari Bathini fdm_ptr = opal_fdm; 5652a1b06ddSHari Bathini 566742a265aSHari Bathini for (i = 0; i < fdm_ptr->region_cnt; i++) { 5672a1b06ddSHari Bathini /* 5682a1b06ddSHari Bathini * Only regions that are registered for MPIPL 5692a1b06ddSHari Bathini * would have dump data. 5702a1b06ddSHari Bathini */ 5712a1b06ddSHari Bathini if ((fadump_conf->dump_active) && 5722a1b06ddSHari Bathini (i < fdm_ptr->registered_regions)) 5732a1b06ddSHari Bathini dumped_bytes = fdm_ptr->rgn[i].size; 5742a1b06ddSHari Bathini 575742a265aSHari Bathini seq_printf(m, "DUMP: Src: %#016llx, Dest: %#016llx, ", 576742a265aSHari Bathini fdm_ptr->rgn[i].src, fdm_ptr->rgn[i].dest); 577742a265aSHari Bathini seq_printf(m, "Size: %#llx, Dumped: %#llx bytes\n", 578742a265aSHari Bathini fdm_ptr->rgn[i].size, dumped_bytes); 579742a265aSHari Bathini } 5802a1b06ddSHari Bathini 5812a1b06ddSHari Bathini /* Dump is active. Show reserved area start address. */ 5822a1b06ddSHari Bathini if (fadump_conf->dump_active) { 5832a1b06ddSHari Bathini seq_printf(m, "\nMemory above %#016lx is reserved for saving crash dump\n", 5842a1b06ddSHari Bathini fadump_conf->reserve_dump_area_start); 5852a1b06ddSHari Bathini } 58641df5928SHari Bathini } 58741df5928SHari Bathini 58841df5928SHari Bathini static void opal_fadump_trigger(struct fadump_crash_info_header *fdh, 58941df5928SHari Bathini const char *msg) 59041df5928SHari Bathini { 59141df5928SHari Bathini int rc; 59241df5928SHari Bathini 5935000a17aSHari Bathini /* 5945000a17aSHari Bathini * Unlike on pSeries platform, logical CPU number is not provided 5955000a17aSHari Bathini * with architected register state data. So, store the crashing 5965000a17aSHari Bathini * CPU's PIR instead to plug the appropriate register data for 5975000a17aSHari Bathini * crashing CPU in the vmcore file. 5985000a17aSHari Bathini */ 5995000a17aSHari Bathini fdh->crashing_cpu = (u32)mfspr(SPRN_PIR); 6005000a17aSHari Bathini 60141df5928SHari Bathini rc = opal_cec_reboot2(OPAL_REBOOT_MPIPL, msg); 60241df5928SHari Bathini if (rc == OPAL_UNSUPPORTED) { 60341df5928SHari Bathini pr_emerg("Reboot type %d not supported.\n", 60441df5928SHari Bathini OPAL_REBOOT_MPIPL); 60541df5928SHari Bathini } else if (rc == OPAL_HARDWARE) 60641df5928SHari Bathini pr_emerg("No backend support for MPIPL!\n"); 60741df5928SHari Bathini } 60841df5928SHari Bathini 60941df5928SHari Bathini static struct fadump_ops opal_fadump_ops = { 61041df5928SHari Bathini .fadump_init_mem_struct = opal_fadump_init_mem_struct, 611742a265aSHari Bathini .fadump_get_metadata_size = opal_fadump_get_metadata_size, 612742a265aSHari Bathini .fadump_setup_metadata = opal_fadump_setup_metadata, 6137b1b3b48SHari Bathini .fadump_get_bootmem_min = opal_fadump_get_bootmem_min, 61441df5928SHari Bathini .fadump_register = opal_fadump_register, 61541df5928SHari Bathini .fadump_unregister = opal_fadump_unregister, 61641df5928SHari Bathini .fadump_invalidate = opal_fadump_invalidate, 6172790d01dSHari Bathini .fadump_cleanup = opal_fadump_cleanup, 61841df5928SHari Bathini .fadump_process = opal_fadump_process, 61941df5928SHari Bathini .fadump_region_show = opal_fadump_region_show, 62041df5928SHari Bathini .fadump_trigger = opal_fadump_trigger, 62141df5928SHari Bathini }; 62241df5928SHari Bathini 62341df5928SHari Bathini void __init opal_fadump_dt_scan(struct fw_dump *fadump_conf, u64 node) 62441df5928SHari Bathini { 6252a1b06ddSHari Bathini const __be32 *prop; 62641df5928SHari Bathini unsigned long dn; 6272a1b06ddSHari Bathini u64 addr = 0; 6287b1b3b48SHari Bathini int i, len; 6292a1b06ddSHari Bathini s64 ret; 6302a1b06ddSHari Bathini 63141df5928SHari Bathini /* 63241df5928SHari Bathini * Check if Firmware-Assisted Dump is supported. if yes, check 63341df5928SHari Bathini * if dump has been initiated on last reboot. 63441df5928SHari Bathini */ 63541df5928SHari Bathini dn = of_get_flat_dt_subnode_by_name(node, "dump"); 63641df5928SHari Bathini if (dn == -FDT_ERR_NOTFOUND) { 63741df5928SHari Bathini pr_debug("FADump support is missing!\n"); 63841df5928SHari Bathini return; 63941df5928SHari Bathini } 64041df5928SHari Bathini 64141df5928SHari Bathini if (!of_flat_dt_is_compatible(dn, "ibm,opal-dump")) { 64241df5928SHari Bathini pr_err("Support missing for this f/w version!\n"); 64341df5928SHari Bathini return; 64441df5928SHari Bathini } 64541df5928SHari Bathini 6467b1b3b48SHari Bathini prop = of_get_flat_dt_prop(dn, "fw-load-area", &len); 6477b1b3b48SHari Bathini if (prop) { 6487b1b3b48SHari Bathini /* 6497b1b3b48SHari Bathini * Each f/w load area is an (address,size) pair, 6507b1b3b48SHari Bathini * 2 cells each, totalling 4 cells per range. 6517b1b3b48SHari Bathini */ 6527b1b3b48SHari Bathini for (i = 0; i < len / (sizeof(*prop) * 4); i++) { 6537b1b3b48SHari Bathini u64 base, end; 6547b1b3b48SHari Bathini 6557b1b3b48SHari Bathini base = of_read_number(prop + (i * 4) + 0, 2); 6567b1b3b48SHari Bathini end = base; 6577b1b3b48SHari Bathini end += of_read_number(prop + (i * 4) + 2, 2); 6587b1b3b48SHari Bathini if (end > OPAL_FADUMP_MIN_BOOT_MEM) { 6597b1b3b48SHari Bathini pr_err("F/W load area: 0x%llx-0x%llx\n", 6607b1b3b48SHari Bathini base, end); 6617b1b3b48SHari Bathini pr_err("F/W version not supported!\n"); 6627b1b3b48SHari Bathini return; 6637b1b3b48SHari Bathini } 6647b1b3b48SHari Bathini } 6657b1b3b48SHari Bathini } 6667b1b3b48SHari Bathini 66741df5928SHari Bathini fadump_conf->ops = &opal_fadump_ops; 66841df5928SHari Bathini fadump_conf->fadump_supported = 1; 6692a1b06ddSHari Bathini 6702a1b06ddSHari Bathini /* 6717dee93a9SHari Bathini * Firmware supports 32-bit field for size. Align it to PAGE_SIZE 6727dee93a9SHari Bathini * and request firmware to copy multiple kernel boot memory regions. 6737dee93a9SHari Bathini */ 674e96d904eSChristophe Leroy fadump_conf->max_copy_size = ALIGN_DOWN(U32_MAX, PAGE_SIZE); 6757dee93a9SHari Bathini 6767dee93a9SHari Bathini /* 6772a1b06ddSHari Bathini * Check if dump has been initiated on last reboot. 6782a1b06ddSHari Bathini */ 6792a1b06ddSHari Bathini prop = of_get_flat_dt_prop(dn, "mpipl-boot", NULL); 6802a1b06ddSHari Bathini if (!prop) 6812a1b06ddSHari Bathini return; 6822a1b06ddSHari Bathini 6832a1b06ddSHari Bathini ret = opal_mpipl_query_tag(OPAL_MPIPL_TAG_KERNEL, &addr); 6842a1b06ddSHari Bathini if ((ret != OPAL_SUCCESS) || !addr) { 6852a1b06ddSHari Bathini pr_err("Failed to get Kernel metadata (%lld)\n", ret); 6862a1b06ddSHari Bathini return; 6872a1b06ddSHari Bathini } 6882a1b06ddSHari Bathini 6892a1b06ddSHari Bathini addr = be64_to_cpu(addr); 6902a1b06ddSHari Bathini pr_debug("Kernel metadata addr: %llx\n", addr); 6912a1b06ddSHari Bathini 6922a1b06ddSHari Bathini opal_fdm_active = __va(addr); 6932a1b06ddSHari Bathini if (opal_fdm_active->version != OPAL_FADUMP_VERSION) { 6942a1b06ddSHari Bathini pr_warn("Supported kernel metadata version: %u, found: %d!\n", 6952a1b06ddSHari Bathini OPAL_FADUMP_VERSION, opal_fdm_active->version); 6962a1b06ddSHari Bathini pr_warn("WARNING: Kernel metadata format mismatch identified! Core file maybe corrupted..\n"); 6972a1b06ddSHari Bathini } 6982a1b06ddSHari Bathini 6992a1b06ddSHari Bathini /* Kernel regions not registered with f/w for MPIPL */ 7002a1b06ddSHari Bathini if (opal_fdm_active->registered_regions == 0) { 7012a1b06ddSHari Bathini opal_fdm_active = NULL; 7022a1b06ddSHari Bathini return; 7032a1b06ddSHari Bathini } 7042a1b06ddSHari Bathini 7055000a17aSHari Bathini ret = opal_mpipl_query_tag(OPAL_MPIPL_TAG_CPU, &addr); 7065000a17aSHari Bathini if (addr) { 7075000a17aSHari Bathini addr = be64_to_cpu(addr); 7085000a17aSHari Bathini pr_debug("CPU metadata addr: %llx\n", addr); 7095000a17aSHari Bathini opal_cpu_metadata = __va(addr); 7105000a17aSHari Bathini } 7115000a17aSHari Bathini 7122a1b06ddSHari Bathini pr_info("Firmware-assisted dump is active.\n"); 7132a1b06ddSHari Bathini fadump_conf->dump_active = 1; 7142a1b06ddSHari Bathini opal_fadump_get_config(fadump_conf, opal_fdm_active); 71541df5928SHari Bathini } 716bec53196SHari Bathini #endif /* !CONFIG_PRESERVE_FA_DUMP */ 717