11a59d1b8SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later 2eb39c880SMahesh Salgaonkar /* 3eb39c880SMahesh Salgaonkar * Firmware Assisted dump: A robust mechanism to get reliable kernel crash 4eb39c880SMahesh Salgaonkar * dump with assistance from firmware. This approach does not use kexec, 5eb39c880SMahesh Salgaonkar * instead firmware assists in booting the kdump kernel while preserving 6eb39c880SMahesh Salgaonkar * memory contents. The most of the code implementation has been adapted 7eb39c880SMahesh Salgaonkar * from phyp assisted dump implementation written by Linas Vepstas and 8eb39c880SMahesh Salgaonkar * Manish Ahuja 9eb39c880SMahesh Salgaonkar * 10eb39c880SMahesh Salgaonkar * Copyright 2011 IBM Corporation 11eb39c880SMahesh Salgaonkar * Author: Mahesh Salgaonkar <mahesh@linux.vnet.ibm.com> 12eb39c880SMahesh Salgaonkar */ 13eb39c880SMahesh Salgaonkar 14eb39c880SMahesh Salgaonkar #undef DEBUG 15eb39c880SMahesh Salgaonkar #define pr_fmt(fmt) "fadump: " fmt 16eb39c880SMahesh Salgaonkar 17eb39c880SMahesh Salgaonkar #include <linux/string.h> 18eb39c880SMahesh Salgaonkar #include <linux/memblock.h> 193ccc00a7SMahesh Salgaonkar #include <linux/delay.h> 203ccc00a7SMahesh Salgaonkar #include <linux/seq_file.h> 212df173d9SMahesh Salgaonkar #include <linux/crash_dump.h> 22b500afffSMahesh Salgaonkar #include <linux/kobject.h> 23b500afffSMahesh Salgaonkar #include <linux/sysfs.h> 24a5818313SHari Bathini #include <linux/slab.h> 25a4e92ce8SMahesh Salgaonkar #include <linux/cma.h> 2645d0ba52SChristophe Leroy #include <linux/hugetlb.h> 27eb39c880SMahesh Salgaonkar 287644d581SMichael Ellerman #include <asm/debugfs.h> 29eb39c880SMahesh Salgaonkar #include <asm/page.h> 30eb39c880SMahesh Salgaonkar #include <asm/prom.h> 31eb39c880SMahesh Salgaonkar #include <asm/fadump.h> 32ca986d7fSHari Bathini #include <asm/fadump-internal.h> 33cad3c834SStephen Rothwell #include <asm/setup.h> 34eb39c880SMahesh Salgaonkar 35eb39c880SMahesh Salgaonkar static struct fw_dump fw_dump; 363ccc00a7SMahesh Salgaonkar 37*b2a815a5SHari Bathini static void __init fadump_reserve_crash_area(u64 base); 38*b2a815a5SHari Bathini 393ccc00a7SMahesh Salgaonkar static DEFINE_MUTEX(fadump_mutex); 40e4fc48fbSHari Bathini struct fadump_mrange_info crash_mrange_info = { "crash", NULL, 0, 0, 0 }; 41dda9dbfeSHari Bathini struct fadump_mrange_info reserved_mrange_info = { "reserved", NULL, 0, 0, 0 }; 42eb39c880SMahesh Salgaonkar 43a4e92ce8SMahesh Salgaonkar #ifdef CONFIG_CMA 440226e552SHari Bathini static struct cma *fadump_cma; 450226e552SHari Bathini 46a4e92ce8SMahesh Salgaonkar /* 47a4e92ce8SMahesh Salgaonkar * fadump_cma_init() - Initialize CMA area from a fadump reserved memory 48a4e92ce8SMahesh Salgaonkar * 49a4e92ce8SMahesh Salgaonkar * This function initializes CMA area from fadump reserved memory. 50a4e92ce8SMahesh Salgaonkar * The total size of fadump reserved memory covers for boot memory size 51a4e92ce8SMahesh Salgaonkar * + cpu data size + hpte size and metadata. 52a4e92ce8SMahesh Salgaonkar * Initialize only the area equivalent to boot memory size for CMA use. 53a4e92ce8SMahesh Salgaonkar * The reamining portion of fadump reserved memory will be not given 54a4e92ce8SMahesh Salgaonkar * to CMA and pages for thoes will stay reserved. boot memory size is 55a4e92ce8SMahesh Salgaonkar * aligned per CMA requirement to satisy cma_init_reserved_mem() call. 56a4e92ce8SMahesh Salgaonkar * But for some reason even if it fails we still have the memory reservation 57a4e92ce8SMahesh Salgaonkar * with us and we can still continue doing fadump. 58a4e92ce8SMahesh Salgaonkar */ 59a4e92ce8SMahesh Salgaonkar int __init fadump_cma_init(void) 60a4e92ce8SMahesh Salgaonkar { 61a4e92ce8SMahesh Salgaonkar unsigned long long base, size; 62a4e92ce8SMahesh Salgaonkar int rc; 63a4e92ce8SMahesh Salgaonkar 64a4e92ce8SMahesh Salgaonkar if (!fw_dump.fadump_enabled) 65a4e92ce8SMahesh Salgaonkar return 0; 66a4e92ce8SMahesh Salgaonkar 67a4e92ce8SMahesh Salgaonkar /* 68a4e92ce8SMahesh Salgaonkar * Do not use CMA if user has provided fadump=nocma kernel parameter. 69a4e92ce8SMahesh Salgaonkar * Return 1 to continue with fadump old behaviour. 70a4e92ce8SMahesh Salgaonkar */ 71a4e92ce8SMahesh Salgaonkar if (fw_dump.nocma) 72a4e92ce8SMahesh Salgaonkar return 1; 73a4e92ce8SMahesh Salgaonkar 74a4e92ce8SMahesh Salgaonkar base = fw_dump.reserve_dump_area_start; 75a4e92ce8SMahesh Salgaonkar size = fw_dump.boot_memory_size; 76a4e92ce8SMahesh Salgaonkar 77a4e92ce8SMahesh Salgaonkar if (!size) 78a4e92ce8SMahesh Salgaonkar return 0; 79a4e92ce8SMahesh Salgaonkar 80a4e92ce8SMahesh Salgaonkar rc = cma_init_reserved_mem(base, size, 0, "fadump_cma", &fadump_cma); 81a4e92ce8SMahesh Salgaonkar if (rc) { 82a4e92ce8SMahesh Salgaonkar pr_err("Failed to init cma area for firmware-assisted dump,%d\n", rc); 83a4e92ce8SMahesh Salgaonkar /* 84a4e92ce8SMahesh Salgaonkar * Though the CMA init has failed we still have memory 85a4e92ce8SMahesh Salgaonkar * reservation with us. The reserved memory will be 86a4e92ce8SMahesh Salgaonkar * blocked from production system usage. Hence return 1, 87a4e92ce8SMahesh Salgaonkar * so that we can continue with fadump. 88a4e92ce8SMahesh Salgaonkar */ 89a4e92ce8SMahesh Salgaonkar return 1; 90a4e92ce8SMahesh Salgaonkar } 91a4e92ce8SMahesh Salgaonkar 92a4e92ce8SMahesh Salgaonkar /* 93a4e92ce8SMahesh Salgaonkar * So we now have successfully initialized cma area for fadump. 94a4e92ce8SMahesh Salgaonkar */ 95a4e92ce8SMahesh Salgaonkar pr_info("Initialized 0x%lx bytes cma area at %ldMB from 0x%lx " 96a4e92ce8SMahesh Salgaonkar "bytes of memory reserved for firmware-assisted dump\n", 97a4e92ce8SMahesh Salgaonkar cma_get_size(fadump_cma), 98a4e92ce8SMahesh Salgaonkar (unsigned long)cma_get_base(fadump_cma) >> 20, 99a4e92ce8SMahesh Salgaonkar fw_dump.reserve_dump_area_size); 100a4e92ce8SMahesh Salgaonkar return 1; 101a4e92ce8SMahesh Salgaonkar } 102a4e92ce8SMahesh Salgaonkar #else 103a4e92ce8SMahesh Salgaonkar static int __init fadump_cma_init(void) { return 1; } 104a4e92ce8SMahesh Salgaonkar #endif /* CONFIG_CMA */ 105a4e92ce8SMahesh Salgaonkar 106eb39c880SMahesh Salgaonkar /* Scan the Firmware Assisted dump configuration details. */ 107f3512011SHari Bathini int __init early_init_dt_scan_fw_dump(unsigned long node, const char *uname, 108f3512011SHari Bathini int depth, void *data) 109eb39c880SMahesh Salgaonkar { 11041df5928SHari Bathini if (depth != 1) 111eb39c880SMahesh Salgaonkar return 0; 112eb39c880SMahesh Salgaonkar 11341df5928SHari Bathini if (strcmp(uname, "rtas") == 0) { 114d3833a70SHari Bathini rtas_fadump_dt_scan(&fw_dump, node); 115eb39c880SMahesh Salgaonkar return 1; 116eb39c880SMahesh Salgaonkar } 117eb39c880SMahesh Salgaonkar 11841df5928SHari Bathini if (strcmp(uname, "ibm,opal") == 0) { 11941df5928SHari Bathini opal_fadump_dt_scan(&fw_dump, node); 12041df5928SHari Bathini return 1; 12141df5928SHari Bathini } 12241df5928SHari Bathini 12341df5928SHari Bathini return 0; 12441df5928SHari Bathini } 12541df5928SHari Bathini 126eae0dfccSHari Bathini /* 127eae0dfccSHari Bathini * If fadump is registered, check if the memory provided 1280db6896fSMahesh Salgaonkar * falls within boot memory area and reserved memory area. 129eae0dfccSHari Bathini */ 1300db6896fSMahesh Salgaonkar int is_fadump_memory_area(u64 addr, ulong size) 131eae0dfccSHari Bathini { 1320db6896fSMahesh Salgaonkar u64 d_start = fw_dump.reserve_dump_area_start; 1330db6896fSMahesh Salgaonkar u64 d_end = d_start + fw_dump.reserve_dump_area_size; 1340db6896fSMahesh Salgaonkar 135eae0dfccSHari Bathini if (!fw_dump.dump_registered) 136eae0dfccSHari Bathini return 0; 137eae0dfccSHari Bathini 1380db6896fSMahesh Salgaonkar if (((addr + size) > d_start) && (addr <= d_end)) 1390db6896fSMahesh Salgaonkar return 1; 1400db6896fSMahesh Salgaonkar 141eae0dfccSHari Bathini return (addr + size) > RMA_START && addr <= fw_dump.boot_memory_size; 142eae0dfccSHari Bathini } 143eae0dfccSHari Bathini 1446fcd6baaSNicholas Piggin int should_fadump_crash(void) 1456fcd6baaSNicholas Piggin { 1466fcd6baaSNicholas Piggin if (!fw_dump.dump_registered || !fw_dump.fadumphdr_addr) 1476fcd6baaSNicholas Piggin return 0; 1486fcd6baaSNicholas Piggin return 1; 1496fcd6baaSNicholas Piggin } 1506fcd6baaSNicholas Piggin 1513ccc00a7SMahesh Salgaonkar int is_fadump_active(void) 1523ccc00a7SMahesh Salgaonkar { 1533ccc00a7SMahesh Salgaonkar return fw_dump.dump_active; 1543ccc00a7SMahesh Salgaonkar } 1553ccc00a7SMahesh Salgaonkar 156a5a05b91SHari Bathini /* 157961cf26aSHari Bathini * Returns true, if there are no holes in memory area between d_start to d_end, 158961cf26aSHari Bathini * false otherwise. 159a5a05b91SHari Bathini */ 160961cf26aSHari Bathini static bool is_fadump_mem_area_contiguous(u64 d_start, u64 d_end) 161a5a05b91SHari Bathini { 162a5a05b91SHari Bathini struct memblock_region *reg; 163961cf26aSHari Bathini bool ret = false; 164961cf26aSHari Bathini u64 start, end; 165a5a05b91SHari Bathini 166a5a05b91SHari Bathini for_each_memblock(memory, reg) { 167961cf26aSHari Bathini start = max_t(u64, d_start, reg->base); 168961cf26aSHari Bathini end = min_t(u64, d_end, (reg->base + reg->size)); 169961cf26aSHari Bathini if (d_start < end) { 170961cf26aSHari Bathini /* Memory hole from d_start to start */ 171961cf26aSHari Bathini if (start > d_start) 172a5a05b91SHari Bathini break; 173a5a05b91SHari Bathini 174961cf26aSHari Bathini if (end == d_end) { 175961cf26aSHari Bathini ret = true; 176a5a05b91SHari Bathini break; 177a5a05b91SHari Bathini } 178a5a05b91SHari Bathini 179961cf26aSHari Bathini d_start = end + 1; 180a5a05b91SHari Bathini } 181a5a05b91SHari Bathini } 182a5a05b91SHari Bathini 183a5a05b91SHari Bathini return ret; 184a5a05b91SHari Bathini } 185a5a05b91SHari Bathini 186f86593beSMahesh Salgaonkar /* 187961cf26aSHari Bathini * Returns true, if there are no holes in boot memory area, 188961cf26aSHari Bathini * false otherwise. 189961cf26aSHari Bathini */ 1907f0ad11dSHari Bathini bool is_fadump_boot_mem_contiguous(void) 191961cf26aSHari Bathini { 192961cf26aSHari Bathini return is_fadump_mem_area_contiguous(0, fw_dump.boot_memory_size); 193961cf26aSHari Bathini } 194961cf26aSHari Bathini 195961cf26aSHari Bathini /* 196f86593beSMahesh Salgaonkar * Returns true, if there are no holes in reserved memory area, 197f86593beSMahesh Salgaonkar * false otherwise. 198f86593beSMahesh Salgaonkar */ 1997f0ad11dSHari Bathini bool is_fadump_reserved_mem_contiguous(void) 200f86593beSMahesh Salgaonkar { 201961cf26aSHari Bathini u64 d_start, d_end; 202f86593beSMahesh Salgaonkar 203961cf26aSHari Bathini d_start = fw_dump.reserve_dump_area_start; 204961cf26aSHari Bathini d_end = d_start + fw_dump.reserve_dump_area_size; 205961cf26aSHari Bathini return is_fadump_mem_area_contiguous(d_start, d_end); 206f86593beSMahesh Salgaonkar } 207f86593beSMahesh Salgaonkar 2083ccc00a7SMahesh Salgaonkar /* Print firmware assisted dump configurations for debugging purpose. */ 2093ccc00a7SMahesh Salgaonkar static void fadump_show_config(void) 2103ccc00a7SMahesh Salgaonkar { 2113ccc00a7SMahesh Salgaonkar pr_debug("Support for firmware-assisted dump (fadump): %s\n", 2123ccc00a7SMahesh Salgaonkar (fw_dump.fadump_supported ? "present" : "no support")); 2133ccc00a7SMahesh Salgaonkar 2143ccc00a7SMahesh Salgaonkar if (!fw_dump.fadump_supported) 2153ccc00a7SMahesh Salgaonkar return; 2163ccc00a7SMahesh Salgaonkar 2173ccc00a7SMahesh Salgaonkar pr_debug("Fadump enabled : %s\n", 2183ccc00a7SMahesh Salgaonkar (fw_dump.fadump_enabled ? "yes" : "no")); 2193ccc00a7SMahesh Salgaonkar pr_debug("Dump Active : %s\n", 2203ccc00a7SMahesh Salgaonkar (fw_dump.dump_active ? "yes" : "no")); 2213ccc00a7SMahesh Salgaonkar pr_debug("Dump section sizes:\n"); 2223ccc00a7SMahesh Salgaonkar pr_debug(" CPU state data size: %lx\n", fw_dump.cpu_state_data_size); 2233ccc00a7SMahesh Salgaonkar pr_debug(" HPTE region size : %lx\n", fw_dump.hpte_region_size); 2243ccc00a7SMahesh Salgaonkar pr_debug("Boot memory size : %lx\n", fw_dump.boot_memory_size); 2253ccc00a7SMahesh Salgaonkar } 2263ccc00a7SMahesh Salgaonkar 227eb39c880SMahesh Salgaonkar /** 228eb39c880SMahesh Salgaonkar * fadump_calculate_reserve_size(): reserve variable boot area 5% of System RAM 229eb39c880SMahesh Salgaonkar * 230eb39c880SMahesh Salgaonkar * Function to find the largest memory size we need to reserve during early 231eb39c880SMahesh Salgaonkar * boot process. This will be the size of the memory that is required for a 232eb39c880SMahesh Salgaonkar * kernel to boot successfully. 233eb39c880SMahesh Salgaonkar * 234eb39c880SMahesh Salgaonkar * This function has been taken from phyp-assisted dump feature implementation. 235eb39c880SMahesh Salgaonkar * 236eb39c880SMahesh Salgaonkar * returns larger of 256MB or 5% rounded down to multiples of 256MB. 237eb39c880SMahesh Salgaonkar * 238eb39c880SMahesh Salgaonkar * TODO: Come up with better approach to find out more accurate memory size 239eb39c880SMahesh Salgaonkar * that is required for a kernel to boot successfully. 240eb39c880SMahesh Salgaonkar * 241eb39c880SMahesh Salgaonkar */ 242eb39c880SMahesh Salgaonkar static inline unsigned long fadump_calculate_reserve_size(void) 243eb39c880SMahesh Salgaonkar { 24411550dc0SHari Bathini int ret; 24511550dc0SHari Bathini unsigned long long base, size; 246eb39c880SMahesh Salgaonkar 24781d9eca5SHari Bathini if (fw_dump.reserve_bootvar) 24881d9eca5SHari Bathini pr_warn("'fadump_reserve_mem=' parameter is deprecated in favor of 'crashkernel=' parameter.\n"); 24981d9eca5SHari Bathini 250eb39c880SMahesh Salgaonkar /* 25111550dc0SHari Bathini * Check if the size is specified through crashkernel= cmdline 252e7467dc6SHari Bathini * option. If yes, then use that but ignore base as fadump reserves 253e7467dc6SHari Bathini * memory at a predefined offset. 254eb39c880SMahesh Salgaonkar */ 25511550dc0SHari Bathini ret = parse_crashkernel(boot_command_line, memblock_phys_mem_size(), 25611550dc0SHari Bathini &size, &base); 25711550dc0SHari Bathini if (ret == 0 && size > 0) { 25848a316e3SHari Bathini unsigned long max_size; 25948a316e3SHari Bathini 26081d9eca5SHari Bathini if (fw_dump.reserve_bootvar) 26181d9eca5SHari Bathini pr_info("Using 'crashkernel=' parameter for memory reservation.\n"); 26281d9eca5SHari Bathini 26311550dc0SHari Bathini fw_dump.reserve_bootvar = (unsigned long)size; 26448a316e3SHari Bathini 26548a316e3SHari Bathini /* 26648a316e3SHari Bathini * Adjust if the boot memory size specified is above 26748a316e3SHari Bathini * the upper limit. 26848a316e3SHari Bathini */ 26948a316e3SHari Bathini max_size = memblock_phys_mem_size() / MAX_BOOT_MEM_RATIO; 27048a316e3SHari Bathini if (fw_dump.reserve_bootvar > max_size) { 27148a316e3SHari Bathini fw_dump.reserve_bootvar = max_size; 27248a316e3SHari Bathini pr_info("Adjusted boot memory size to %luMB\n", 27348a316e3SHari Bathini (fw_dump.reserve_bootvar >> 20)); 27448a316e3SHari Bathini } 27548a316e3SHari Bathini 276eb39c880SMahesh Salgaonkar return fw_dump.reserve_bootvar; 27781d9eca5SHari Bathini } else if (fw_dump.reserve_bootvar) { 27881d9eca5SHari Bathini /* 27981d9eca5SHari Bathini * 'fadump_reserve_mem=' is being used to reserve memory 28081d9eca5SHari Bathini * for firmware-assisted dump. 28181d9eca5SHari Bathini */ 28281d9eca5SHari Bathini return fw_dump.reserve_bootvar; 28311550dc0SHari Bathini } 284eb39c880SMahesh Salgaonkar 285eb39c880SMahesh Salgaonkar /* divide by 20 to get 5% of value */ 28648a316e3SHari Bathini size = memblock_phys_mem_size() / 20; 287eb39c880SMahesh Salgaonkar 288eb39c880SMahesh Salgaonkar /* round it down in multiples of 256 */ 289eb39c880SMahesh Salgaonkar size = size & ~0x0FFFFFFFUL; 290eb39c880SMahesh Salgaonkar 291eb39c880SMahesh Salgaonkar /* Truncate to memory_limit. We don't want to over reserve the memory.*/ 292eb39c880SMahesh Salgaonkar if (memory_limit && size > memory_limit) 293eb39c880SMahesh Salgaonkar size = memory_limit; 294eb39c880SMahesh Salgaonkar 295eb39c880SMahesh Salgaonkar return (size > MIN_BOOT_MEM ? size : MIN_BOOT_MEM); 296eb39c880SMahesh Salgaonkar } 297eb39c880SMahesh Salgaonkar 298eb39c880SMahesh Salgaonkar /* 299eb39c880SMahesh Salgaonkar * Calculate the total memory size required to be reserved for 300eb39c880SMahesh Salgaonkar * firmware-assisted dump registration. 301eb39c880SMahesh Salgaonkar */ 302eb39c880SMahesh Salgaonkar static unsigned long get_fadump_area_size(void) 303eb39c880SMahesh Salgaonkar { 304eb39c880SMahesh Salgaonkar unsigned long size = 0; 305eb39c880SMahesh Salgaonkar 306eb39c880SMahesh Salgaonkar size += fw_dump.cpu_state_data_size; 307eb39c880SMahesh Salgaonkar size += fw_dump.hpte_region_size; 308eb39c880SMahesh Salgaonkar size += fw_dump.boot_memory_size; 3092df173d9SMahesh Salgaonkar size += sizeof(struct fadump_crash_info_header); 3102df173d9SMahesh Salgaonkar size += sizeof(struct elfhdr); /* ELF core header.*/ 311ebaeb5aeSMahesh Salgaonkar size += sizeof(struct elf_phdr); /* place holder for cpu notes */ 3122df173d9SMahesh Salgaonkar /* Program headers for crash memory regions. */ 3132df173d9SMahesh Salgaonkar size += sizeof(struct elf_phdr) * (memblock_num_regions(memory) + 2); 314eb39c880SMahesh Salgaonkar 315eb39c880SMahesh Salgaonkar size = PAGE_ALIGN(size); 316742a265aSHari Bathini 317742a265aSHari Bathini /* This is to hold kernel metadata on platforms that support it */ 318742a265aSHari Bathini size += (fw_dump.ops->fadump_get_metadata_size ? 319742a265aSHari Bathini fw_dump.ops->fadump_get_metadata_size() : 0); 320eb39c880SMahesh Salgaonkar return size; 321eb39c880SMahesh Salgaonkar } 322eb39c880SMahesh Salgaonkar 323eb39c880SMahesh Salgaonkar int __init fadump_reserve_mem(void) 324eb39c880SMahesh Salgaonkar { 325579ca1a2SHari Bathini bool is_memblock_bottom_up = memblock_bottom_up(); 326579ca1a2SHari Bathini u64 base, size, mem_boundary, align = PAGE_SIZE; 3276abec12cSHari Bathini int ret = 1; 328eb39c880SMahesh Salgaonkar 329eb39c880SMahesh Salgaonkar if (!fw_dump.fadump_enabled) 330eb39c880SMahesh Salgaonkar return 0; 331eb39c880SMahesh Salgaonkar 332eb39c880SMahesh Salgaonkar if (!fw_dump.fadump_supported) { 3336abec12cSHari Bathini pr_info("Firmware-Assisted Dump is not supported on this hardware\n"); 3346abec12cSHari Bathini goto error_out; 335eb39c880SMahesh Salgaonkar } 336742a265aSHari Bathini 3373ccc00a7SMahesh Salgaonkar /* 3383ccc00a7SMahesh Salgaonkar * Initialize boot memory size 3393ccc00a7SMahesh Salgaonkar * If dump is active then we have already calculated the size during 3403ccc00a7SMahesh Salgaonkar * first kernel. 3413ccc00a7SMahesh Salgaonkar */ 342f3512011SHari Bathini if (!fw_dump.dump_active) { 3436abec12cSHari Bathini fw_dump.boot_memory_size = 3446abec12cSHari Bathini PAGE_ALIGN(fadump_calculate_reserve_size()); 345a4e92ce8SMahesh Salgaonkar #ifdef CONFIG_CMA 346579ca1a2SHari Bathini if (!fw_dump.nocma) { 347579ca1a2SHari Bathini align = FADUMP_CMA_ALIGNMENT; 348a4e92ce8SMahesh Salgaonkar fw_dump.boot_memory_size = 349579ca1a2SHari Bathini ALIGN(fw_dump.boot_memory_size, align); 350579ca1a2SHari Bathini } 351a4e92ce8SMahesh Salgaonkar #endif 352a4e92ce8SMahesh Salgaonkar } 353eb39c880SMahesh Salgaonkar 354eb39c880SMahesh Salgaonkar /* 355eb39c880SMahesh Salgaonkar * Calculate the memory boundary. 356eb39c880SMahesh Salgaonkar * If memory_limit is less than actual memory boundary then reserve 357eb39c880SMahesh Salgaonkar * the memory for fadump beyond the memory_limit and adjust the 358eb39c880SMahesh Salgaonkar * memory_limit accordingly, so that the running kernel can run with 359eb39c880SMahesh Salgaonkar * specified memory_limit. 360eb39c880SMahesh Salgaonkar */ 361eb39c880SMahesh Salgaonkar if (memory_limit && memory_limit < memblock_end_of_DRAM()) { 362eb39c880SMahesh Salgaonkar size = get_fadump_area_size(); 363eb39c880SMahesh Salgaonkar if ((memory_limit + size) < memblock_end_of_DRAM()) 364eb39c880SMahesh Salgaonkar memory_limit += size; 365eb39c880SMahesh Salgaonkar else 366eb39c880SMahesh Salgaonkar memory_limit = memblock_end_of_DRAM(); 367eb39c880SMahesh Salgaonkar printk(KERN_INFO "Adjusted memory_limit for firmware-assisted" 368a84fcd46SSuzuki Poulose " dump, now %#016llx\n", memory_limit); 369eb39c880SMahesh Salgaonkar } 370eb39c880SMahesh Salgaonkar if (memory_limit) 3716abec12cSHari Bathini mem_boundary = memory_limit; 372eb39c880SMahesh Salgaonkar else 3736abec12cSHari Bathini mem_boundary = memblock_end_of_DRAM(); 374eb39c880SMahesh Salgaonkar 3756abec12cSHari Bathini base = fw_dump.boot_memory_size; 3768255da95SHari Bathini size = get_fadump_area_size(); 3778255da95SHari Bathini fw_dump.reserve_dump_area_size = size; 378eb39c880SMahesh Salgaonkar if (fw_dump.dump_active) { 379b71a693dSMahesh Salgaonkar pr_info("Firmware-assisted dump is active.\n"); 380b71a693dSMahesh Salgaonkar 38185975387SHari Bathini #ifdef CONFIG_HUGETLB_PAGE 38285975387SHari Bathini /* 38385975387SHari Bathini * FADump capture kernel doesn't care much about hugepages. 38485975387SHari Bathini * In fact, handling hugepages in capture kernel is asking for 38585975387SHari Bathini * trouble. So, disable HugeTLB support when fadump is active. 38685975387SHari Bathini */ 38785975387SHari Bathini hugetlb_disabled = true; 38885975387SHari Bathini #endif 389eb39c880SMahesh Salgaonkar /* 390eb39c880SMahesh Salgaonkar * If last boot has crashed then reserve all the memory 391*b2a815a5SHari Bathini * above boot memory size so that we don't touch it until 392eb39c880SMahesh Salgaonkar * dump is written to disk by userspace tool. This memory 393*b2a815a5SHari Bathini * can be released for general use by invalidating fadump. 394eb39c880SMahesh Salgaonkar */ 395*b2a815a5SHari Bathini fadump_reserve_crash_area(base); 3962df173d9SMahesh Salgaonkar 397f3512011SHari Bathini pr_debug("fadumphdr_addr = %#016lx\n", fw_dump.fadumphdr_addr); 398f3512011SHari Bathini pr_debug("Reserve dump area start address: 0x%lx\n", 399f3512011SHari Bathini fw_dump.reserve_dump_area_start); 4008255da95SHari Bathini } else { 4018255da95SHari Bathini /* 402f6e6bedbSHari Bathini * Reserve memory at an offset closer to bottom of the RAM to 403579ca1a2SHari Bathini * minimize the impact of memory hot-remove operation. 404f6e6bedbSHari Bathini */ 405579ca1a2SHari Bathini memblock_set_bottom_up(true); 406579ca1a2SHari Bathini base = memblock_find_in_range(base, mem_boundary, size, align); 4076abec12cSHari Bathini 408579ca1a2SHari Bathini /* Restore the previous allocation mode */ 409579ca1a2SHari Bathini memblock_set_bottom_up(is_memblock_bottom_up); 410f6e6bedbSHari Bathini 411579ca1a2SHari Bathini if (!base) { 412742a265aSHari Bathini pr_err("Failed to find memory chunk for reservation!\n"); 413742a265aSHari Bathini goto error_out; 414742a265aSHari Bathini } 415742a265aSHari Bathini fw_dump.reserve_dump_area_start = base; 416742a265aSHari Bathini 417742a265aSHari Bathini /* 418742a265aSHari Bathini * Calculate the kernel metadata address and register it with 419742a265aSHari Bathini * f/w if the platform supports. 420742a265aSHari Bathini */ 421742a265aSHari Bathini if (fw_dump.ops->fadump_setup_metadata && 422742a265aSHari Bathini (fw_dump.ops->fadump_setup_metadata(&fw_dump) < 0)) 423742a265aSHari Bathini goto error_out; 424742a265aSHari Bathini 425742a265aSHari Bathini if (memblock_reserve(base, size)) { 4266abec12cSHari Bathini pr_err("Failed to reserve memory!\n"); 4276abec12cSHari Bathini goto error_out; 4286abec12cSHari Bathini } 4296abec12cSHari Bathini 4306abec12cSHari Bathini pr_info("Reserved %lldMB of memory at %#016llx (System RAM: %lldMB)\n", 4316abec12cSHari Bathini (size >> 20), base, (memblock_phys_mem_size() >> 20)); 432f6e6bedbSHari Bathini 4336abec12cSHari Bathini ret = fadump_cma_init(); 434a4e92ce8SMahesh Salgaonkar } 4356abec12cSHari Bathini 4366abec12cSHari Bathini return ret; 4376abec12cSHari Bathini error_out: 4386abec12cSHari Bathini fw_dump.fadump_enabled = 0; 4396abec12cSHari Bathini return 0; 440eb39c880SMahesh Salgaonkar } 441eb39c880SMahesh Salgaonkar 4421e76609cSSrikar Dronamraju unsigned long __init arch_reserved_kernel_pages(void) 4431e76609cSSrikar Dronamraju { 4441e76609cSSrikar Dronamraju return memblock_reserved_size() / PAGE_SIZE; 4451e76609cSSrikar Dronamraju } 4461e76609cSSrikar Dronamraju 447eb39c880SMahesh Salgaonkar /* Look for fadump= cmdline option. */ 448eb39c880SMahesh Salgaonkar static int __init early_fadump_param(char *p) 449eb39c880SMahesh Salgaonkar { 450eb39c880SMahesh Salgaonkar if (!p) 451eb39c880SMahesh Salgaonkar return 1; 452eb39c880SMahesh Salgaonkar 453eb39c880SMahesh Salgaonkar if (strncmp(p, "on", 2) == 0) 454eb39c880SMahesh Salgaonkar fw_dump.fadump_enabled = 1; 455eb39c880SMahesh Salgaonkar else if (strncmp(p, "off", 3) == 0) 456eb39c880SMahesh Salgaonkar fw_dump.fadump_enabled = 0; 457a4e92ce8SMahesh Salgaonkar else if (strncmp(p, "nocma", 5) == 0) { 458a4e92ce8SMahesh Salgaonkar fw_dump.fadump_enabled = 1; 459a4e92ce8SMahesh Salgaonkar fw_dump.nocma = 1; 460a4e92ce8SMahesh Salgaonkar } 461eb39c880SMahesh Salgaonkar 462eb39c880SMahesh Salgaonkar return 0; 463eb39c880SMahesh Salgaonkar } 464eb39c880SMahesh Salgaonkar early_param("fadump", early_fadump_param); 465eb39c880SMahesh Salgaonkar 46681d9eca5SHari Bathini /* 46781d9eca5SHari Bathini * Look for fadump_reserve_mem= cmdline option 46881d9eca5SHari Bathini * TODO: Remove references to 'fadump_reserve_mem=' parameter, 46981d9eca5SHari Bathini * the sooner 'crashkernel=' parameter is accustomed to. 47081d9eca5SHari Bathini */ 47181d9eca5SHari Bathini static int __init early_fadump_reserve_mem(char *p) 47281d9eca5SHari Bathini { 47381d9eca5SHari Bathini if (p) 47481d9eca5SHari Bathini fw_dump.reserve_bootvar = memparse(p, &p); 47581d9eca5SHari Bathini return 0; 47681d9eca5SHari Bathini } 47781d9eca5SHari Bathini early_param("fadump_reserve_mem", early_fadump_reserve_mem); 47881d9eca5SHari Bathini 479ebaeb5aeSMahesh Salgaonkar void crash_fadump(struct pt_regs *regs, const char *str) 480ebaeb5aeSMahesh Salgaonkar { 481ebaeb5aeSMahesh Salgaonkar struct fadump_crash_info_header *fdh = NULL; 482f2a5e8f0SMahesh Salgaonkar int old_cpu, this_cpu; 483ebaeb5aeSMahesh Salgaonkar 4846fcd6baaSNicholas Piggin if (!should_fadump_crash()) 485ebaeb5aeSMahesh Salgaonkar return; 486ebaeb5aeSMahesh Salgaonkar 487f2a5e8f0SMahesh Salgaonkar /* 488f2a5e8f0SMahesh Salgaonkar * old_cpu == -1 means this is the first CPU which has come here, 489f2a5e8f0SMahesh Salgaonkar * go ahead and trigger fadump. 490f2a5e8f0SMahesh Salgaonkar * 491f2a5e8f0SMahesh Salgaonkar * old_cpu != -1 means some other CPU has already on it's way 492f2a5e8f0SMahesh Salgaonkar * to trigger fadump, just keep looping here. 493f2a5e8f0SMahesh Salgaonkar */ 494f2a5e8f0SMahesh Salgaonkar this_cpu = smp_processor_id(); 495f2a5e8f0SMahesh Salgaonkar old_cpu = cmpxchg(&crashing_cpu, -1, this_cpu); 496f2a5e8f0SMahesh Salgaonkar 497f2a5e8f0SMahesh Salgaonkar if (old_cpu != -1) { 498f2a5e8f0SMahesh Salgaonkar /* 499f2a5e8f0SMahesh Salgaonkar * We can't loop here indefinitely. Wait as long as fadump 500f2a5e8f0SMahesh Salgaonkar * is in force. If we race with fadump un-registration this 501f2a5e8f0SMahesh Salgaonkar * loop will break and then we go down to normal panic path 502f2a5e8f0SMahesh Salgaonkar * and reboot. If fadump is in force the first crashing 503f2a5e8f0SMahesh Salgaonkar * cpu will definitely trigger fadump. 504f2a5e8f0SMahesh Salgaonkar */ 505f2a5e8f0SMahesh Salgaonkar while (fw_dump.dump_registered) 506f2a5e8f0SMahesh Salgaonkar cpu_relax(); 507f2a5e8f0SMahesh Salgaonkar return; 508f2a5e8f0SMahesh Salgaonkar } 509f2a5e8f0SMahesh Salgaonkar 510ebaeb5aeSMahesh Salgaonkar fdh = __va(fw_dump.fadumphdr_addr); 511ebaeb5aeSMahesh Salgaonkar fdh->crashing_cpu = crashing_cpu; 512ebaeb5aeSMahesh Salgaonkar crash_save_vmcoreinfo(); 513ebaeb5aeSMahesh Salgaonkar 514ebaeb5aeSMahesh Salgaonkar if (regs) 515ebaeb5aeSMahesh Salgaonkar fdh->regs = *regs; 516ebaeb5aeSMahesh Salgaonkar else 517ebaeb5aeSMahesh Salgaonkar ppc_save_regs(&fdh->regs); 518ebaeb5aeSMahesh Salgaonkar 519a0512164SRasmus Villemoes fdh->online_mask = *cpu_online_mask; 520ebaeb5aeSMahesh Salgaonkar 52141a65d16SHari Bathini fw_dump.ops->fadump_trigger(fdh, str); 522ebaeb5aeSMahesh Salgaonkar } 523ebaeb5aeSMahesh Salgaonkar 5247f0ad11dSHari Bathini u32 *fadump_regs_to_elf_notes(u32 *buf, struct pt_regs *regs) 525ebaeb5aeSMahesh Salgaonkar { 526ebaeb5aeSMahesh Salgaonkar struct elf_prstatus prstatus; 527ebaeb5aeSMahesh Salgaonkar 528ebaeb5aeSMahesh Salgaonkar memset(&prstatus, 0, sizeof(prstatus)); 529ebaeb5aeSMahesh Salgaonkar /* 530ebaeb5aeSMahesh Salgaonkar * FIXME: How do i get PID? Do I really need it? 531ebaeb5aeSMahesh Salgaonkar * prstatus.pr_pid = ???? 532ebaeb5aeSMahesh Salgaonkar */ 533ebaeb5aeSMahesh Salgaonkar elf_core_copy_kernel_regs(&prstatus.pr_reg, regs); 53422bd0177SHari Bathini buf = append_elf_note(buf, CRASH_CORE_NOTE_NAME, NT_PRSTATUS, 535ebaeb5aeSMahesh Salgaonkar &prstatus, sizeof(prstatus)); 536ebaeb5aeSMahesh Salgaonkar return buf; 537ebaeb5aeSMahesh Salgaonkar } 538ebaeb5aeSMahesh Salgaonkar 5397f0ad11dSHari Bathini void fadump_update_elfcore_header(char *bufp) 540ebaeb5aeSMahesh Salgaonkar { 541ebaeb5aeSMahesh Salgaonkar struct elfhdr *elf; 542ebaeb5aeSMahesh Salgaonkar struct elf_phdr *phdr; 543ebaeb5aeSMahesh Salgaonkar 544ebaeb5aeSMahesh Salgaonkar elf = (struct elfhdr *)bufp; 545ebaeb5aeSMahesh Salgaonkar bufp += sizeof(struct elfhdr); 546ebaeb5aeSMahesh Salgaonkar 547ebaeb5aeSMahesh Salgaonkar /* First note is a place holder for cpu notes info. */ 548ebaeb5aeSMahesh Salgaonkar phdr = (struct elf_phdr *)bufp; 549ebaeb5aeSMahesh Salgaonkar 550ebaeb5aeSMahesh Salgaonkar if (phdr->p_type == PT_NOTE) { 551961cf26aSHari Bathini phdr->p_paddr = __pa(fw_dump.cpu_notes_buf_vaddr); 552ebaeb5aeSMahesh Salgaonkar phdr->p_offset = phdr->p_paddr; 553ebaeb5aeSMahesh Salgaonkar phdr->p_filesz = fw_dump.cpu_notes_buf_size; 554ebaeb5aeSMahesh Salgaonkar phdr->p_memsz = fw_dump.cpu_notes_buf_size; 555ebaeb5aeSMahesh Salgaonkar } 556ebaeb5aeSMahesh Salgaonkar return; 557ebaeb5aeSMahesh Salgaonkar } 558ebaeb5aeSMahesh Salgaonkar 559961cf26aSHari Bathini static void *fadump_alloc_buffer(unsigned long size) 560ebaeb5aeSMahesh Salgaonkar { 56172aa6517SHari Bathini unsigned long count, i; 562ebaeb5aeSMahesh Salgaonkar struct page *page; 56372aa6517SHari Bathini void *vaddr; 564ebaeb5aeSMahesh Salgaonkar 56572aa6517SHari Bathini vaddr = alloc_pages_exact(size, GFP_KERNEL | __GFP_ZERO); 566ebaeb5aeSMahesh Salgaonkar if (!vaddr) 567ebaeb5aeSMahesh Salgaonkar return NULL; 568ebaeb5aeSMahesh Salgaonkar 56972aa6517SHari Bathini count = PAGE_ALIGN(size) / PAGE_SIZE; 570ebaeb5aeSMahesh Salgaonkar page = virt_to_page(vaddr); 571ebaeb5aeSMahesh Salgaonkar for (i = 0; i < count; i++) 57272aa6517SHari Bathini mark_page_reserved(page + i); 573ebaeb5aeSMahesh Salgaonkar return vaddr; 574ebaeb5aeSMahesh Salgaonkar } 575ebaeb5aeSMahesh Salgaonkar 576961cf26aSHari Bathini static void fadump_free_buffer(unsigned long vaddr, unsigned long size) 577ebaeb5aeSMahesh Salgaonkar { 57872aa6517SHari Bathini free_reserved_area((void *)vaddr, (void *)(vaddr + size), -1, NULL); 579ebaeb5aeSMahesh Salgaonkar } 580ebaeb5aeSMahesh Salgaonkar 5817f0ad11dSHari Bathini s32 fadump_setup_cpu_notes_buf(u32 num_cpus) 582961cf26aSHari Bathini { 583961cf26aSHari Bathini /* Allocate buffer to hold cpu crash notes. */ 584961cf26aSHari Bathini fw_dump.cpu_notes_buf_size = num_cpus * sizeof(note_buf_t); 585961cf26aSHari Bathini fw_dump.cpu_notes_buf_size = PAGE_ALIGN(fw_dump.cpu_notes_buf_size); 586961cf26aSHari Bathini fw_dump.cpu_notes_buf_vaddr = 587961cf26aSHari Bathini (unsigned long)fadump_alloc_buffer(fw_dump.cpu_notes_buf_size); 588961cf26aSHari Bathini if (!fw_dump.cpu_notes_buf_vaddr) { 589961cf26aSHari Bathini pr_err("Failed to allocate %ld bytes for CPU notes buffer\n", 590961cf26aSHari Bathini fw_dump.cpu_notes_buf_size); 591961cf26aSHari Bathini return -ENOMEM; 592961cf26aSHari Bathini } 593961cf26aSHari Bathini 594961cf26aSHari Bathini pr_debug("Allocated buffer for cpu notes of size %ld at 0x%lx\n", 595961cf26aSHari Bathini fw_dump.cpu_notes_buf_size, 596961cf26aSHari Bathini fw_dump.cpu_notes_buf_vaddr); 597961cf26aSHari Bathini return 0; 598961cf26aSHari Bathini } 599961cf26aSHari Bathini 6007f0ad11dSHari Bathini void fadump_free_cpu_notes_buf(void) 601961cf26aSHari Bathini { 602961cf26aSHari Bathini if (!fw_dump.cpu_notes_buf_vaddr) 603961cf26aSHari Bathini return; 604961cf26aSHari Bathini 605961cf26aSHari Bathini fadump_free_buffer(fw_dump.cpu_notes_buf_vaddr, 606961cf26aSHari Bathini fw_dump.cpu_notes_buf_size); 607961cf26aSHari Bathini fw_dump.cpu_notes_buf_vaddr = 0; 608961cf26aSHari Bathini fw_dump.cpu_notes_buf_size = 0; 609961cf26aSHari Bathini } 610961cf26aSHari Bathini 611e4fc48fbSHari Bathini static void fadump_free_mem_ranges(struct fadump_mrange_info *mrange_info) 6121bd6a1c4SHari Bathini { 613e4fc48fbSHari Bathini kfree(mrange_info->mem_ranges); 614e4fc48fbSHari Bathini mrange_info->mem_ranges = NULL; 615e4fc48fbSHari Bathini mrange_info->mem_ranges_sz = 0; 616e4fc48fbSHari Bathini mrange_info->max_mem_ranges = 0; 6171bd6a1c4SHari Bathini } 6181bd6a1c4SHari Bathini 6191bd6a1c4SHari Bathini /* 620e4fc48fbSHari Bathini * Allocate or reallocate mem_ranges array in incremental units 6211bd6a1c4SHari Bathini * of PAGE_SIZE. 6221bd6a1c4SHari Bathini */ 623e4fc48fbSHari Bathini static int fadump_alloc_mem_ranges(struct fadump_mrange_info *mrange_info) 6241bd6a1c4SHari Bathini { 625e4fc48fbSHari Bathini struct fadump_memory_range *new_array; 6261bd6a1c4SHari Bathini u64 new_size; 6271bd6a1c4SHari Bathini 628e4fc48fbSHari Bathini new_size = mrange_info->mem_ranges_sz + PAGE_SIZE; 629e4fc48fbSHari Bathini pr_debug("Allocating %llu bytes of memory for %s memory ranges\n", 630e4fc48fbSHari Bathini new_size, mrange_info->name); 6311bd6a1c4SHari Bathini 632e4fc48fbSHari Bathini new_array = krealloc(mrange_info->mem_ranges, new_size, GFP_KERNEL); 6331bd6a1c4SHari Bathini if (new_array == NULL) { 634e4fc48fbSHari Bathini pr_err("Insufficient memory for setting up %s memory ranges\n", 635e4fc48fbSHari Bathini mrange_info->name); 636e4fc48fbSHari Bathini fadump_free_mem_ranges(mrange_info); 6371bd6a1c4SHari Bathini return -ENOMEM; 6381bd6a1c4SHari Bathini } 6391bd6a1c4SHari Bathini 640e4fc48fbSHari Bathini mrange_info->mem_ranges = new_array; 641e4fc48fbSHari Bathini mrange_info->mem_ranges_sz = new_size; 642e4fc48fbSHari Bathini mrange_info->max_mem_ranges = (new_size / 643e4fc48fbSHari Bathini sizeof(struct fadump_memory_range)); 6441bd6a1c4SHari Bathini return 0; 6451bd6a1c4SHari Bathini } 6461bd6a1c4SHari Bathini 647e4fc48fbSHari Bathini static inline int fadump_add_mem_range(struct fadump_mrange_info *mrange_info, 648e4fc48fbSHari Bathini u64 base, u64 end) 6492df173d9SMahesh Salgaonkar { 650e4fc48fbSHari Bathini struct fadump_memory_range *mem_ranges = mrange_info->mem_ranges; 651ced1bf52SHari Bathini bool is_adjacent = false; 652e4fc48fbSHari Bathini u64 start, size; 653ced1bf52SHari Bathini 6542df173d9SMahesh Salgaonkar if (base == end) 6551bd6a1c4SHari Bathini return 0; 6561bd6a1c4SHari Bathini 657ced1bf52SHari Bathini /* 658ced1bf52SHari Bathini * Fold adjacent memory ranges to bring down the memory ranges/ 659ced1bf52SHari Bathini * PT_LOAD segments count. 660ced1bf52SHari Bathini */ 661e4fc48fbSHari Bathini if (mrange_info->mem_range_cnt) { 662e4fc48fbSHari Bathini start = mem_ranges[mrange_info->mem_range_cnt - 1].base; 663e4fc48fbSHari Bathini size = mem_ranges[mrange_info->mem_range_cnt - 1].size; 664ced1bf52SHari Bathini 665ced1bf52SHari Bathini if ((start + size) == base) 666ced1bf52SHari Bathini is_adjacent = true; 667ced1bf52SHari Bathini } 668ced1bf52SHari Bathini if (!is_adjacent) { 669ced1bf52SHari Bathini /* resize the array on reaching the limit */ 670e4fc48fbSHari Bathini if (mrange_info->mem_range_cnt == mrange_info->max_mem_ranges) { 6711bd6a1c4SHari Bathini int ret; 6721bd6a1c4SHari Bathini 673e4fc48fbSHari Bathini ret = fadump_alloc_mem_ranges(mrange_info); 6741bd6a1c4SHari Bathini if (ret) 6751bd6a1c4SHari Bathini return ret; 676e4fc48fbSHari Bathini 677e4fc48fbSHari Bathini /* Update to the new resized array */ 678e4fc48fbSHari Bathini mem_ranges = mrange_info->mem_ranges; 6791bd6a1c4SHari Bathini } 6802df173d9SMahesh Salgaonkar 681ced1bf52SHari Bathini start = base; 682e4fc48fbSHari Bathini mem_ranges[mrange_info->mem_range_cnt].base = start; 683e4fc48fbSHari Bathini mrange_info->mem_range_cnt++; 684ced1bf52SHari Bathini } 685ced1bf52SHari Bathini 686e4fc48fbSHari Bathini mem_ranges[mrange_info->mem_range_cnt - 1].size = (end - start); 687e4fc48fbSHari Bathini pr_debug("%s_memory_range[%d] [%#016llx-%#016llx], %#llx bytes\n", 688e4fc48fbSHari Bathini mrange_info->name, (mrange_info->mem_range_cnt - 1), 689e4fc48fbSHari Bathini start, end - 1, (end - start)); 6901bd6a1c4SHari Bathini return 0; 6912df173d9SMahesh Salgaonkar } 6922df173d9SMahesh Salgaonkar 693e4fc48fbSHari Bathini static int fadump_exclude_reserved_area(u64 start, u64 end) 6942df173d9SMahesh Salgaonkar { 695e4fc48fbSHari Bathini u64 ra_start, ra_end; 6961bd6a1c4SHari Bathini int ret = 0; 6972df173d9SMahesh Salgaonkar 6982df173d9SMahesh Salgaonkar ra_start = fw_dump.reserve_dump_area_start; 6992df173d9SMahesh Salgaonkar ra_end = ra_start + fw_dump.reserve_dump_area_size; 7002df173d9SMahesh Salgaonkar 7012df173d9SMahesh Salgaonkar if ((ra_start < end) && (ra_end > start)) { 7022df173d9SMahesh Salgaonkar if ((start < ra_start) && (end > ra_end)) { 703e4fc48fbSHari Bathini ret = fadump_add_mem_range(&crash_mrange_info, 704e4fc48fbSHari Bathini start, ra_start); 7051bd6a1c4SHari Bathini if (ret) 7061bd6a1c4SHari Bathini return ret; 7071bd6a1c4SHari Bathini 708e4fc48fbSHari Bathini ret = fadump_add_mem_range(&crash_mrange_info, 709e4fc48fbSHari Bathini ra_end, end); 7102df173d9SMahesh Salgaonkar } else if (start < ra_start) { 711e4fc48fbSHari Bathini ret = fadump_add_mem_range(&crash_mrange_info, 712e4fc48fbSHari Bathini start, ra_start); 7132df173d9SMahesh Salgaonkar } else if (ra_end < end) { 714e4fc48fbSHari Bathini ret = fadump_add_mem_range(&crash_mrange_info, 715e4fc48fbSHari Bathini ra_end, end); 7162df173d9SMahesh Salgaonkar } 7172df173d9SMahesh Salgaonkar } else 718e4fc48fbSHari Bathini ret = fadump_add_mem_range(&crash_mrange_info, start, end); 7191bd6a1c4SHari Bathini 7201bd6a1c4SHari Bathini return ret; 7212df173d9SMahesh Salgaonkar } 7222df173d9SMahesh Salgaonkar 7232df173d9SMahesh Salgaonkar static int fadump_init_elfcore_header(char *bufp) 7242df173d9SMahesh Salgaonkar { 7252df173d9SMahesh Salgaonkar struct elfhdr *elf; 7262df173d9SMahesh Salgaonkar 7272df173d9SMahesh Salgaonkar elf = (struct elfhdr *) bufp; 7282df173d9SMahesh Salgaonkar bufp += sizeof(struct elfhdr); 7292df173d9SMahesh Salgaonkar memcpy(elf->e_ident, ELFMAG, SELFMAG); 7302df173d9SMahesh Salgaonkar elf->e_ident[EI_CLASS] = ELF_CLASS; 7312df173d9SMahesh Salgaonkar elf->e_ident[EI_DATA] = ELF_DATA; 7322df173d9SMahesh Salgaonkar elf->e_ident[EI_VERSION] = EV_CURRENT; 7332df173d9SMahesh Salgaonkar elf->e_ident[EI_OSABI] = ELF_OSABI; 7342df173d9SMahesh Salgaonkar memset(elf->e_ident+EI_PAD, 0, EI_NIDENT-EI_PAD); 7352df173d9SMahesh Salgaonkar elf->e_type = ET_CORE; 7362df173d9SMahesh Salgaonkar elf->e_machine = ELF_ARCH; 7372df173d9SMahesh Salgaonkar elf->e_version = EV_CURRENT; 7382df173d9SMahesh Salgaonkar elf->e_entry = 0; 7392df173d9SMahesh Salgaonkar elf->e_phoff = sizeof(struct elfhdr); 7402df173d9SMahesh Salgaonkar elf->e_shoff = 0; 741d8bced27SDaniel Axtens #if defined(_CALL_ELF) 742d8bced27SDaniel Axtens elf->e_flags = _CALL_ELF; 743d8bced27SDaniel Axtens #else 744d8bced27SDaniel Axtens elf->e_flags = 0; 745d8bced27SDaniel Axtens #endif 7462df173d9SMahesh Salgaonkar elf->e_ehsize = sizeof(struct elfhdr); 7472df173d9SMahesh Salgaonkar elf->e_phentsize = sizeof(struct elf_phdr); 7482df173d9SMahesh Salgaonkar elf->e_phnum = 0; 7492df173d9SMahesh Salgaonkar elf->e_shentsize = 0; 7502df173d9SMahesh Salgaonkar elf->e_shnum = 0; 7512df173d9SMahesh Salgaonkar elf->e_shstrndx = 0; 7522df173d9SMahesh Salgaonkar 7532df173d9SMahesh Salgaonkar return 0; 7542df173d9SMahesh Salgaonkar } 7552df173d9SMahesh Salgaonkar 7562df173d9SMahesh Salgaonkar /* 7572df173d9SMahesh Salgaonkar * Traverse through memblock structure and setup crash memory ranges. These 7582df173d9SMahesh Salgaonkar * ranges will be used create PT_LOAD program headers in elfcore header. 7592df173d9SMahesh Salgaonkar */ 7601bd6a1c4SHari Bathini static int fadump_setup_crash_memory_ranges(void) 7612df173d9SMahesh Salgaonkar { 7622df173d9SMahesh Salgaonkar struct memblock_region *reg; 763e4fc48fbSHari Bathini u64 start, end; 7641bd6a1c4SHari Bathini int ret; 7652df173d9SMahesh Salgaonkar 7662df173d9SMahesh Salgaonkar pr_debug("Setup crash memory ranges.\n"); 767e4fc48fbSHari Bathini crash_mrange_info.mem_range_cnt = 0; 768ced1bf52SHari Bathini 7692df173d9SMahesh Salgaonkar /* 7702df173d9SMahesh Salgaonkar * add the first memory chunk (RMA_START through boot_memory_size) as 7712df173d9SMahesh Salgaonkar * a separate memory chunk. The reason is, at the time crash firmware 7722df173d9SMahesh Salgaonkar * will move the content of this memory chunk to different location 7732df173d9SMahesh Salgaonkar * specified during fadump registration. We need to create a separate 7742df173d9SMahesh Salgaonkar * program header for this chunk with the correct offset. 7752df173d9SMahesh Salgaonkar */ 776e4fc48fbSHari Bathini ret = fadump_add_mem_range(&crash_mrange_info, 777e4fc48fbSHari Bathini RMA_START, fw_dump.boot_memory_size); 7781bd6a1c4SHari Bathini if (ret) 7791bd6a1c4SHari Bathini return ret; 7802df173d9SMahesh Salgaonkar 7812df173d9SMahesh Salgaonkar for_each_memblock(memory, reg) { 782e4fc48fbSHari Bathini start = (u64)reg->base; 783e4fc48fbSHari Bathini end = start + (u64)reg->size; 784a77af552SHari Bathini 785a77af552SHari Bathini /* 786a77af552SHari Bathini * skip the first memory chunk that is already added (RMA_START 787a77af552SHari Bathini * through boot_memory_size). This logic needs a relook if and 788a77af552SHari Bathini * when RMA_START changes to a non-zero value. 789a77af552SHari Bathini */ 790a77af552SHari Bathini BUILD_BUG_ON(RMA_START != 0); 791a77af552SHari Bathini if (start < fw_dump.boot_memory_size) { 792a77af552SHari Bathini if (end > fw_dump.boot_memory_size) 7932df173d9SMahesh Salgaonkar start = fw_dump.boot_memory_size; 794a77af552SHari Bathini else 795a77af552SHari Bathini continue; 796a77af552SHari Bathini } 7972df173d9SMahesh Salgaonkar 7982df173d9SMahesh Salgaonkar /* add this range excluding the reserved dump area. */ 7991bd6a1c4SHari Bathini ret = fadump_exclude_reserved_area(start, end); 8001bd6a1c4SHari Bathini if (ret) 8011bd6a1c4SHari Bathini return ret; 8022df173d9SMahesh Salgaonkar } 8031bd6a1c4SHari Bathini 8041bd6a1c4SHari Bathini return 0; 8052df173d9SMahesh Salgaonkar } 8062df173d9SMahesh Salgaonkar 807d34c5f26SMahesh Salgaonkar /* 808d34c5f26SMahesh Salgaonkar * If the given physical address falls within the boot memory region then 809d34c5f26SMahesh Salgaonkar * return the relocated address that points to the dump region reserved 810d34c5f26SMahesh Salgaonkar * for saving initial boot memory contents. 811d34c5f26SMahesh Salgaonkar */ 812d34c5f26SMahesh Salgaonkar static inline unsigned long fadump_relocate(unsigned long paddr) 813d34c5f26SMahesh Salgaonkar { 814d34c5f26SMahesh Salgaonkar if (paddr > RMA_START && paddr < fw_dump.boot_memory_size) 81541a65d16SHari Bathini return fw_dump.boot_mem_dest_addr + paddr; 816d34c5f26SMahesh Salgaonkar else 817d34c5f26SMahesh Salgaonkar return paddr; 818d34c5f26SMahesh Salgaonkar } 819d34c5f26SMahesh Salgaonkar 8202df173d9SMahesh Salgaonkar static int fadump_create_elfcore_headers(char *bufp) 8212df173d9SMahesh Salgaonkar { 8222df173d9SMahesh Salgaonkar struct elfhdr *elf; 8232df173d9SMahesh Salgaonkar struct elf_phdr *phdr; 8242df173d9SMahesh Salgaonkar int i; 8252df173d9SMahesh Salgaonkar 8262df173d9SMahesh Salgaonkar fadump_init_elfcore_header(bufp); 8272df173d9SMahesh Salgaonkar elf = (struct elfhdr *)bufp; 8282df173d9SMahesh Salgaonkar bufp += sizeof(struct elfhdr); 8292df173d9SMahesh Salgaonkar 830ebaeb5aeSMahesh Salgaonkar /* 831ebaeb5aeSMahesh Salgaonkar * setup ELF PT_NOTE, place holder for cpu notes info. The notes info 832ebaeb5aeSMahesh Salgaonkar * will be populated during second kernel boot after crash. Hence 833ebaeb5aeSMahesh Salgaonkar * this PT_NOTE will always be the first elf note. 834ebaeb5aeSMahesh Salgaonkar * 835ebaeb5aeSMahesh Salgaonkar * NOTE: Any new ELF note addition should be placed after this note. 836ebaeb5aeSMahesh Salgaonkar */ 837ebaeb5aeSMahesh Salgaonkar phdr = (struct elf_phdr *)bufp; 838ebaeb5aeSMahesh Salgaonkar bufp += sizeof(struct elf_phdr); 839ebaeb5aeSMahesh Salgaonkar phdr->p_type = PT_NOTE; 840ebaeb5aeSMahesh Salgaonkar phdr->p_flags = 0; 841ebaeb5aeSMahesh Salgaonkar phdr->p_vaddr = 0; 842ebaeb5aeSMahesh Salgaonkar phdr->p_align = 0; 843ebaeb5aeSMahesh Salgaonkar 844ebaeb5aeSMahesh Salgaonkar phdr->p_offset = 0; 845ebaeb5aeSMahesh Salgaonkar phdr->p_paddr = 0; 846ebaeb5aeSMahesh Salgaonkar phdr->p_filesz = 0; 847ebaeb5aeSMahesh Salgaonkar phdr->p_memsz = 0; 848ebaeb5aeSMahesh Salgaonkar 849ebaeb5aeSMahesh Salgaonkar (elf->e_phnum)++; 850ebaeb5aeSMahesh Salgaonkar 851d34c5f26SMahesh Salgaonkar /* setup ELF PT_NOTE for vmcoreinfo */ 852d34c5f26SMahesh Salgaonkar phdr = (struct elf_phdr *)bufp; 853d34c5f26SMahesh Salgaonkar bufp += sizeof(struct elf_phdr); 854d34c5f26SMahesh Salgaonkar phdr->p_type = PT_NOTE; 855d34c5f26SMahesh Salgaonkar phdr->p_flags = 0; 856d34c5f26SMahesh Salgaonkar phdr->p_vaddr = 0; 857d34c5f26SMahesh Salgaonkar phdr->p_align = 0; 858d34c5f26SMahesh Salgaonkar 859d34c5f26SMahesh Salgaonkar phdr->p_paddr = fadump_relocate(paddr_vmcoreinfo_note()); 860d34c5f26SMahesh Salgaonkar phdr->p_offset = phdr->p_paddr; 8615203f499SXunlei Pang phdr->p_memsz = phdr->p_filesz = VMCOREINFO_NOTE_SIZE; 862d34c5f26SMahesh Salgaonkar 863d34c5f26SMahesh Salgaonkar /* Increment number of program headers. */ 864d34c5f26SMahesh Salgaonkar (elf->e_phnum)++; 865d34c5f26SMahesh Salgaonkar 8662df173d9SMahesh Salgaonkar /* setup PT_LOAD sections. */ 8672df173d9SMahesh Salgaonkar 868e4fc48fbSHari Bathini for (i = 0; i < crash_mrange_info.mem_range_cnt; i++) { 869e4fc48fbSHari Bathini u64 mbase, msize; 8702df173d9SMahesh Salgaonkar 871e4fc48fbSHari Bathini mbase = crash_mrange_info.mem_ranges[i].base; 872e4fc48fbSHari Bathini msize = crash_mrange_info.mem_ranges[i].size; 8732df173d9SMahesh Salgaonkar if (!msize) 8742df173d9SMahesh Salgaonkar continue; 8752df173d9SMahesh Salgaonkar 8762df173d9SMahesh Salgaonkar phdr = (struct elf_phdr *)bufp; 8772df173d9SMahesh Salgaonkar bufp += sizeof(struct elf_phdr); 8782df173d9SMahesh Salgaonkar phdr->p_type = PT_LOAD; 8792df173d9SMahesh Salgaonkar phdr->p_flags = PF_R|PF_W|PF_X; 8802df173d9SMahesh Salgaonkar phdr->p_offset = mbase; 8812df173d9SMahesh Salgaonkar 8822df173d9SMahesh Salgaonkar if (mbase == RMA_START) { 8832df173d9SMahesh Salgaonkar /* 8842df173d9SMahesh Salgaonkar * The entire RMA region will be moved by firmware 8852df173d9SMahesh Salgaonkar * to the specified destination_address. Hence set 8862df173d9SMahesh Salgaonkar * the correct offset. 8872df173d9SMahesh Salgaonkar */ 88841a65d16SHari Bathini phdr->p_offset = fw_dump.boot_mem_dest_addr; 8892df173d9SMahesh Salgaonkar } 8902df173d9SMahesh Salgaonkar 8912df173d9SMahesh Salgaonkar phdr->p_paddr = mbase; 8922df173d9SMahesh Salgaonkar phdr->p_vaddr = (unsigned long)__va(mbase); 8932df173d9SMahesh Salgaonkar phdr->p_filesz = msize; 8942df173d9SMahesh Salgaonkar phdr->p_memsz = msize; 8952df173d9SMahesh Salgaonkar phdr->p_align = 0; 8962df173d9SMahesh Salgaonkar 8972df173d9SMahesh Salgaonkar /* Increment number of program headers. */ 8982df173d9SMahesh Salgaonkar (elf->e_phnum)++; 8992df173d9SMahesh Salgaonkar } 9002df173d9SMahesh Salgaonkar return 0; 9012df173d9SMahesh Salgaonkar } 9022df173d9SMahesh Salgaonkar 9032df173d9SMahesh Salgaonkar static unsigned long init_fadump_header(unsigned long addr) 9042df173d9SMahesh Salgaonkar { 9052df173d9SMahesh Salgaonkar struct fadump_crash_info_header *fdh; 9062df173d9SMahesh Salgaonkar 9072df173d9SMahesh Salgaonkar if (!addr) 9082df173d9SMahesh Salgaonkar return 0; 9092df173d9SMahesh Salgaonkar 9102df173d9SMahesh Salgaonkar fdh = __va(addr); 9112df173d9SMahesh Salgaonkar addr += sizeof(struct fadump_crash_info_header); 9122df173d9SMahesh Salgaonkar 9132df173d9SMahesh Salgaonkar memset(fdh, 0, sizeof(struct fadump_crash_info_header)); 9142df173d9SMahesh Salgaonkar fdh->magic_number = FADUMP_CRASH_INFO_MAGIC; 9152df173d9SMahesh Salgaonkar fdh->elfcorehdr_addr = addr; 916ebaeb5aeSMahesh Salgaonkar /* We will set the crashing cpu id in crash_fadump() during crash. */ 9170226e552SHari Bathini fdh->crashing_cpu = FADUMP_CPU_UNKNOWN; 9182df173d9SMahesh Salgaonkar 9192df173d9SMahesh Salgaonkar return addr; 9202df173d9SMahesh Salgaonkar } 9212df173d9SMahesh Salgaonkar 92298b8cd7fSMichal Suchanek static int register_fadump(void) 9233ccc00a7SMahesh Salgaonkar { 9242df173d9SMahesh Salgaonkar unsigned long addr; 9252df173d9SMahesh Salgaonkar void *vaddr; 9261bd6a1c4SHari Bathini int ret; 9272df173d9SMahesh Salgaonkar 9283ccc00a7SMahesh Salgaonkar /* 9293ccc00a7SMahesh Salgaonkar * If no memory is reserved then we can not register for firmware- 9303ccc00a7SMahesh Salgaonkar * assisted dump. 9313ccc00a7SMahesh Salgaonkar */ 9323ccc00a7SMahesh Salgaonkar if (!fw_dump.reserve_dump_area_size) 93398b8cd7fSMichal Suchanek return -ENODEV; 9343ccc00a7SMahesh Salgaonkar 9351bd6a1c4SHari Bathini ret = fadump_setup_crash_memory_ranges(); 9361bd6a1c4SHari Bathini if (ret) 9371bd6a1c4SHari Bathini return ret; 9382df173d9SMahesh Salgaonkar 93941a65d16SHari Bathini addr = fw_dump.fadumphdr_addr; 94041a65d16SHari Bathini 9412df173d9SMahesh Salgaonkar /* Initialize fadump crash info header. */ 9422df173d9SMahesh Salgaonkar addr = init_fadump_header(addr); 9432df173d9SMahesh Salgaonkar vaddr = __va(addr); 9442df173d9SMahesh Salgaonkar 9452df173d9SMahesh Salgaonkar pr_debug("Creating ELF core headers at %#016lx\n", addr); 9462df173d9SMahesh Salgaonkar fadump_create_elfcore_headers(vaddr); 9472df173d9SMahesh Salgaonkar 9483ccc00a7SMahesh Salgaonkar /* register the future kernel dump with firmware. */ 94941a65d16SHari Bathini pr_debug("Registering for firmware-assisted kernel dump...\n"); 95041a65d16SHari Bathini return fw_dump.ops->fadump_register(&fw_dump); 9513ccc00a7SMahesh Salgaonkar } 9523ccc00a7SMahesh Salgaonkar 953b500afffSMahesh Salgaonkar void fadump_cleanup(void) 954b500afffSMahesh Salgaonkar { 9552790d01dSHari Bathini if (!fw_dump.fadump_supported) 9562790d01dSHari Bathini return; 9572790d01dSHari Bathini 958b500afffSMahesh Salgaonkar /* Invalidate the registration only if dump is active. */ 959b500afffSMahesh Salgaonkar if (fw_dump.dump_active) { 960f3512011SHari Bathini pr_debug("Invalidating firmware-assisted dump registration\n"); 961f3512011SHari Bathini fw_dump.ops->fadump_invalidate(&fw_dump); 962722cde76SMahesh Salgaonkar } else if (fw_dump.dump_registered) { 963722cde76SMahesh Salgaonkar /* Un-register Firmware-assisted dump if it was registered. */ 96441a65d16SHari Bathini fw_dump.ops->fadump_unregister(&fw_dump); 965e4fc48fbSHari Bathini fadump_free_mem_ranges(&crash_mrange_info); 966b500afffSMahesh Salgaonkar } 9672790d01dSHari Bathini 9682790d01dSHari Bathini if (fw_dump.ops->fadump_cleanup) 9692790d01dSHari Bathini fw_dump.ops->fadump_cleanup(&fw_dump); 970b500afffSMahesh Salgaonkar } 971b500afffSMahesh Salgaonkar 97268fa6478SHari Bathini static void fadump_free_reserved_memory(unsigned long start_pfn, 97368fa6478SHari Bathini unsigned long end_pfn) 97468fa6478SHari Bathini { 97568fa6478SHari Bathini unsigned long pfn; 97668fa6478SHari Bathini unsigned long time_limit = jiffies + HZ; 97768fa6478SHari Bathini 97868fa6478SHari Bathini pr_info("freeing reserved memory (0x%llx - 0x%llx)\n", 97968fa6478SHari Bathini PFN_PHYS(start_pfn), PFN_PHYS(end_pfn)); 98068fa6478SHari Bathini 98168fa6478SHari Bathini for (pfn = start_pfn; pfn < end_pfn; pfn++) { 98268fa6478SHari Bathini free_reserved_page(pfn_to_page(pfn)); 98368fa6478SHari Bathini 98468fa6478SHari Bathini if (time_after(jiffies, time_limit)) { 98568fa6478SHari Bathini cond_resched(); 98668fa6478SHari Bathini time_limit = jiffies + HZ; 98768fa6478SHari Bathini } 98868fa6478SHari Bathini } 98968fa6478SHari Bathini } 99068fa6478SHari Bathini 99168fa6478SHari Bathini /* 99268fa6478SHari Bathini * Skip memory holes and free memory that was actually reserved. 99368fa6478SHari Bathini */ 994dda9dbfeSHari Bathini static void fadump_release_reserved_area(u64 start, u64 end) 99568fa6478SHari Bathini { 996dda9dbfeSHari Bathini u64 tstart, tend, spfn, epfn; 99768fa6478SHari Bathini struct memblock_region *reg; 99868fa6478SHari Bathini 999dda9dbfeSHari Bathini spfn = PHYS_PFN(start); 1000dda9dbfeSHari Bathini epfn = PHYS_PFN(end); 100168fa6478SHari Bathini for_each_memblock(memory, reg) { 1002dda9dbfeSHari Bathini tstart = max_t(u64, spfn, memblock_region_memory_base_pfn(reg)); 1003dda9dbfeSHari Bathini tend = min_t(u64, epfn, memblock_region_memory_end_pfn(reg)); 100468fa6478SHari Bathini if (tstart < tend) { 100568fa6478SHari Bathini fadump_free_reserved_memory(tstart, tend); 100668fa6478SHari Bathini 1007dda9dbfeSHari Bathini if (tend == epfn) 100868fa6478SHari Bathini break; 100968fa6478SHari Bathini 1010dda9dbfeSHari Bathini spfn = tend; 101168fa6478SHari Bathini } 101268fa6478SHari Bathini } 101368fa6478SHari Bathini } 101468fa6478SHari Bathini 1015b500afffSMahesh Salgaonkar /* 1016dda9dbfeSHari Bathini * Sort the mem ranges in-place and merge adjacent ranges 1017dda9dbfeSHari Bathini * to minimize the memory ranges count. 1018b500afffSMahesh Salgaonkar */ 1019dda9dbfeSHari Bathini static void sort_and_merge_mem_ranges(struct fadump_mrange_info *mrange_info) 1020b500afffSMahesh Salgaonkar { 1021dda9dbfeSHari Bathini struct fadump_memory_range *mem_ranges; 1022dda9dbfeSHari Bathini struct fadump_memory_range tmp_range; 1023dda9dbfeSHari Bathini u64 base, size; 1024dda9dbfeSHari Bathini int i, j, idx; 1025dda9dbfeSHari Bathini 1026dda9dbfeSHari Bathini if (!reserved_mrange_info.mem_range_cnt) 1027dda9dbfeSHari Bathini return; 1028dda9dbfeSHari Bathini 1029dda9dbfeSHari Bathini /* Sort the memory ranges */ 1030dda9dbfeSHari Bathini mem_ranges = mrange_info->mem_ranges; 1031dda9dbfeSHari Bathini for (i = 0; i < mrange_info->mem_range_cnt; i++) { 1032dda9dbfeSHari Bathini idx = i; 1033dda9dbfeSHari Bathini for (j = (i + 1); j < mrange_info->mem_range_cnt; j++) { 1034dda9dbfeSHari Bathini if (mem_ranges[idx].base > mem_ranges[j].base) 1035dda9dbfeSHari Bathini idx = j; 1036dda9dbfeSHari Bathini } 1037dda9dbfeSHari Bathini if (idx != i) { 1038dda9dbfeSHari Bathini tmp_range = mem_ranges[idx]; 1039dda9dbfeSHari Bathini mem_ranges[idx] = mem_ranges[i]; 1040dda9dbfeSHari Bathini mem_ranges[i] = tmp_range; 1041dda9dbfeSHari Bathini } 1042dda9dbfeSHari Bathini } 1043dda9dbfeSHari Bathini 1044dda9dbfeSHari Bathini /* Merge adjacent reserved ranges */ 1045dda9dbfeSHari Bathini idx = 0; 1046dda9dbfeSHari Bathini for (i = 1; i < mrange_info->mem_range_cnt; i++) { 1047dda9dbfeSHari Bathini base = mem_ranges[i-1].base; 1048dda9dbfeSHari Bathini size = mem_ranges[i-1].size; 1049dda9dbfeSHari Bathini if (mem_ranges[i].base == (base + size)) 1050dda9dbfeSHari Bathini mem_ranges[idx].size += mem_ranges[i].size; 1051dda9dbfeSHari Bathini else { 1052dda9dbfeSHari Bathini idx++; 1053dda9dbfeSHari Bathini if (i == idx) 1054dda9dbfeSHari Bathini continue; 1055dda9dbfeSHari Bathini 1056dda9dbfeSHari Bathini mem_ranges[idx] = mem_ranges[i]; 1057dda9dbfeSHari Bathini } 1058dda9dbfeSHari Bathini } 1059dda9dbfeSHari Bathini mrange_info->mem_range_cnt = idx + 1; 1060dda9dbfeSHari Bathini } 1061dda9dbfeSHari Bathini 1062dda9dbfeSHari Bathini /* 1063dda9dbfeSHari Bathini * Scan reserved-ranges to consider them while reserving/releasing 1064dda9dbfeSHari Bathini * memory for FADump. 1065dda9dbfeSHari Bathini */ 1066dda9dbfeSHari Bathini static inline int fadump_scan_reserved_mem_ranges(void) 1067dda9dbfeSHari Bathini { 1068dda9dbfeSHari Bathini struct device_node *root; 1069dda9dbfeSHari Bathini const __be32 *prop; 1070dda9dbfeSHari Bathini int len, ret = -1; 1071dda9dbfeSHari Bathini unsigned long i; 1072dda9dbfeSHari Bathini 1073dda9dbfeSHari Bathini root = of_find_node_by_path("/"); 1074dda9dbfeSHari Bathini if (!root) 1075dda9dbfeSHari Bathini return ret; 1076dda9dbfeSHari Bathini 1077dda9dbfeSHari Bathini prop = of_get_property(root, "reserved-ranges", &len); 1078dda9dbfeSHari Bathini if (!prop) 1079dda9dbfeSHari Bathini return ret; 1080dda9dbfeSHari Bathini 1081dda9dbfeSHari Bathini /* 1082dda9dbfeSHari Bathini * Each reserved range is an (address,size) pair, 2 cells each, 1083dda9dbfeSHari Bathini * totalling 4 cells per range. 1084dda9dbfeSHari Bathini */ 1085dda9dbfeSHari Bathini for (i = 0; i < len / (sizeof(*prop) * 4); i++) { 1086dda9dbfeSHari Bathini u64 base, size; 1087dda9dbfeSHari Bathini 1088dda9dbfeSHari Bathini base = of_read_number(prop + (i * 4) + 0, 2); 1089dda9dbfeSHari Bathini size = of_read_number(prop + (i * 4) + 2, 2); 1090dda9dbfeSHari Bathini 1091dda9dbfeSHari Bathini if (size) { 1092dda9dbfeSHari Bathini ret = fadump_add_mem_range(&reserved_mrange_info, 1093dda9dbfeSHari Bathini base, base + size); 1094dda9dbfeSHari Bathini if (ret < 0) { 1095dda9dbfeSHari Bathini pr_warn("some reserved ranges are ignored!\n"); 1096dda9dbfeSHari Bathini break; 1097dda9dbfeSHari Bathini } 1098dda9dbfeSHari Bathini } 1099dda9dbfeSHari Bathini } 1100dda9dbfeSHari Bathini 1101dda9dbfeSHari Bathini return ret; 1102dda9dbfeSHari Bathini } 1103dda9dbfeSHari Bathini 1104dda9dbfeSHari Bathini /* 1105dda9dbfeSHari Bathini * Release the memory that was reserved during early boot to preserve the 1106dda9dbfeSHari Bathini * crash'ed kernel's memory contents except reserved dump area (permanent 1107dda9dbfeSHari Bathini * reservation) and reserved ranges used by F/W. The released memory will 1108dda9dbfeSHari Bathini * be available for general use. 1109dda9dbfeSHari Bathini */ 1110dda9dbfeSHari Bathini static void fadump_release_memory(u64 begin, u64 end) 1111dda9dbfeSHari Bathini { 1112dda9dbfeSHari Bathini u64 ra_start, ra_end, tstart; 1113dda9dbfeSHari Bathini int i, ret; 1114dda9dbfeSHari Bathini 1115dda9dbfeSHari Bathini fadump_scan_reserved_mem_ranges(); 1116b500afffSMahesh Salgaonkar 1117b500afffSMahesh Salgaonkar ra_start = fw_dump.reserve_dump_area_start; 1118b500afffSMahesh Salgaonkar ra_end = ra_start + fw_dump.reserve_dump_area_size; 1119b500afffSMahesh Salgaonkar 1120b500afffSMahesh Salgaonkar /* 1121dda9dbfeSHari Bathini * Add reserved dump area to reserved ranges list 1122dda9dbfeSHari Bathini * and exclude all these ranges while releasing memory. 1123dda9dbfeSHari Bathini */ 1124dda9dbfeSHari Bathini ret = fadump_add_mem_range(&reserved_mrange_info, ra_start, ra_end); 1125dda9dbfeSHari Bathini if (ret != 0) { 1126dda9dbfeSHari Bathini /* 1127dda9dbfeSHari Bathini * Not enough memory to setup reserved ranges but the system is 1128dda9dbfeSHari Bathini * running shortage of memory. So, release all the memory except 1129dda9dbfeSHari Bathini * Reserved dump area (reused for next fadump registration). 1130b500afffSMahesh Salgaonkar */ 113168fa6478SHari Bathini if (begin < ra_end && end > ra_start) { 113268fa6478SHari Bathini if (begin < ra_start) 113368fa6478SHari Bathini fadump_release_reserved_area(begin, ra_start); 113468fa6478SHari Bathini if (end > ra_end) 113568fa6478SHari Bathini fadump_release_reserved_area(ra_end, end); 113668fa6478SHari Bathini } else 113768fa6478SHari Bathini fadump_release_reserved_area(begin, end); 1138dda9dbfeSHari Bathini 1139dda9dbfeSHari Bathini return; 1140dda9dbfeSHari Bathini } 1141dda9dbfeSHari Bathini 1142dda9dbfeSHari Bathini /* Get the reserved ranges list in order first. */ 1143dda9dbfeSHari Bathini sort_and_merge_mem_ranges(&reserved_mrange_info); 1144dda9dbfeSHari Bathini 1145dda9dbfeSHari Bathini /* Exclude reserved ranges and release remaining memory */ 1146dda9dbfeSHari Bathini tstart = begin; 1147dda9dbfeSHari Bathini for (i = 0; i < reserved_mrange_info.mem_range_cnt; i++) { 1148dda9dbfeSHari Bathini ra_start = reserved_mrange_info.mem_ranges[i].base; 1149dda9dbfeSHari Bathini ra_end = ra_start + reserved_mrange_info.mem_ranges[i].size; 1150dda9dbfeSHari Bathini 1151dda9dbfeSHari Bathini if (tstart >= ra_end) 1152dda9dbfeSHari Bathini continue; 1153dda9dbfeSHari Bathini 1154dda9dbfeSHari Bathini if (tstart < ra_start) 1155dda9dbfeSHari Bathini fadump_release_reserved_area(tstart, ra_start); 1156dda9dbfeSHari Bathini tstart = ra_end; 1157dda9dbfeSHari Bathini } 1158dda9dbfeSHari Bathini 1159dda9dbfeSHari Bathini if (tstart < end) 1160dda9dbfeSHari Bathini fadump_release_reserved_area(tstart, end); 1161b500afffSMahesh Salgaonkar } 1162b500afffSMahesh Salgaonkar 1163b500afffSMahesh Salgaonkar static void fadump_invalidate_release_mem(void) 1164b500afffSMahesh Salgaonkar { 1165b500afffSMahesh Salgaonkar mutex_lock(&fadump_mutex); 1166b500afffSMahesh Salgaonkar if (!fw_dump.dump_active) { 1167b500afffSMahesh Salgaonkar mutex_unlock(&fadump_mutex); 1168b500afffSMahesh Salgaonkar return; 1169b500afffSMahesh Salgaonkar } 1170b500afffSMahesh Salgaonkar 1171b500afffSMahesh Salgaonkar fadump_cleanup(); 1172b500afffSMahesh Salgaonkar mutex_unlock(&fadump_mutex); 1173b500afffSMahesh Salgaonkar 11748255da95SHari Bathini fadump_release_memory(fw_dump.boot_memory_size, memblock_end_of_DRAM()); 1175961cf26aSHari Bathini fadump_free_cpu_notes_buf(); 1176961cf26aSHari Bathini 1177a4e2e2caSHari Bathini /* 1178a4e2e2caSHari Bathini * Setup kernel metadata and initialize the kernel dump 1179a4e2e2caSHari Bathini * memory structure for FADump re-registration. 1180a4e2e2caSHari Bathini */ 1181a4e2e2caSHari Bathini if (fw_dump.ops->fadump_setup_metadata && 1182a4e2e2caSHari Bathini (fw_dump.ops->fadump_setup_metadata(&fw_dump) < 0)) 1183a4e2e2caSHari Bathini pr_warn("Failed to setup kernel metadata!\n"); 118441a65d16SHari Bathini fw_dump.ops->fadump_init_mem_struct(&fw_dump); 1185b500afffSMahesh Salgaonkar } 1186b500afffSMahesh Salgaonkar 1187b500afffSMahesh Salgaonkar static ssize_t fadump_release_memory_store(struct kobject *kobj, 1188b500afffSMahesh Salgaonkar struct kobj_attribute *attr, 1189b500afffSMahesh Salgaonkar const char *buf, size_t count) 1190b500afffSMahesh Salgaonkar { 1191dcdc4679SMichal Suchanek int input = -1; 1192dcdc4679SMichal Suchanek 1193b500afffSMahesh Salgaonkar if (!fw_dump.dump_active) 1194b500afffSMahesh Salgaonkar return -EPERM; 1195b500afffSMahesh Salgaonkar 1196dcdc4679SMichal Suchanek if (kstrtoint(buf, 0, &input)) 1197dcdc4679SMichal Suchanek return -EINVAL; 1198dcdc4679SMichal Suchanek 1199dcdc4679SMichal Suchanek if (input == 1) { 1200b500afffSMahesh Salgaonkar /* 1201b500afffSMahesh Salgaonkar * Take away the '/proc/vmcore'. We are releasing the dump 1202b500afffSMahesh Salgaonkar * memory, hence it will not be valid anymore. 1203b500afffSMahesh Salgaonkar */ 12042685f826SMichael Ellerman #ifdef CONFIG_PROC_VMCORE 1205b500afffSMahesh Salgaonkar vmcore_cleanup(); 12062685f826SMichael Ellerman #endif 1207b500afffSMahesh Salgaonkar fadump_invalidate_release_mem(); 1208b500afffSMahesh Salgaonkar 1209b500afffSMahesh Salgaonkar } else 1210b500afffSMahesh Salgaonkar return -EINVAL; 1211b500afffSMahesh Salgaonkar return count; 1212b500afffSMahesh Salgaonkar } 1213b500afffSMahesh Salgaonkar 12143ccc00a7SMahesh Salgaonkar static ssize_t fadump_enabled_show(struct kobject *kobj, 12153ccc00a7SMahesh Salgaonkar struct kobj_attribute *attr, 12163ccc00a7SMahesh Salgaonkar char *buf) 12173ccc00a7SMahesh Salgaonkar { 12183ccc00a7SMahesh Salgaonkar return sprintf(buf, "%d\n", fw_dump.fadump_enabled); 12193ccc00a7SMahesh Salgaonkar } 12203ccc00a7SMahesh Salgaonkar 12213ccc00a7SMahesh Salgaonkar static ssize_t fadump_register_show(struct kobject *kobj, 12223ccc00a7SMahesh Salgaonkar struct kobj_attribute *attr, 12233ccc00a7SMahesh Salgaonkar char *buf) 12243ccc00a7SMahesh Salgaonkar { 12253ccc00a7SMahesh Salgaonkar return sprintf(buf, "%d\n", fw_dump.dump_registered); 12263ccc00a7SMahesh Salgaonkar } 12273ccc00a7SMahesh Salgaonkar 12283ccc00a7SMahesh Salgaonkar static ssize_t fadump_register_store(struct kobject *kobj, 12293ccc00a7SMahesh Salgaonkar struct kobj_attribute *attr, 12303ccc00a7SMahesh Salgaonkar const char *buf, size_t count) 12313ccc00a7SMahesh Salgaonkar { 12323ccc00a7SMahesh Salgaonkar int ret = 0; 1233dcdc4679SMichal Suchanek int input = -1; 12343ccc00a7SMahesh Salgaonkar 1235f3512011SHari Bathini if (!fw_dump.fadump_enabled || fw_dump.dump_active) 12363ccc00a7SMahesh Salgaonkar return -EPERM; 12373ccc00a7SMahesh Salgaonkar 1238dcdc4679SMichal Suchanek if (kstrtoint(buf, 0, &input)) 1239dcdc4679SMichal Suchanek return -EINVAL; 1240dcdc4679SMichal Suchanek 12413ccc00a7SMahesh Salgaonkar mutex_lock(&fadump_mutex); 12423ccc00a7SMahesh Salgaonkar 1243dcdc4679SMichal Suchanek switch (input) { 1244dcdc4679SMichal Suchanek case 0: 12453ccc00a7SMahesh Salgaonkar if (fw_dump.dump_registered == 0) { 12463ccc00a7SMahesh Salgaonkar goto unlock_out; 12473ccc00a7SMahesh Salgaonkar } 1248f3512011SHari Bathini 12493ccc00a7SMahesh Salgaonkar /* Un-register Firmware-assisted dump */ 125041a65d16SHari Bathini pr_debug("Un-register firmware-assisted dump\n"); 125141a65d16SHari Bathini fw_dump.ops->fadump_unregister(&fw_dump); 12523ccc00a7SMahesh Salgaonkar break; 1253dcdc4679SMichal Suchanek case 1: 12543ccc00a7SMahesh Salgaonkar if (fw_dump.dump_registered == 1) { 12550823c68bSHari Bathini /* Un-register Firmware-assisted dump */ 125641a65d16SHari Bathini fw_dump.ops->fadump_unregister(&fw_dump); 12573ccc00a7SMahesh Salgaonkar } 12583ccc00a7SMahesh Salgaonkar /* Register Firmware-assisted dump */ 125998b8cd7fSMichal Suchanek ret = register_fadump(); 12603ccc00a7SMahesh Salgaonkar break; 12613ccc00a7SMahesh Salgaonkar default: 12623ccc00a7SMahesh Salgaonkar ret = -EINVAL; 12633ccc00a7SMahesh Salgaonkar break; 12643ccc00a7SMahesh Salgaonkar } 12653ccc00a7SMahesh Salgaonkar 12663ccc00a7SMahesh Salgaonkar unlock_out: 12673ccc00a7SMahesh Salgaonkar mutex_unlock(&fadump_mutex); 12683ccc00a7SMahesh Salgaonkar return ret < 0 ? ret : count; 12693ccc00a7SMahesh Salgaonkar } 12703ccc00a7SMahesh Salgaonkar 12713ccc00a7SMahesh Salgaonkar static int fadump_region_show(struct seq_file *m, void *private) 12723ccc00a7SMahesh Salgaonkar { 12733ccc00a7SMahesh Salgaonkar if (!fw_dump.fadump_enabled) 12743ccc00a7SMahesh Salgaonkar return 0; 12753ccc00a7SMahesh Salgaonkar 1276b500afffSMahesh Salgaonkar mutex_lock(&fadump_mutex); 127741a65d16SHari Bathini fw_dump.ops->fadump_region_show(&fw_dump, m); 1278b500afffSMahesh Salgaonkar mutex_unlock(&fadump_mutex); 12793ccc00a7SMahesh Salgaonkar return 0; 12803ccc00a7SMahesh Salgaonkar } 12813ccc00a7SMahesh Salgaonkar 1282b500afffSMahesh Salgaonkar static struct kobj_attribute fadump_release_attr = __ATTR(fadump_release_mem, 1283b500afffSMahesh Salgaonkar 0200, NULL, 1284b500afffSMahesh Salgaonkar fadump_release_memory_store); 12853ccc00a7SMahesh Salgaonkar static struct kobj_attribute fadump_attr = __ATTR(fadump_enabled, 12863ccc00a7SMahesh Salgaonkar 0444, fadump_enabled_show, 12873ccc00a7SMahesh Salgaonkar NULL); 12883ccc00a7SMahesh Salgaonkar static struct kobj_attribute fadump_register_attr = __ATTR(fadump_registered, 12893ccc00a7SMahesh Salgaonkar 0644, fadump_register_show, 12903ccc00a7SMahesh Salgaonkar fadump_register_store); 12913ccc00a7SMahesh Salgaonkar 1292f6cee260SYangtao Li DEFINE_SHOW_ATTRIBUTE(fadump_region); 12933ccc00a7SMahesh Salgaonkar 12943ccc00a7SMahesh Salgaonkar static void fadump_init_files(void) 12953ccc00a7SMahesh Salgaonkar { 12963ccc00a7SMahesh Salgaonkar struct dentry *debugfs_file; 12973ccc00a7SMahesh Salgaonkar int rc = 0; 12983ccc00a7SMahesh Salgaonkar 12993ccc00a7SMahesh Salgaonkar rc = sysfs_create_file(kernel_kobj, &fadump_attr.attr); 13003ccc00a7SMahesh Salgaonkar if (rc) 13013ccc00a7SMahesh Salgaonkar printk(KERN_ERR "fadump: unable to create sysfs file" 13023ccc00a7SMahesh Salgaonkar " fadump_enabled (%d)\n", rc); 13033ccc00a7SMahesh Salgaonkar 13043ccc00a7SMahesh Salgaonkar rc = sysfs_create_file(kernel_kobj, &fadump_register_attr.attr); 13053ccc00a7SMahesh Salgaonkar if (rc) 13063ccc00a7SMahesh Salgaonkar printk(KERN_ERR "fadump: unable to create sysfs file" 13073ccc00a7SMahesh Salgaonkar " fadump_registered (%d)\n", rc); 13083ccc00a7SMahesh Salgaonkar 13093ccc00a7SMahesh Salgaonkar debugfs_file = debugfs_create_file("fadump_region", 0444, 13103ccc00a7SMahesh Salgaonkar powerpc_debugfs_root, NULL, 13113ccc00a7SMahesh Salgaonkar &fadump_region_fops); 13123ccc00a7SMahesh Salgaonkar if (!debugfs_file) 13133ccc00a7SMahesh Salgaonkar printk(KERN_ERR "fadump: unable to create debugfs file" 13143ccc00a7SMahesh Salgaonkar " fadump_region\n"); 1315b500afffSMahesh Salgaonkar 1316b500afffSMahesh Salgaonkar if (fw_dump.dump_active) { 1317b500afffSMahesh Salgaonkar rc = sysfs_create_file(kernel_kobj, &fadump_release_attr.attr); 1318b500afffSMahesh Salgaonkar if (rc) 1319b500afffSMahesh Salgaonkar printk(KERN_ERR "fadump: unable to create sysfs file" 1320b500afffSMahesh Salgaonkar " fadump_release_mem (%d)\n", rc); 1321b500afffSMahesh Salgaonkar } 13223ccc00a7SMahesh Salgaonkar return; 13233ccc00a7SMahesh Salgaonkar } 13243ccc00a7SMahesh Salgaonkar 13253ccc00a7SMahesh Salgaonkar /* 13263ccc00a7SMahesh Salgaonkar * Prepare for firmware-assisted dump. 13273ccc00a7SMahesh Salgaonkar */ 13283ccc00a7SMahesh Salgaonkar int __init setup_fadump(void) 13293ccc00a7SMahesh Salgaonkar { 13303ccc00a7SMahesh Salgaonkar if (!fw_dump.fadump_enabled) 13313ccc00a7SMahesh Salgaonkar return 0; 13323ccc00a7SMahesh Salgaonkar 13333ccc00a7SMahesh Salgaonkar if (!fw_dump.fadump_supported) { 13343ccc00a7SMahesh Salgaonkar printk(KERN_ERR "Firmware-assisted dump is not supported on" 13353ccc00a7SMahesh Salgaonkar " this hardware\n"); 13363ccc00a7SMahesh Salgaonkar return 0; 13373ccc00a7SMahesh Salgaonkar } 13383ccc00a7SMahesh Salgaonkar 13393ccc00a7SMahesh Salgaonkar fadump_show_config(); 13402df173d9SMahesh Salgaonkar /* 13412df173d9SMahesh Salgaonkar * If dump data is available then see if it is valid and prepare for 13422df173d9SMahesh Salgaonkar * saving it to the disk. 13432df173d9SMahesh Salgaonkar */ 1344b500afffSMahesh Salgaonkar if (fw_dump.dump_active) { 1345b500afffSMahesh Salgaonkar /* 1346b500afffSMahesh Salgaonkar * if dump process fails then invalidate the registration 1347b500afffSMahesh Salgaonkar * and release memory before proceeding for re-registration. 1348b500afffSMahesh Salgaonkar */ 1349f3512011SHari Bathini if (fw_dump.ops->fadump_process(&fw_dump) < 0) 1350b500afffSMahesh Salgaonkar fadump_invalidate_release_mem(); 1351b500afffSMahesh Salgaonkar } 13523ccc00a7SMahesh Salgaonkar /* Initialize the kernel dump memory structure for FAD registration. */ 13532df173d9SMahesh Salgaonkar else if (fw_dump.reserve_dump_area_size) 135441a65d16SHari Bathini fw_dump.ops->fadump_init_mem_struct(&fw_dump); 1355f3512011SHari Bathini 13563ccc00a7SMahesh Salgaonkar fadump_init_files(); 13573ccc00a7SMahesh Salgaonkar 13583ccc00a7SMahesh Salgaonkar return 1; 13593ccc00a7SMahesh Salgaonkar } 13603ccc00a7SMahesh Salgaonkar subsys_initcall(setup_fadump); 1361*b2a815a5SHari Bathini 1362*b2a815a5SHari Bathini /* Preserve everything above the base address */ 1363*b2a815a5SHari Bathini static void __init fadump_reserve_crash_area(u64 base) 1364*b2a815a5SHari Bathini { 1365*b2a815a5SHari Bathini struct memblock_region *reg; 1366*b2a815a5SHari Bathini u64 mstart, msize; 1367*b2a815a5SHari Bathini 1368*b2a815a5SHari Bathini for_each_memblock(memory, reg) { 1369*b2a815a5SHari Bathini mstart = reg->base; 1370*b2a815a5SHari Bathini msize = reg->size; 1371*b2a815a5SHari Bathini 1372*b2a815a5SHari Bathini if ((mstart + msize) < base) 1373*b2a815a5SHari Bathini continue; 1374*b2a815a5SHari Bathini 1375*b2a815a5SHari Bathini if (mstart < base) { 1376*b2a815a5SHari Bathini msize -= (base - mstart); 1377*b2a815a5SHari Bathini mstart = base; 1378*b2a815a5SHari Bathini } 1379*b2a815a5SHari Bathini 1380*b2a815a5SHari Bathini pr_info("Reserving %lluMB of memory at %#016llx for preserving crash data", 1381*b2a815a5SHari Bathini (msize >> 20), mstart); 1382*b2a815a5SHari Bathini memblock_reserve(mstart, msize); 1383*b2a815a5SHari Bathini } 1384*b2a815a5SHari Bathini } 1385