1 /* 2 * Copyright (C) 1995 Linus Torvalds 3 * 4 * Support of BIGMEM added by Gerhard Wichert, Siemens AG, July 1999 5 * 6 * Memory region support 7 * David Parsons <orc@pell.chi.il.us>, July-August 1999 8 * 9 * Added E820 sanitization routine (removes overlapping memory regions); 10 * Brian Moyle <bmoyle@mvista.com>, February 2001 11 * 12 * Moved CPU detection code to cpu/${cpu}.c 13 * Patrick Mochel <mochel@osdl.org>, March 2002 14 * 15 * Provisions for empty E820 memory regions (reported by certain BIOSes). 16 * Alex Achenbach <xela@slit.de>, December 2002. 17 * 18 */ 19 20 /* 21 * This file handles the architecture-dependent parts of initialization 22 */ 23 24 #include <linux/sched.h> 25 #include <linux/mm.h> 26 #include <linux/mmzone.h> 27 #include <linux/screen_info.h> 28 #include <linux/ioport.h> 29 #include <linux/acpi.h> 30 #include <linux/apm_bios.h> 31 #include <linux/initrd.h> 32 #include <linux/bootmem.h> 33 #include <linux/seq_file.h> 34 #include <linux/console.h> 35 #include <linux/mca.h> 36 #include <linux/root_dev.h> 37 #include <linux/highmem.h> 38 #include <linux/module.h> 39 #include <linux/efi.h> 40 #include <linux/init.h> 41 #include <linux/edd.h> 42 #include <linux/iscsi_ibft.h> 43 #include <linux/nodemask.h> 44 #include <linux/kexec.h> 45 #include <linux/dmi.h> 46 #include <linux/pfn.h> 47 #include <linux/pci.h> 48 #include <asm/pci-direct.h> 49 #include <linux/init_ohci1394_dma.h> 50 #include <linux/kvm_para.h> 51 52 #include <linux/errno.h> 53 #include <linux/kernel.h> 54 #include <linux/stddef.h> 55 #include <linux/unistd.h> 56 #include <linux/ptrace.h> 57 #include <linux/slab.h> 58 #include <linux/user.h> 59 #include <linux/delay.h> 60 61 #include <linux/kallsyms.h> 62 #include <linux/cpufreq.h> 63 #include <linux/dma-mapping.h> 64 #include <linux/ctype.h> 65 #include <linux/uaccess.h> 66 67 #include <linux/percpu.h> 68 #include <linux/crash_dump.h> 69 70 #include <video/edid.h> 71 72 #include <asm/mtrr.h> 73 #include <asm/apic.h> 74 #include <asm/e820.h> 75 #include <asm/mpspec.h> 76 #include <asm/setup.h> 77 #include <asm/arch_hooks.h> 78 #include <asm/efi.h> 79 #include <asm/sections.h> 80 #include <asm/dmi.h> 81 #include <asm/io_apic.h> 82 #include <asm/ist.h> 83 #include <asm/vmi.h> 84 #include <setup_arch.h> 85 #include <asm/bios_ebda.h> 86 #include <asm/cacheflush.h> 87 #include <asm/processor.h> 88 #include <asm/bugs.h> 89 90 #include <asm/system.h> 91 #include <asm/vsyscall.h> 92 #include <asm/smp.h> 93 #include <asm/desc.h> 94 #include <asm/dma.h> 95 #include <asm/iommu.h> 96 #include <asm/mmu_context.h> 97 #include <asm/proto.h> 98 99 #include <mach_apic.h> 100 #include <asm/paravirt.h> 101 102 #include <asm/percpu.h> 103 #include <asm/topology.h> 104 #include <asm/apicdef.h> 105 #ifdef CONFIG_X86_64 106 #include <asm/numa_64.h> 107 #endif 108 109 #ifndef ARCH_SETUP 110 #define ARCH_SETUP 111 #endif 112 113 #ifndef CONFIG_DEBUG_BOOT_PARAMS 114 struct boot_params __initdata boot_params; 115 #else 116 struct boot_params boot_params; 117 #endif 118 119 /* 120 * Machine setup.. 121 */ 122 static struct resource data_resource = { 123 .name = "Kernel data", 124 .start = 0, 125 .end = 0, 126 .flags = IORESOURCE_BUSY | IORESOURCE_MEM 127 }; 128 129 static struct resource code_resource = { 130 .name = "Kernel code", 131 .start = 0, 132 .end = 0, 133 .flags = IORESOURCE_BUSY | IORESOURCE_MEM 134 }; 135 136 static struct resource bss_resource = { 137 .name = "Kernel bss", 138 .start = 0, 139 .end = 0, 140 .flags = IORESOURCE_BUSY | IORESOURCE_MEM 141 }; 142 143 144 #ifdef CONFIG_X86_32 145 /* This value is set up by the early boot code to point to the value 146 immediately after the boot time page tables. It contains a *physical* 147 address, and must not be in the .bss segment! */ 148 unsigned long init_pg_tables_start __initdata = ~0UL; 149 unsigned long init_pg_tables_end __initdata = ~0UL; 150 151 static struct resource video_ram_resource = { 152 .name = "Video RAM area", 153 .start = 0xa0000, 154 .end = 0xbffff, 155 .flags = IORESOURCE_BUSY | IORESOURCE_MEM 156 }; 157 158 /* cpu data as detected by the assembly code in head.S */ 159 struct cpuinfo_x86 new_cpu_data __cpuinitdata = {0, 0, 0, 0, -1, 1, 0, 0, -1}; 160 /* common cpu data for all cpus */ 161 struct cpuinfo_x86 boot_cpu_data __read_mostly = {0, 0, 0, 0, -1, 1, 0, 0, -1}; 162 EXPORT_SYMBOL(boot_cpu_data); 163 static void set_mca_bus(int x) 164 { 165 #ifdef CONFIG_MCA 166 MCA_bus = x; 167 #endif 168 } 169 170 unsigned int def_to_bigsmp; 171 172 /* for MCA, but anyone else can use it if they want */ 173 unsigned int machine_id; 174 unsigned int machine_submodel_id; 175 unsigned int BIOS_revision; 176 177 struct apm_info apm_info; 178 EXPORT_SYMBOL(apm_info); 179 180 #if defined(CONFIG_X86_SPEEDSTEP_SMI) || \ 181 defined(CONFIG_X86_SPEEDSTEP_SMI_MODULE) 182 struct ist_info ist_info; 183 EXPORT_SYMBOL(ist_info); 184 #else 185 struct ist_info ist_info; 186 #endif 187 188 #else 189 struct cpuinfo_x86 boot_cpu_data __read_mostly; 190 EXPORT_SYMBOL(boot_cpu_data); 191 #endif 192 193 194 #if !defined(CONFIG_X86_PAE) || defined(CONFIG_X86_64) 195 unsigned long mmu_cr4_features; 196 #else 197 unsigned long mmu_cr4_features = X86_CR4_PAE; 198 #endif 199 200 /* Boot loader ID as an integer, for the benefit of proc_dointvec */ 201 int bootloader_type; 202 203 /* 204 * Early DMI memory 205 */ 206 int dmi_alloc_index; 207 char dmi_alloc_data[DMI_MAX_DATA]; 208 209 /* 210 * Setup options 211 */ 212 struct screen_info screen_info; 213 EXPORT_SYMBOL(screen_info); 214 struct edid_info edid_info; 215 EXPORT_SYMBOL_GPL(edid_info); 216 217 extern int root_mountflags; 218 219 unsigned long saved_video_mode; 220 221 #define RAMDISK_IMAGE_START_MASK 0x07FF 222 #define RAMDISK_PROMPT_FLAG 0x8000 223 #define RAMDISK_LOAD_FLAG 0x4000 224 225 static char __initdata command_line[COMMAND_LINE_SIZE]; 226 #ifdef CONFIG_CMDLINE_BOOL 227 static char __initdata builtin_cmdline[COMMAND_LINE_SIZE] = CONFIG_CMDLINE; 228 #endif 229 230 #if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE) 231 struct edd edd; 232 #ifdef CONFIG_EDD_MODULE 233 EXPORT_SYMBOL(edd); 234 #endif 235 /** 236 * copy_edd() - Copy the BIOS EDD information 237 * from boot_params into a safe place. 238 * 239 */ 240 static inline void copy_edd(void) 241 { 242 memcpy(edd.mbr_signature, boot_params.edd_mbr_sig_buffer, 243 sizeof(edd.mbr_signature)); 244 memcpy(edd.edd_info, boot_params.eddbuf, sizeof(edd.edd_info)); 245 edd.mbr_signature_nr = boot_params.edd_mbr_sig_buf_entries; 246 edd.edd_info_nr = boot_params.eddbuf_entries; 247 } 248 #else 249 static inline void copy_edd(void) 250 { 251 } 252 #endif 253 254 #ifdef CONFIG_BLK_DEV_INITRD 255 256 #ifdef CONFIG_X86_32 257 258 #define MAX_MAP_CHUNK (NR_FIX_BTMAPS << PAGE_SHIFT) 259 static void __init relocate_initrd(void) 260 { 261 262 u64 ramdisk_image = boot_params.hdr.ramdisk_image; 263 u64 ramdisk_size = boot_params.hdr.ramdisk_size; 264 u64 end_of_lowmem = max_low_pfn << PAGE_SHIFT; 265 u64 ramdisk_here; 266 unsigned long slop, clen, mapaddr; 267 char *p, *q; 268 269 /* We need to move the initrd down into lowmem */ 270 ramdisk_here = find_e820_area(0, end_of_lowmem, ramdisk_size, 271 PAGE_SIZE); 272 273 if (ramdisk_here == -1ULL) 274 panic("Cannot find place for new RAMDISK of size %lld\n", 275 ramdisk_size); 276 277 /* Note: this includes all the lowmem currently occupied by 278 the initrd, we rely on that fact to keep the data intact. */ 279 reserve_early(ramdisk_here, ramdisk_here + ramdisk_size, 280 "NEW RAMDISK"); 281 initrd_start = ramdisk_here + PAGE_OFFSET; 282 initrd_end = initrd_start + ramdisk_size; 283 printk(KERN_INFO "Allocated new RAMDISK: %08llx - %08llx\n", 284 ramdisk_here, ramdisk_here + ramdisk_size); 285 286 q = (char *)initrd_start; 287 288 /* Copy any lowmem portion of the initrd */ 289 if (ramdisk_image < end_of_lowmem) { 290 clen = end_of_lowmem - ramdisk_image; 291 p = (char *)__va(ramdisk_image); 292 memcpy(q, p, clen); 293 q += clen; 294 ramdisk_image += clen; 295 ramdisk_size -= clen; 296 } 297 298 /* Copy the highmem portion of the initrd */ 299 while (ramdisk_size) { 300 slop = ramdisk_image & ~PAGE_MASK; 301 clen = ramdisk_size; 302 if (clen > MAX_MAP_CHUNK-slop) 303 clen = MAX_MAP_CHUNK-slop; 304 mapaddr = ramdisk_image & PAGE_MASK; 305 p = early_memremap(mapaddr, clen+slop); 306 memcpy(q, p+slop, clen); 307 early_iounmap(p, clen+slop); 308 q += clen; 309 ramdisk_image += clen; 310 ramdisk_size -= clen; 311 } 312 /* high pages is not converted by early_res_to_bootmem */ 313 ramdisk_image = boot_params.hdr.ramdisk_image; 314 ramdisk_size = boot_params.hdr.ramdisk_size; 315 printk(KERN_INFO "Move RAMDISK from %016llx - %016llx to" 316 " %08llx - %08llx\n", 317 ramdisk_image, ramdisk_image + ramdisk_size - 1, 318 ramdisk_here, ramdisk_here + ramdisk_size - 1); 319 } 320 #endif 321 322 static void __init reserve_initrd(void) 323 { 324 u64 ramdisk_image = boot_params.hdr.ramdisk_image; 325 u64 ramdisk_size = boot_params.hdr.ramdisk_size; 326 u64 ramdisk_end = ramdisk_image + ramdisk_size; 327 u64 end_of_lowmem = max_low_pfn << PAGE_SHIFT; 328 329 if (!boot_params.hdr.type_of_loader || 330 !ramdisk_image || !ramdisk_size) 331 return; /* No initrd provided by bootloader */ 332 333 initrd_start = 0; 334 335 if (ramdisk_size >= (end_of_lowmem>>1)) { 336 free_early(ramdisk_image, ramdisk_end); 337 printk(KERN_ERR "initrd too large to handle, " 338 "disabling initrd\n"); 339 return; 340 } 341 342 printk(KERN_INFO "RAMDISK: %08llx - %08llx\n", ramdisk_image, 343 ramdisk_end); 344 345 346 if (ramdisk_end <= end_of_lowmem) { 347 /* All in lowmem, easy case */ 348 /* 349 * don't need to reserve again, already reserved early 350 * in i386_start_kernel 351 */ 352 initrd_start = ramdisk_image + PAGE_OFFSET; 353 initrd_end = initrd_start + ramdisk_size; 354 return; 355 } 356 357 #ifdef CONFIG_X86_32 358 relocate_initrd(); 359 #else 360 printk(KERN_ERR "initrd extends beyond end of memory " 361 "(0x%08llx > 0x%08llx)\ndisabling initrd\n", 362 ramdisk_end, end_of_lowmem); 363 initrd_start = 0; 364 #endif 365 free_early(ramdisk_image, ramdisk_end); 366 } 367 #else 368 static void __init reserve_initrd(void) 369 { 370 } 371 #endif /* CONFIG_BLK_DEV_INITRD */ 372 373 static void __init parse_setup_data(void) 374 { 375 struct setup_data *data; 376 u64 pa_data; 377 378 if (boot_params.hdr.version < 0x0209) 379 return; 380 pa_data = boot_params.hdr.setup_data; 381 while (pa_data) { 382 data = early_memremap(pa_data, PAGE_SIZE); 383 switch (data->type) { 384 case SETUP_E820_EXT: 385 parse_e820_ext(data, pa_data); 386 break; 387 default: 388 break; 389 } 390 pa_data = data->next; 391 early_iounmap(data, PAGE_SIZE); 392 } 393 } 394 395 static void __init e820_reserve_setup_data(void) 396 { 397 struct setup_data *data; 398 u64 pa_data; 399 int found = 0; 400 401 if (boot_params.hdr.version < 0x0209) 402 return; 403 pa_data = boot_params.hdr.setup_data; 404 while (pa_data) { 405 data = early_memremap(pa_data, sizeof(*data)); 406 e820_update_range(pa_data, sizeof(*data)+data->len, 407 E820_RAM, E820_RESERVED_KERN); 408 found = 1; 409 pa_data = data->next; 410 early_iounmap(data, sizeof(*data)); 411 } 412 if (!found) 413 return; 414 415 sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map); 416 memcpy(&e820_saved, &e820, sizeof(struct e820map)); 417 printk(KERN_INFO "extended physical RAM map:\n"); 418 e820_print_map("reserve setup_data"); 419 } 420 421 static void __init reserve_early_setup_data(void) 422 { 423 struct setup_data *data; 424 u64 pa_data; 425 char buf[32]; 426 427 if (boot_params.hdr.version < 0x0209) 428 return; 429 pa_data = boot_params.hdr.setup_data; 430 while (pa_data) { 431 data = early_memremap(pa_data, sizeof(*data)); 432 sprintf(buf, "setup data %x", data->type); 433 reserve_early(pa_data, pa_data+sizeof(*data)+data->len, buf); 434 pa_data = data->next; 435 early_iounmap(data, sizeof(*data)); 436 } 437 } 438 439 /* 440 * --------- Crashkernel reservation ------------------------------ 441 */ 442 443 #ifdef CONFIG_KEXEC 444 445 /** 446 * Reserve @size bytes of crashkernel memory at any suitable offset. 447 * 448 * @size: Size of the crashkernel memory to reserve. 449 * Returns the base address on success, and -1ULL on failure. 450 */ 451 unsigned long long __init find_and_reserve_crashkernel(unsigned long long size) 452 { 453 const unsigned long long alignment = 16<<20; /* 16M */ 454 unsigned long long start = 0LL; 455 456 while (1) { 457 int ret; 458 459 start = find_e820_area(start, ULONG_MAX, size, alignment); 460 if (start == -1ULL) 461 return start; 462 463 /* try to reserve it */ 464 ret = reserve_bootmem_generic(start, size, BOOTMEM_EXCLUSIVE); 465 if (ret >= 0) 466 return start; 467 468 start += alignment; 469 } 470 } 471 472 static inline unsigned long long get_total_mem(void) 473 { 474 unsigned long long total; 475 476 total = max_low_pfn - min_low_pfn; 477 #ifdef CONFIG_HIGHMEM 478 total += highend_pfn - highstart_pfn; 479 #endif 480 481 return total << PAGE_SHIFT; 482 } 483 484 static void __init reserve_crashkernel(void) 485 { 486 unsigned long long total_mem; 487 unsigned long long crash_size, crash_base; 488 int ret; 489 490 total_mem = get_total_mem(); 491 492 ret = parse_crashkernel(boot_command_line, total_mem, 493 &crash_size, &crash_base); 494 if (ret != 0 || crash_size <= 0) 495 return; 496 497 /* 0 means: find the address automatically */ 498 if (crash_base <= 0) { 499 crash_base = find_and_reserve_crashkernel(crash_size); 500 if (crash_base == -1ULL) { 501 pr_info("crashkernel reservation failed. " 502 "No suitable area found.\n"); 503 return; 504 } 505 } else { 506 ret = reserve_bootmem_generic(crash_base, crash_size, 507 BOOTMEM_EXCLUSIVE); 508 if (ret < 0) { 509 pr_info("crashkernel reservation failed - " 510 "memory is in use\n"); 511 return; 512 } 513 } 514 515 printk(KERN_INFO "Reserving %ldMB of memory at %ldMB " 516 "for crashkernel (System RAM: %ldMB)\n", 517 (unsigned long)(crash_size >> 20), 518 (unsigned long)(crash_base >> 20), 519 (unsigned long)(total_mem >> 20)); 520 521 crashk_res.start = crash_base; 522 crashk_res.end = crash_base + crash_size - 1; 523 insert_resource(&iomem_resource, &crashk_res); 524 } 525 #else 526 static void __init reserve_crashkernel(void) 527 { 528 } 529 #endif 530 531 static struct resource standard_io_resources[] = { 532 { .name = "dma1", .start = 0x00, .end = 0x1f, 533 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 534 { .name = "pic1", .start = 0x20, .end = 0x21, 535 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 536 { .name = "timer0", .start = 0x40, .end = 0x43, 537 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 538 { .name = "timer1", .start = 0x50, .end = 0x53, 539 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 540 { .name = "keyboard", .start = 0x60, .end = 0x60, 541 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 542 { .name = "keyboard", .start = 0x64, .end = 0x64, 543 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 544 { .name = "dma page reg", .start = 0x80, .end = 0x8f, 545 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 546 { .name = "pic2", .start = 0xa0, .end = 0xa1, 547 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 548 { .name = "dma2", .start = 0xc0, .end = 0xdf, 549 .flags = IORESOURCE_BUSY | IORESOURCE_IO }, 550 { .name = "fpu", .start = 0xf0, .end = 0xff, 551 .flags = IORESOURCE_BUSY | IORESOURCE_IO } 552 }; 553 554 static void __init reserve_standard_io_resources(void) 555 { 556 int i; 557 558 /* request I/O space for devices used on all i[345]86 PCs */ 559 for (i = 0; i < ARRAY_SIZE(standard_io_resources); i++) 560 request_resource(&ioport_resource, &standard_io_resources[i]); 561 562 } 563 564 /* 565 * Note: elfcorehdr_addr is not just limited to vmcore. It is also used by 566 * is_kdump_kernel() to determine if we are booting after a panic. Hence 567 * ifdef it under CONFIG_CRASH_DUMP and not CONFIG_PROC_VMCORE. 568 */ 569 570 #ifdef CONFIG_CRASH_DUMP 571 /* elfcorehdr= specifies the location of elf core header 572 * stored by the crashed kernel. This option will be passed 573 * by kexec loader to the capture kernel. 574 */ 575 static int __init setup_elfcorehdr(char *arg) 576 { 577 char *end; 578 if (!arg) 579 return -EINVAL; 580 elfcorehdr_addr = memparse(arg, &end); 581 return end > arg ? 0 : -EINVAL; 582 } 583 early_param("elfcorehdr", setup_elfcorehdr); 584 #endif 585 586 static struct x86_quirks default_x86_quirks __initdata; 587 588 struct x86_quirks *x86_quirks __initdata = &default_x86_quirks; 589 590 /* 591 * Some BIOSes seem to corrupt the low 64k of memory during events 592 * like suspend/resume and unplugging an HDMI cable. Reserve all 593 * remaining free memory in that area and fill it with a distinct 594 * pattern. 595 */ 596 #ifdef CONFIG_X86_CHECK_BIOS_CORRUPTION 597 #define MAX_SCAN_AREAS 8 598 599 static int __read_mostly memory_corruption_check = -1; 600 601 static unsigned __read_mostly corruption_check_size = 64*1024; 602 static unsigned __read_mostly corruption_check_period = 60; /* seconds */ 603 604 static struct e820entry scan_areas[MAX_SCAN_AREAS]; 605 static int num_scan_areas; 606 607 608 static int set_corruption_check(char *arg) 609 { 610 char *end; 611 612 memory_corruption_check = simple_strtol(arg, &end, 10); 613 614 return (*end == 0) ? 0 : -EINVAL; 615 } 616 early_param("memory_corruption_check", set_corruption_check); 617 618 static int set_corruption_check_period(char *arg) 619 { 620 char *end; 621 622 corruption_check_period = simple_strtoul(arg, &end, 10); 623 624 return (*end == 0) ? 0 : -EINVAL; 625 } 626 early_param("memory_corruption_check_period", set_corruption_check_period); 627 628 static int set_corruption_check_size(char *arg) 629 { 630 char *end; 631 unsigned size; 632 633 size = memparse(arg, &end); 634 635 if (*end == '\0') 636 corruption_check_size = size; 637 638 return (size == corruption_check_size) ? 0 : -EINVAL; 639 } 640 early_param("memory_corruption_check_size", set_corruption_check_size); 641 642 643 static void __init setup_bios_corruption_check(void) 644 { 645 u64 addr = PAGE_SIZE; /* assume first page is reserved anyway */ 646 647 if (memory_corruption_check == -1) { 648 memory_corruption_check = 649 #ifdef CONFIG_X86_BOOTPARAM_MEMORY_CORRUPTION_CHECK 650 1 651 #else 652 0 653 #endif 654 ; 655 } 656 657 if (corruption_check_size == 0) 658 memory_corruption_check = 0; 659 660 if (!memory_corruption_check) 661 return; 662 663 corruption_check_size = round_up(corruption_check_size, PAGE_SIZE); 664 665 while(addr < corruption_check_size && num_scan_areas < MAX_SCAN_AREAS) { 666 u64 size; 667 addr = find_e820_area_size(addr, &size, PAGE_SIZE); 668 669 if (addr == 0) 670 break; 671 672 if ((addr + size) > corruption_check_size) 673 size = corruption_check_size - addr; 674 675 if (size == 0) 676 break; 677 678 e820_update_range(addr, size, E820_RAM, E820_RESERVED); 679 scan_areas[num_scan_areas].addr = addr; 680 scan_areas[num_scan_areas].size = size; 681 num_scan_areas++; 682 683 /* Assume we've already mapped this early memory */ 684 memset(__va(addr), 0, size); 685 686 addr += size; 687 } 688 689 printk(KERN_INFO "Scanning %d areas for low memory corruption\n", 690 num_scan_areas); 691 update_e820(); 692 } 693 694 static struct timer_list periodic_check_timer; 695 696 void check_for_bios_corruption(void) 697 { 698 int i; 699 int corruption = 0; 700 701 if (!memory_corruption_check) 702 return; 703 704 for(i = 0; i < num_scan_areas; i++) { 705 unsigned long *addr = __va(scan_areas[i].addr); 706 unsigned long size = scan_areas[i].size; 707 708 for(; size; addr++, size -= sizeof(unsigned long)) { 709 if (!*addr) 710 continue; 711 printk(KERN_ERR "Corrupted low memory at %p (%lx phys) = %08lx\n", 712 addr, __pa(addr), *addr); 713 corruption = 1; 714 *addr = 0; 715 } 716 } 717 718 WARN(corruption, KERN_ERR "Memory corruption detected in low memory\n"); 719 } 720 721 static void periodic_check_for_corruption(unsigned long data) 722 { 723 check_for_bios_corruption(); 724 mod_timer(&periodic_check_timer, round_jiffies(jiffies + corruption_check_period*HZ)); 725 } 726 727 void start_periodic_check_for_corruption(void) 728 { 729 if (!memory_corruption_check || corruption_check_period == 0) 730 return; 731 732 printk(KERN_INFO "Scanning for low memory corruption every %d seconds\n", 733 corruption_check_period); 734 735 init_timer(&periodic_check_timer); 736 periodic_check_timer.function = &periodic_check_for_corruption; 737 periodic_check_for_corruption(0); 738 } 739 #endif 740 741 static int __init dmi_low_memory_corruption(const struct dmi_system_id *d) 742 { 743 printk(KERN_NOTICE 744 "%s detected: BIOS may corrupt low RAM, working it around.\n", 745 d->ident); 746 747 e820_update_range(0, 0x10000, E820_RAM, E820_RESERVED); 748 sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map); 749 750 return 0; 751 } 752 753 /* List of systems that have known low memory corruption BIOS problems */ 754 static struct dmi_system_id __initdata bad_bios_dmi_table[] = { 755 #ifdef CONFIG_X86_RESERVE_LOW_64K 756 { 757 .callback = dmi_low_memory_corruption, 758 .ident = "AMI BIOS", 759 .matches = { 760 DMI_MATCH(DMI_BIOS_VENDOR, "American Megatrends Inc."), 761 }, 762 }, 763 { 764 .callback = dmi_low_memory_corruption, 765 .ident = "Phoenix BIOS", 766 .matches = { 767 DMI_MATCH(DMI_BIOS_VENDOR, "Phoenix Technologies, LTD"), 768 }, 769 }, 770 #endif 771 {} 772 }; 773 774 /* 775 * Determine if we were loaded by an EFI loader. If so, then we have also been 776 * passed the efi memmap, systab, etc., so we should use these data structures 777 * for initialization. Note, the efi init code path is determined by the 778 * global efi_enabled. This allows the same kernel image to be used on existing 779 * systems (with a traditional BIOS) as well as on EFI systems. 780 */ 781 /* 782 * setup_arch - architecture-specific boot-time initializations 783 * 784 * Note: On x86_64, fixmaps are ready for use even before this is called. 785 */ 786 787 void __init setup_arch(char **cmdline_p) 788 { 789 #ifdef CONFIG_X86_32 790 memcpy(&boot_cpu_data, &new_cpu_data, sizeof(new_cpu_data)); 791 visws_early_detect(); 792 pre_setup_arch_hook(); 793 #else 794 printk(KERN_INFO "Command line: %s\n", boot_command_line); 795 #endif 796 797 early_cpu_init(); 798 early_ioremap_init(); 799 800 ROOT_DEV = old_decode_dev(boot_params.hdr.root_dev); 801 screen_info = boot_params.screen_info; 802 edid_info = boot_params.edid_info; 803 #ifdef CONFIG_X86_32 804 apm_info.bios = boot_params.apm_bios_info; 805 ist_info = boot_params.ist_info; 806 if (boot_params.sys_desc_table.length != 0) { 807 set_mca_bus(boot_params.sys_desc_table.table[3] & 0x2); 808 machine_id = boot_params.sys_desc_table.table[0]; 809 machine_submodel_id = boot_params.sys_desc_table.table[1]; 810 BIOS_revision = boot_params.sys_desc_table.table[2]; 811 } 812 #endif 813 saved_video_mode = boot_params.hdr.vid_mode; 814 bootloader_type = boot_params.hdr.type_of_loader; 815 816 #ifdef CONFIG_BLK_DEV_RAM 817 rd_image_start = boot_params.hdr.ram_size & RAMDISK_IMAGE_START_MASK; 818 rd_prompt = ((boot_params.hdr.ram_size & RAMDISK_PROMPT_FLAG) != 0); 819 rd_doload = ((boot_params.hdr.ram_size & RAMDISK_LOAD_FLAG) != 0); 820 #endif 821 #ifdef CONFIG_EFI 822 if (!strncmp((char *)&boot_params.efi_info.efi_loader_signature, 823 #ifdef CONFIG_X86_32 824 "EL32", 825 #else 826 "EL64", 827 #endif 828 4)) { 829 efi_enabled = 1; 830 efi_reserve_early(); 831 } 832 #endif 833 834 ARCH_SETUP 835 836 setup_memory_map(); 837 parse_setup_data(); 838 /* update the e820_saved too */ 839 e820_reserve_setup_data(); 840 841 copy_edd(); 842 843 if (!boot_params.hdr.root_flags) 844 root_mountflags &= ~MS_RDONLY; 845 init_mm.start_code = (unsigned long) _text; 846 init_mm.end_code = (unsigned long) _etext; 847 init_mm.end_data = (unsigned long) _edata; 848 #ifdef CONFIG_X86_32 849 init_mm.brk = init_pg_tables_end + PAGE_OFFSET; 850 #else 851 init_mm.brk = (unsigned long) &_end; 852 #endif 853 854 code_resource.start = virt_to_phys(_text); 855 code_resource.end = virt_to_phys(_etext)-1; 856 data_resource.start = virt_to_phys(_etext); 857 data_resource.end = virt_to_phys(_edata)-1; 858 bss_resource.start = virt_to_phys(&__bss_start); 859 bss_resource.end = virt_to_phys(&__bss_stop)-1; 860 861 #ifdef CONFIG_CMDLINE_BOOL 862 #ifdef CONFIG_CMDLINE_OVERRIDE 863 strlcpy(boot_command_line, builtin_cmdline, COMMAND_LINE_SIZE); 864 #else 865 if (builtin_cmdline[0]) { 866 /* append boot loader cmdline to builtin */ 867 strlcat(builtin_cmdline, " ", COMMAND_LINE_SIZE); 868 strlcat(builtin_cmdline, boot_command_line, COMMAND_LINE_SIZE); 869 strlcpy(boot_command_line, builtin_cmdline, COMMAND_LINE_SIZE); 870 } 871 #endif 872 #endif 873 874 strlcpy(command_line, boot_command_line, COMMAND_LINE_SIZE); 875 *cmdline_p = command_line; 876 877 parse_early_param(); 878 879 #ifdef CONFIG_X86_64 880 check_efer(); 881 #endif 882 883 #if defined(CONFIG_VMI) && defined(CONFIG_X86_32) 884 /* 885 * Must be before kernel pagetables are setup 886 * or fixmap area is touched. 887 */ 888 vmi_init(); 889 #endif 890 891 /* after early param, so could get panic from serial */ 892 reserve_early_setup_data(); 893 894 if (acpi_mps_check()) { 895 #ifdef CONFIG_X86_LOCAL_APIC 896 disable_apic = 1; 897 #endif 898 setup_clear_cpu_cap(X86_FEATURE_APIC); 899 } 900 901 #ifdef CONFIG_PCI 902 if (pci_early_dump_regs) 903 early_dump_pci_devices(); 904 #endif 905 906 finish_e820_parsing(); 907 908 dmi_scan_machine(); 909 910 dmi_check_system(bad_bios_dmi_table); 911 912 #ifdef CONFIG_X86_32 913 probe_roms(); 914 #endif 915 916 /* after parse_early_param, so could debug it */ 917 insert_resource(&iomem_resource, &code_resource); 918 insert_resource(&iomem_resource, &data_resource); 919 insert_resource(&iomem_resource, &bss_resource); 920 921 if (efi_enabled) 922 efi_init(); 923 924 #ifdef CONFIG_X86_32 925 if (ppro_with_ram_bug()) { 926 e820_update_range(0x70000000ULL, 0x40000ULL, E820_RAM, 927 E820_RESERVED); 928 sanitize_e820_map(e820.map, ARRAY_SIZE(e820.map), &e820.nr_map); 929 printk(KERN_INFO "fixed physical RAM map:\n"); 930 e820_print_map("bad_ppro"); 931 } 932 #else 933 early_gart_iommu_check(); 934 #endif 935 936 /* 937 * partially used pages are not usable - thus 938 * we are rounding upwards: 939 */ 940 max_pfn = e820_end_of_ram_pfn(); 941 942 /* preallocate 4k for mptable mpc */ 943 early_reserve_e820_mpc_new(); 944 /* update e820 for memory not covered by WB MTRRs */ 945 mtrr_bp_init(); 946 if (mtrr_trim_uncached_memory(max_pfn)) 947 max_pfn = e820_end_of_ram_pfn(); 948 949 #ifdef CONFIG_X86_32 950 /* max_low_pfn get updated here */ 951 find_low_pfn_range(); 952 #else 953 num_physpages = max_pfn; 954 955 if (cpu_has_x2apic) 956 check_x2apic(); 957 958 /* How many end-of-memory variables you have, grandma! */ 959 /* need this before calling reserve_initrd */ 960 if (max_pfn > (1UL<<(32 - PAGE_SHIFT))) 961 max_low_pfn = e820_end_of_low_ram_pfn(); 962 else 963 max_low_pfn = max_pfn; 964 965 high_memory = (void *)__va(max_pfn * PAGE_SIZE - 1) + 1; 966 #endif 967 968 #ifdef CONFIG_X86_CHECK_BIOS_CORRUPTION 969 setup_bios_corruption_check(); 970 #endif 971 972 /* max_pfn_mapped is updated here */ 973 max_low_pfn_mapped = init_memory_mapping(0, max_low_pfn<<PAGE_SHIFT); 974 max_pfn_mapped = max_low_pfn_mapped; 975 976 #ifdef CONFIG_X86_64 977 if (max_pfn > max_low_pfn) { 978 max_pfn_mapped = init_memory_mapping(1UL<<32, 979 max_pfn<<PAGE_SHIFT); 980 /* can we preseve max_low_pfn ?*/ 981 max_low_pfn = max_pfn; 982 } 983 #endif 984 985 /* 986 * NOTE: On x86-32, only from this point on, fixmaps are ready for use. 987 */ 988 989 #ifdef CONFIG_PROVIDE_OHCI1394_DMA_INIT 990 if (init_ohci1394_dma_early) 991 init_ohci1394_dma_on_all_controllers(); 992 #endif 993 994 reserve_initrd(); 995 996 #ifdef CONFIG_X86_64 997 vsmp_init(); 998 #endif 999 1000 io_delay_init(); 1001 1002 /* 1003 * Parse the ACPI tables for possible boot-time SMP configuration. 1004 */ 1005 acpi_boot_table_init(); 1006 1007 early_acpi_boot_init(); 1008 1009 #ifdef CONFIG_ACPI_NUMA 1010 /* 1011 * Parse SRAT to discover nodes. 1012 */ 1013 acpi_numa_init(); 1014 #endif 1015 1016 initmem_init(0, max_pfn); 1017 1018 #ifdef CONFIG_ACPI_SLEEP 1019 /* 1020 * Reserve low memory region for sleep support. 1021 */ 1022 acpi_reserve_bootmem(); 1023 #endif 1024 #ifdef CONFIG_X86_FIND_SMP_CONFIG 1025 /* 1026 * Find and reserve possible boot-time SMP configuration: 1027 */ 1028 find_smp_config(); 1029 #endif 1030 reserve_crashkernel(); 1031 1032 #ifdef CONFIG_X86_64 1033 /* 1034 * dma32_reserve_bootmem() allocates bootmem which may conflict 1035 * with the crashkernel command line, so do that after 1036 * reserve_crashkernel() 1037 */ 1038 dma32_reserve_bootmem(); 1039 #endif 1040 1041 reserve_ibft_region(); 1042 1043 #ifdef CONFIG_KVM_CLOCK 1044 kvmclock_init(); 1045 #endif 1046 1047 paravirt_pagetable_setup_start(swapper_pg_dir); 1048 paging_init(); 1049 paravirt_pagetable_setup_done(swapper_pg_dir); 1050 paravirt_post_allocator_init(); 1051 1052 #ifdef CONFIG_X86_64 1053 map_vsyscall(); 1054 #endif 1055 1056 #ifdef CONFIG_X86_GENERICARCH 1057 generic_apic_probe(); 1058 #endif 1059 1060 early_quirks(); 1061 1062 /* 1063 * Read APIC and some other early information from ACPI tables. 1064 */ 1065 acpi_boot_init(); 1066 1067 #if defined(CONFIG_X86_MPPARSE) || defined(CONFIG_X86_VISWS) 1068 /* 1069 * get boot-time SMP configuration: 1070 */ 1071 if (smp_found_config) 1072 get_smp_config(); 1073 #endif 1074 1075 prefill_possible_map(); 1076 1077 #ifdef CONFIG_X86_64 1078 init_cpu_to_node(); 1079 #endif 1080 1081 init_apic_mappings(); 1082 ioapic_init_mappings(); 1083 1084 /* need to wait for io_apic is mapped */ 1085 nr_irqs = probe_nr_irqs(); 1086 1087 kvm_guest_init(); 1088 1089 e820_reserve_resources(); 1090 e820_mark_nosave_regions(max_low_pfn); 1091 1092 #ifdef CONFIG_X86_32 1093 request_resource(&iomem_resource, &video_ram_resource); 1094 #endif 1095 reserve_standard_io_resources(); 1096 1097 e820_setup_gap(); 1098 1099 #ifdef CONFIG_VT 1100 #if defined(CONFIG_VGA_CONSOLE) 1101 if (!efi_enabled || (efi_mem_type(0xa0000) != EFI_CONVENTIONAL_MEMORY)) 1102 conswitchp = &vga_con; 1103 #elif defined(CONFIG_DUMMY_CONSOLE) 1104 conswitchp = &dummy_con; 1105 #endif 1106 #endif 1107 } 1108 1109 1110