1 /* 2 * 64-bit pSeries and RS/6000 setup code. 3 * 4 * Copyright (C) 1995 Linus Torvalds 5 * Adapted from 'alpha' version by Gary Thomas 6 * Modified by Cort Dougan (cort@cs.nmt.edu) 7 * Modified by PPC64 Team, IBM Corp 8 * 9 * This program is free software; you can redistribute it and/or 10 * modify it under the terms of the GNU General Public License 11 * as published by the Free Software Foundation; either version 12 * 2 of the License, or (at your option) any later version. 13 */ 14 15 /* 16 * bootup setup stuff.. 17 */ 18 19 #include <linux/cpu.h> 20 #include <linux/errno.h> 21 #include <linux/sched.h> 22 #include <linux/kernel.h> 23 #include <linux/mm.h> 24 #include <linux/stddef.h> 25 #include <linux/unistd.h> 26 #include <linux/user.h> 27 #include <linux/tty.h> 28 #include <linux/major.h> 29 #include <linux/interrupt.h> 30 #include <linux/reboot.h> 31 #include <linux/init.h> 32 #include <linux/ioport.h> 33 #include <linux/console.h> 34 #include <linux/pci.h> 35 #include <linux/utsname.h> 36 #include <linux/adb.h> 37 #include <linux/module.h> 38 #include <linux/delay.h> 39 #include <linux/irq.h> 40 #include <linux/seq_file.h> 41 #include <linux/root_dev.h> 42 43 #include <asm/mmu.h> 44 #include <asm/processor.h> 45 #include <asm/io.h> 46 #include <asm/pgtable.h> 47 #include <asm/prom.h> 48 #include <asm/rtas.h> 49 #include <asm/pci-bridge.h> 50 #include <asm/iommu.h> 51 #include <asm/dma.h> 52 #include <asm/machdep.h> 53 #include <asm/irq.h> 54 #include <asm/time.h> 55 #include <asm/nvram.h> 56 #include "xics.h" 57 #include <asm/pmc.h> 58 #include <asm/mpic.h> 59 #include <asm/ppc-pci.h> 60 #include <asm/i8259.h> 61 #include <asm/udbg.h> 62 #include <asm/smp.h> 63 #include <asm/firmware.h> 64 #include <asm/eeh.h> 65 #include <asm/pSeries_reconfig.h> 66 67 #include "plpar_wrappers.h" 68 #include "pseries.h" 69 70 int CMO_PrPSP = -1; 71 int CMO_SecPSP = -1; 72 unsigned long CMO_PageSize = (ASM_CONST(1) << IOMMU_PAGE_SHIFT); 73 EXPORT_SYMBOL(CMO_PageSize); 74 75 int fwnmi_active; /* TRUE if an FWNMI handler is present */ 76 77 static void pseries_shared_idle_sleep(void); 78 static void pseries_dedicated_idle_sleep(void); 79 80 static struct device_node *pSeries_mpic_node; 81 82 static void pSeries_show_cpuinfo(struct seq_file *m) 83 { 84 struct device_node *root; 85 const char *model = ""; 86 87 root = of_find_node_by_path("/"); 88 if (root) 89 model = of_get_property(root, "model", NULL); 90 seq_printf(m, "machine\t\t: CHRP %s\n", model); 91 of_node_put(root); 92 } 93 94 /* Initialize firmware assisted non-maskable interrupts if 95 * the firmware supports this feature. 96 */ 97 static void __init fwnmi_init(void) 98 { 99 unsigned long system_reset_addr, machine_check_addr; 100 101 int ibm_nmi_register = rtas_token("ibm,nmi-register"); 102 if (ibm_nmi_register == RTAS_UNKNOWN_SERVICE) 103 return; 104 105 /* If the kernel's not linked at zero we point the firmware at low 106 * addresses anyway, and use a trampoline to get to the real code. */ 107 system_reset_addr = __pa(system_reset_fwnmi) - PHYSICAL_START; 108 machine_check_addr = __pa(machine_check_fwnmi) - PHYSICAL_START; 109 110 if (0 == rtas_call(ibm_nmi_register, 2, 1, NULL, system_reset_addr, 111 machine_check_addr)) 112 fwnmi_active = 1; 113 } 114 115 static void pseries_8259_cascade(unsigned int irq, struct irq_desc *desc) 116 { 117 struct irq_chip *chip = get_irq_desc_chip(desc); 118 unsigned int cascade_irq = i8259_irq(); 119 120 if (cascade_irq != NO_IRQ) 121 generic_handle_irq(cascade_irq); 122 123 chip->irq_eoi(&desc->irq_data); 124 } 125 126 static void __init pseries_setup_i8259_cascade(void) 127 { 128 struct device_node *np, *old, *found = NULL; 129 unsigned int cascade; 130 const u32 *addrp; 131 unsigned long intack = 0; 132 int naddr; 133 134 for_each_node_by_type(np, "interrupt-controller") { 135 if (of_device_is_compatible(np, "chrp,iic")) { 136 found = np; 137 break; 138 } 139 } 140 141 if (found == NULL) { 142 printk(KERN_DEBUG "pic: no ISA interrupt controller\n"); 143 return; 144 } 145 146 cascade = irq_of_parse_and_map(found, 0); 147 if (cascade == NO_IRQ) { 148 printk(KERN_ERR "pic: failed to map cascade interrupt"); 149 return; 150 } 151 pr_debug("pic: cascade mapped to irq %d\n", cascade); 152 153 for (old = of_node_get(found); old != NULL ; old = np) { 154 np = of_get_parent(old); 155 of_node_put(old); 156 if (np == NULL) 157 break; 158 if (strcmp(np->name, "pci") != 0) 159 continue; 160 addrp = of_get_property(np, "8259-interrupt-acknowledge", NULL); 161 if (addrp == NULL) 162 continue; 163 naddr = of_n_addr_cells(np); 164 intack = addrp[naddr-1]; 165 if (naddr > 1) 166 intack |= ((unsigned long)addrp[naddr-2]) << 32; 167 } 168 if (intack) 169 printk(KERN_DEBUG "pic: PCI 8259 intack at 0x%016lx\n", intack); 170 i8259_init(found, intack); 171 of_node_put(found); 172 set_irq_chained_handler(cascade, pseries_8259_cascade); 173 } 174 175 static void __init pseries_mpic_init_IRQ(void) 176 { 177 struct device_node *np; 178 const unsigned int *opprop; 179 unsigned long openpic_addr = 0; 180 int naddr, n, i, opplen; 181 struct mpic *mpic; 182 183 np = of_find_node_by_path("/"); 184 naddr = of_n_addr_cells(np); 185 opprop = of_get_property(np, "platform-open-pic", &opplen); 186 if (opprop != 0) { 187 openpic_addr = of_read_number(opprop, naddr); 188 printk(KERN_DEBUG "OpenPIC addr: %lx\n", openpic_addr); 189 } 190 of_node_put(np); 191 192 BUG_ON(openpic_addr == 0); 193 194 /* Setup the openpic driver */ 195 mpic = mpic_alloc(pSeries_mpic_node, openpic_addr, 196 MPIC_PRIMARY, 197 16, 250, /* isu size, irq count */ 198 " MPIC "); 199 BUG_ON(mpic == NULL); 200 201 /* Add ISUs */ 202 opplen /= sizeof(u32); 203 for (n = 0, i = naddr; i < opplen; i += naddr, n++) { 204 unsigned long isuaddr = of_read_number(opprop + i, naddr); 205 mpic_assign_isu(mpic, n, isuaddr); 206 } 207 208 /* All ISUs are setup, complete initialization */ 209 mpic_init(mpic); 210 211 /* Look for cascade */ 212 pseries_setup_i8259_cascade(); 213 } 214 215 static void __init pseries_xics_init_IRQ(void) 216 { 217 xics_init_IRQ(); 218 pseries_setup_i8259_cascade(); 219 } 220 221 static void pseries_lpar_enable_pmcs(void) 222 { 223 unsigned long set, reset; 224 225 set = 1UL << 63; 226 reset = 0; 227 plpar_hcall_norets(H_PERFMON, set, reset); 228 } 229 230 static void __init pseries_discover_pic(void) 231 { 232 struct device_node *np; 233 const char *typep; 234 235 for (np = NULL; (np = of_find_node_by_name(np, 236 "interrupt-controller"));) { 237 typep = of_get_property(np, "compatible", NULL); 238 if (strstr(typep, "open-pic")) { 239 pSeries_mpic_node = of_node_get(np); 240 ppc_md.init_IRQ = pseries_mpic_init_IRQ; 241 ppc_md.get_irq = mpic_get_irq; 242 setup_kexec_cpu_down_mpic(); 243 smp_init_pseries_mpic(); 244 return; 245 } else if (strstr(typep, "ppc-xicp")) { 246 ppc_md.init_IRQ = pseries_xics_init_IRQ; 247 setup_kexec_cpu_down_xics(); 248 smp_init_pseries_xics(); 249 return; 250 } 251 } 252 printk(KERN_ERR "pSeries_discover_pic: failed to recognize" 253 " interrupt-controller\n"); 254 } 255 256 static int pci_dn_reconfig_notifier(struct notifier_block *nb, unsigned long action, void *node) 257 { 258 struct device_node *np = node; 259 struct pci_dn *pci = NULL; 260 int err = NOTIFY_OK; 261 262 switch (action) { 263 case PSERIES_RECONFIG_ADD: 264 pci = np->parent->data; 265 if (pci) 266 update_dn_pci_info(np, pci->phb); 267 break; 268 default: 269 err = NOTIFY_DONE; 270 break; 271 } 272 return err; 273 } 274 275 static struct notifier_block pci_dn_reconfig_nb = { 276 .notifier_call = pci_dn_reconfig_notifier, 277 }; 278 279 #ifdef CONFIG_VIRT_CPU_ACCOUNTING 280 /* 281 * Allocate space for the dispatch trace log for all possible cpus 282 * and register the buffers with the hypervisor. This is used for 283 * computing time stolen by the hypervisor. 284 */ 285 static int alloc_dispatch_logs(void) 286 { 287 int cpu, ret; 288 struct paca_struct *pp; 289 struct dtl_entry *dtl; 290 291 if (!firmware_has_feature(FW_FEATURE_SPLPAR)) 292 return 0; 293 294 for_each_possible_cpu(cpu) { 295 pp = &paca[cpu]; 296 dtl = kmalloc_node(DISPATCH_LOG_BYTES, GFP_KERNEL, 297 cpu_to_node(cpu)); 298 if (!dtl) { 299 pr_warn("Failed to allocate dispatch trace log for cpu %d\n", 300 cpu); 301 pr_warn("Stolen time statistics will be unreliable\n"); 302 break; 303 } 304 305 pp->dtl_ridx = 0; 306 pp->dispatch_log = dtl; 307 pp->dispatch_log_end = dtl + N_DISPATCH_LOG; 308 pp->dtl_curr = dtl; 309 } 310 311 /* Register the DTL for the current (boot) cpu */ 312 dtl = get_paca()->dispatch_log; 313 get_paca()->dtl_ridx = 0; 314 get_paca()->dtl_curr = dtl; 315 get_paca()->lppaca_ptr->dtl_idx = 0; 316 317 /* hypervisor reads buffer length from this field */ 318 dtl->enqueue_to_dispatch_time = DISPATCH_LOG_BYTES; 319 ret = register_dtl(hard_smp_processor_id(), __pa(dtl)); 320 if (ret) 321 pr_warn("DTL registration failed for boot cpu %d (%d)\n", 322 smp_processor_id(), ret); 323 get_paca()->lppaca_ptr->dtl_enable_mask = 2; 324 325 return 0; 326 } 327 328 early_initcall(alloc_dispatch_logs); 329 #endif /* CONFIG_VIRT_CPU_ACCOUNTING */ 330 331 static void __init pSeries_setup_arch(void) 332 { 333 /* Discover PIC type and setup ppc_md accordingly */ 334 pseries_discover_pic(); 335 336 /* openpic global configuration register (64-bit format). */ 337 /* openpic Interrupt Source Unit pointer (64-bit format). */ 338 /* python0 facility area (mmio) (64-bit format) REAL address. */ 339 340 /* init to some ~sane value until calibrate_delay() runs */ 341 loops_per_jiffy = 50000000; 342 343 fwnmi_init(); 344 345 /* Find and initialize PCI host bridges */ 346 init_pci_config_tokens(); 347 find_and_init_phbs(); 348 pSeries_reconfig_notifier_register(&pci_dn_reconfig_nb); 349 eeh_init(); 350 351 pSeries_nvram_init(); 352 353 /* Choose an idle loop */ 354 if (firmware_has_feature(FW_FEATURE_SPLPAR)) { 355 vpa_init(boot_cpuid); 356 if (get_lppaca()->shared_proc) { 357 printk(KERN_DEBUG "Using shared processor idle loop\n"); 358 ppc_md.power_save = pseries_shared_idle_sleep; 359 } else { 360 printk(KERN_DEBUG "Using dedicated idle loop\n"); 361 ppc_md.power_save = pseries_dedicated_idle_sleep; 362 } 363 } else { 364 printk(KERN_DEBUG "Using default idle loop\n"); 365 } 366 367 if (firmware_has_feature(FW_FEATURE_LPAR)) 368 ppc_md.enable_pmcs = pseries_lpar_enable_pmcs; 369 else 370 ppc_md.enable_pmcs = power4_enable_pmcs; 371 } 372 373 static int __init pSeries_init_panel(void) 374 { 375 /* Manually leave the kernel version on the panel. */ 376 ppc_md.progress("Linux ppc64\n", 0); 377 ppc_md.progress(init_utsname()->version, 0); 378 379 return 0; 380 } 381 arch_initcall(pSeries_init_panel); 382 383 static int pseries_set_dabr(unsigned long dabr) 384 { 385 return plpar_hcall_norets(H_SET_DABR, dabr); 386 } 387 388 static int pseries_set_xdabr(unsigned long dabr) 389 { 390 /* We want to catch accesses from kernel and userspace */ 391 return plpar_hcall_norets(H_SET_XDABR, dabr, 392 H_DABRX_KERNEL | H_DABRX_USER); 393 } 394 395 #define CMO_CHARACTERISTICS_TOKEN 44 396 #define CMO_MAXLENGTH 1026 397 398 /** 399 * fw_cmo_feature_init - FW_FEATURE_CMO is not stored in ibm,hypertas-functions, 400 * handle that here. (Stolen from parse_system_parameter_string) 401 */ 402 void pSeries_cmo_feature_init(void) 403 { 404 char *ptr, *key, *value, *end; 405 int call_status; 406 int page_order = IOMMU_PAGE_SHIFT; 407 408 pr_debug(" -> fw_cmo_feature_init()\n"); 409 spin_lock(&rtas_data_buf_lock); 410 memset(rtas_data_buf, 0, RTAS_DATA_BUF_SIZE); 411 call_status = rtas_call(rtas_token("ibm,get-system-parameter"), 3, 1, 412 NULL, 413 CMO_CHARACTERISTICS_TOKEN, 414 __pa(rtas_data_buf), 415 RTAS_DATA_BUF_SIZE); 416 417 if (call_status != 0) { 418 spin_unlock(&rtas_data_buf_lock); 419 pr_debug("CMO not available\n"); 420 pr_debug(" <- fw_cmo_feature_init()\n"); 421 return; 422 } 423 424 end = rtas_data_buf + CMO_MAXLENGTH - 2; 425 ptr = rtas_data_buf + 2; /* step over strlen value */ 426 key = value = ptr; 427 428 while (*ptr && (ptr <= end)) { 429 /* Separate the key and value by replacing '=' with '\0' and 430 * point the value at the string after the '=' 431 */ 432 if (ptr[0] == '=') { 433 ptr[0] = '\0'; 434 value = ptr + 1; 435 } else if (ptr[0] == '\0' || ptr[0] == ',') { 436 /* Terminate the string containing the key/value pair */ 437 ptr[0] = '\0'; 438 439 if (key == value) { 440 pr_debug("Malformed key/value pair\n"); 441 /* Never found a '=', end processing */ 442 break; 443 } 444 445 if (0 == strcmp(key, "CMOPageSize")) 446 page_order = simple_strtol(value, NULL, 10); 447 else if (0 == strcmp(key, "PrPSP")) 448 CMO_PrPSP = simple_strtol(value, NULL, 10); 449 else if (0 == strcmp(key, "SecPSP")) 450 CMO_SecPSP = simple_strtol(value, NULL, 10); 451 value = key = ptr + 1; 452 } 453 ptr++; 454 } 455 456 /* Page size is returned as the power of 2 of the page size, 457 * convert to the page size in bytes before returning 458 */ 459 CMO_PageSize = 1 << page_order; 460 pr_debug("CMO_PageSize = %lu\n", CMO_PageSize); 461 462 if (CMO_PrPSP != -1 || CMO_SecPSP != -1) { 463 pr_info("CMO enabled\n"); 464 pr_debug("CMO enabled, PrPSP=%d, SecPSP=%d\n", CMO_PrPSP, 465 CMO_SecPSP); 466 powerpc_firmware_features |= FW_FEATURE_CMO; 467 } else 468 pr_debug("CMO not enabled, PrPSP=%d, SecPSP=%d\n", CMO_PrPSP, 469 CMO_SecPSP); 470 spin_unlock(&rtas_data_buf_lock); 471 pr_debug(" <- fw_cmo_feature_init()\n"); 472 } 473 474 /* 475 * Early initialization. Relocation is on but do not reference unbolted pages 476 */ 477 static void __init pSeries_init_early(void) 478 { 479 pr_debug(" -> pSeries_init_early()\n"); 480 481 if (firmware_has_feature(FW_FEATURE_LPAR)) 482 find_udbg_vterm(); 483 484 if (firmware_has_feature(FW_FEATURE_DABR)) 485 ppc_md.set_dabr = pseries_set_dabr; 486 else if (firmware_has_feature(FW_FEATURE_XDABR)) 487 ppc_md.set_dabr = pseries_set_xdabr; 488 489 pSeries_cmo_feature_init(); 490 iommu_init_early_pSeries(); 491 492 pr_debug(" <- pSeries_init_early()\n"); 493 } 494 495 /* 496 * Called very early, MMU is off, device-tree isn't unflattened 497 */ 498 499 static int __init pSeries_probe_hypertas(unsigned long node, 500 const char *uname, int depth, 501 void *data) 502 { 503 const char *hypertas; 504 unsigned long len; 505 506 if (depth != 1 || 507 (strcmp(uname, "rtas") != 0 && strcmp(uname, "rtas@0") != 0)) 508 return 0; 509 510 hypertas = of_get_flat_dt_prop(node, "ibm,hypertas-functions", &len); 511 if (!hypertas) 512 return 1; 513 514 powerpc_firmware_features |= FW_FEATURE_LPAR; 515 fw_feature_init(hypertas, len); 516 517 return 1; 518 } 519 520 static int __init pSeries_probe(void) 521 { 522 unsigned long root = of_get_flat_dt_root(); 523 char *dtype = of_get_flat_dt_prop(root, "device_type", NULL); 524 525 if (dtype == NULL) 526 return 0; 527 if (strcmp(dtype, "chrp")) 528 return 0; 529 530 /* Cell blades firmware claims to be chrp while it's not. Until this 531 * is fixed, we need to avoid those here. 532 */ 533 if (of_flat_dt_is_compatible(root, "IBM,CPBW-1.0") || 534 of_flat_dt_is_compatible(root, "IBM,CBEA")) 535 return 0; 536 537 pr_debug("pSeries detected, looking for LPAR capability...\n"); 538 539 /* Now try to figure out if we are running on LPAR */ 540 of_scan_flat_dt(pSeries_probe_hypertas, NULL); 541 542 if (firmware_has_feature(FW_FEATURE_LPAR)) 543 hpte_init_lpar(); 544 else 545 hpte_init_native(); 546 547 pr_debug("Machine is%s LPAR !\n", 548 (powerpc_firmware_features & FW_FEATURE_LPAR) ? "" : " not"); 549 550 return 1; 551 } 552 553 554 DECLARE_PER_CPU(long, smt_snooze_delay); 555 556 static void pseries_dedicated_idle_sleep(void) 557 { 558 unsigned int cpu = smp_processor_id(); 559 unsigned long start_snooze; 560 unsigned long in_purr, out_purr; 561 long snooze = __get_cpu_var(smt_snooze_delay); 562 563 /* 564 * Indicate to the HV that we are idle. Now would be 565 * a good time to find other work to dispatch. 566 */ 567 get_lppaca()->idle = 1; 568 get_lppaca()->donate_dedicated_cpu = 1; 569 in_purr = mfspr(SPRN_PURR); 570 571 /* 572 * We come in with interrupts disabled, and need_resched() 573 * has been checked recently. If we should poll for a little 574 * while, do so. 575 */ 576 if (snooze) { 577 start_snooze = get_tb() + snooze * tb_ticks_per_usec; 578 local_irq_enable(); 579 set_thread_flag(TIF_POLLING_NRFLAG); 580 581 while ((snooze < 0) || (get_tb() < start_snooze)) { 582 if (need_resched() || cpu_is_offline(cpu)) 583 goto out; 584 ppc64_runlatch_off(); 585 HMT_low(); 586 HMT_very_low(); 587 } 588 589 HMT_medium(); 590 clear_thread_flag(TIF_POLLING_NRFLAG); 591 smp_mb(); 592 local_irq_disable(); 593 if (need_resched() || cpu_is_offline(cpu)) 594 goto out; 595 } 596 597 cede_processor(); 598 599 out: 600 HMT_medium(); 601 out_purr = mfspr(SPRN_PURR); 602 get_lppaca()->wait_state_cycles += out_purr - in_purr; 603 get_lppaca()->donate_dedicated_cpu = 0; 604 get_lppaca()->idle = 0; 605 } 606 607 static void pseries_shared_idle_sleep(void) 608 { 609 /* 610 * Indicate to the HV that we are idle. Now would be 611 * a good time to find other work to dispatch. 612 */ 613 get_lppaca()->idle = 1; 614 615 /* 616 * Yield the processor to the hypervisor. We return if 617 * an external interrupt occurs (which are driven prior 618 * to returning here) or if a prod occurs from another 619 * processor. When returning here, external interrupts 620 * are enabled. 621 */ 622 cede_processor(); 623 624 get_lppaca()->idle = 0; 625 } 626 627 static int pSeries_pci_probe_mode(struct pci_bus *bus) 628 { 629 if (firmware_has_feature(FW_FEATURE_LPAR)) 630 return PCI_PROBE_DEVTREE; 631 return PCI_PROBE_NORMAL; 632 } 633 634 /** 635 * pSeries_power_off - tell firmware about how to power off the system. 636 * 637 * This function calls either the power-off rtas token in normal cases 638 * or the ibm,power-off-ups token (if present & requested) in case of 639 * a power failure. If power-off token is used, power on will only be 640 * possible with power button press. If ibm,power-off-ups token is used 641 * it will allow auto poweron after power is restored. 642 */ 643 static void pSeries_power_off(void) 644 { 645 int rc; 646 int rtas_poweroff_ups_token = rtas_token("ibm,power-off-ups"); 647 648 if (rtas_flash_term_hook) 649 rtas_flash_term_hook(SYS_POWER_OFF); 650 651 if (rtas_poweron_auto == 0 || 652 rtas_poweroff_ups_token == RTAS_UNKNOWN_SERVICE) { 653 rc = rtas_call(rtas_token("power-off"), 2, 1, NULL, -1, -1); 654 printk(KERN_INFO "RTAS power-off returned %d\n", rc); 655 } else { 656 rc = rtas_call(rtas_poweroff_ups_token, 0, 1, NULL); 657 printk(KERN_INFO "RTAS ibm,power-off-ups returned %d\n", rc); 658 } 659 for (;;); 660 } 661 662 #ifndef CONFIG_PCI 663 void pSeries_final_fixup(void) { } 664 #endif 665 666 define_machine(pseries) { 667 .name = "pSeries", 668 .probe = pSeries_probe, 669 .setup_arch = pSeries_setup_arch, 670 .init_early = pSeries_init_early, 671 .show_cpuinfo = pSeries_show_cpuinfo, 672 .log_error = pSeries_log_error, 673 .pcibios_fixup = pSeries_final_fixup, 674 .pci_probe_mode = pSeries_pci_probe_mode, 675 .restart = rtas_restart, 676 .power_off = pSeries_power_off, 677 .halt = rtas_halt, 678 .panic = rtas_os_term, 679 .get_boot_time = rtas_get_boot_time, 680 .get_rtc_time = rtas_get_rtc_time, 681 .set_rtc_time = rtas_set_rtc_time, 682 .calibrate_decr = generic_calibrate_decr, 683 .progress = rtas_progress, 684 .system_reset_exception = pSeries_system_reset_exception, 685 .machine_check_exception = pSeries_machine_check_exception, 686 }; 687