1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* 3 * Derived from arch/i386/kernel/irq.c 4 * Copyright (C) 1992 Linus Torvalds 5 * Adapted from arch/i386 by Gary Thomas 6 * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org) 7 * Updated and modified by Cort Dougan <cort@fsmlabs.com> 8 * Copyright (C) 1996-2001 Cort Dougan 9 * Adapted for Power Macintosh by Paul Mackerras 10 * Copyright (C) 1996 Paul Mackerras (paulus@cs.anu.edu.au) 11 * 12 * This file contains the code used by various IRQ handling routines: 13 * asking for different IRQ's should be done through these routines 14 * instead of just grabbing them. Thus setups with different IRQ numbers 15 * shouldn't result in any weird surprises, and installing new handlers 16 * should be easier. 17 * 18 * The MPC8xx has an interrupt mask in the SIU. If a bit is set, the 19 * interrupt is _enabled_. As expected, IRQ0 is bit 0 in the 32-bit 20 * mask register (of which only 16 are defined), hence the weird shifting 21 * and complement of the cached_irq_mask. I want to be able to stuff 22 * this right into the SIU SMASK register. 23 * Many of the prep/chrp functions are conditional compiled on CONFIG_PPC_8xx 24 * to reduce code space and undefined function references. 25 */ 26 27 #undef DEBUG 28 29 #include <linux/export.h> 30 #include <linux/threads.h> 31 #include <linux/kernel_stat.h> 32 #include <linux/signal.h> 33 #include <linux/sched.h> 34 #include <linux/ptrace.h> 35 #include <linux/ioport.h> 36 #include <linux/interrupt.h> 37 #include <linux/timex.h> 38 #include <linux/init.h> 39 #include <linux/slab.h> 40 #include <linux/delay.h> 41 #include <linux/irq.h> 42 #include <linux/seq_file.h> 43 #include <linux/cpumask.h> 44 #include <linux/profile.h> 45 #include <linux/bitops.h> 46 #include <linux/list.h> 47 #include <linux/radix-tree.h> 48 #include <linux/mutex.h> 49 #include <linux/pci.h> 50 #include <linux/debugfs.h> 51 #include <linux/of.h> 52 #include <linux/of_irq.h> 53 #include <linux/vmalloc.h> 54 55 #include <linux/uaccess.h> 56 #include <asm/io.h> 57 #include <asm/pgtable.h> 58 #include <asm/irq.h> 59 #include <asm/cache.h> 60 #include <asm/prom.h> 61 #include <asm/ptrace.h> 62 #include <asm/machdep.h> 63 #include <asm/udbg.h> 64 #include <asm/smp.h> 65 #include <asm/livepatch.h> 66 #include <asm/asm-prototypes.h> 67 #include <asm/hw_irq.h> 68 69 #ifdef CONFIG_PPC64 70 #include <asm/paca.h> 71 #include <asm/firmware.h> 72 #include <asm/lv1call.h> 73 #include <asm/dbell.h> 74 #endif 75 #define CREATE_TRACE_POINTS 76 #include <asm/trace.h> 77 #include <asm/cpu_has_feature.h> 78 79 DEFINE_PER_CPU_SHARED_ALIGNED(irq_cpustat_t, irq_stat); 80 EXPORT_PER_CPU_SYMBOL(irq_stat); 81 82 #ifdef CONFIG_PPC32 83 atomic_t ppc_n_lost_interrupts; 84 85 #ifdef CONFIG_TAU_INT 86 extern int tau_initialized; 87 u32 tau_interrupts(unsigned long cpu); 88 #endif 89 #endif /* CONFIG_PPC32 */ 90 91 #ifdef CONFIG_PPC64 92 93 int distribute_irqs = 1; 94 95 static inline notrace unsigned long get_irq_happened(void) 96 { 97 unsigned long happened; 98 99 __asm__ __volatile__("lbz %0,%1(13)" 100 : "=r" (happened) : "i" (offsetof(struct paca_struct, irq_happened))); 101 102 return happened; 103 } 104 105 static inline notrace int decrementer_check_overflow(void) 106 { 107 u64 now = get_tb_or_rtc(); 108 u64 *next_tb = this_cpu_ptr(&decrementers_next_tb); 109 110 return now >= *next_tb; 111 } 112 113 #ifdef CONFIG_PPC_BOOK3E 114 115 /* This is called whenever we are re-enabling interrupts 116 * and returns either 0 (nothing to do) or 500/900/280/a00/e80 if 117 * there's an EE, DEC or DBELL to generate. 118 * 119 * This is called in two contexts: From arch_local_irq_restore() 120 * before soft-enabling interrupts, and from the exception exit 121 * path when returning from an interrupt from a soft-disabled to 122 * a soft enabled context. In both case we have interrupts hard 123 * disabled. 124 * 125 * We take care of only clearing the bits we handled in the 126 * PACA irq_happened field since we can only re-emit one at a 127 * time and we don't want to "lose" one. 128 */ 129 notrace unsigned int __check_irq_replay(void) 130 { 131 /* 132 * We use local_paca rather than get_paca() to avoid all 133 * the debug_smp_processor_id() business in this low level 134 * function 135 */ 136 unsigned char happened = local_paca->irq_happened; 137 138 /* 139 * We are responding to the next interrupt, so interrupt-off 140 * latencies should be reset here. 141 */ 142 trace_hardirqs_on(); 143 trace_hardirqs_off(); 144 145 /* 146 * We are always hard disabled here, but PACA_IRQ_HARD_DIS may 147 * not be set, which means interrupts have only just been hard 148 * disabled as part of the local_irq_restore or interrupt return 149 * code. In that case, skip the decrementr check becaus it's 150 * expensive to read the TB. 151 * 152 * HARD_DIS then gets cleared here, but it's reconciled later. 153 * Either local_irq_disable will replay the interrupt and that 154 * will reconcile state like other hard interrupts. Or interrupt 155 * retur will replay the interrupt and in that case it sets 156 * PACA_IRQ_HARD_DIS by hand (see comments in entry_64.S). 157 */ 158 if (happened & PACA_IRQ_HARD_DIS) { 159 local_paca->irq_happened &= ~PACA_IRQ_HARD_DIS; 160 161 /* 162 * We may have missed a decrementer interrupt if hard disabled. 163 * Check the decrementer register in case we had a rollover 164 * while hard disabled. 165 */ 166 if (!(happened & PACA_IRQ_DEC)) { 167 if (decrementer_check_overflow()) { 168 local_paca->irq_happened |= PACA_IRQ_DEC; 169 happened |= PACA_IRQ_DEC; 170 } 171 } 172 } 173 174 if (happened & PACA_IRQ_DEC) { 175 local_paca->irq_happened &= ~PACA_IRQ_DEC; 176 return 0x900; 177 } 178 179 if (happened & PACA_IRQ_EE) { 180 local_paca->irq_happened &= ~PACA_IRQ_EE; 181 return 0x500; 182 } 183 184 /* 185 * Check if an EPR external interrupt happened this bit is typically 186 * set if we need to handle another "edge" interrupt from within the 187 * MPIC "EPR" handler. 188 */ 189 if (happened & PACA_IRQ_EE_EDGE) { 190 local_paca->irq_happened &= ~PACA_IRQ_EE_EDGE; 191 return 0x500; 192 } 193 194 if (happened & PACA_IRQ_DBELL) { 195 local_paca->irq_happened &= ~PACA_IRQ_DBELL; 196 return 0x280; 197 } 198 199 /* There should be nothing left ! */ 200 BUG_ON(local_paca->irq_happened != 0); 201 202 return 0; 203 } 204 #endif /* CONFIG_PPC_BOOK3E */ 205 206 void replay_soft_interrupts(void) 207 { 208 /* 209 * We use local_paca rather than get_paca() to avoid all 210 * the debug_smp_processor_id() business in this low level 211 * function 212 */ 213 unsigned char happened = local_paca->irq_happened; 214 struct pt_regs regs; 215 216 ppc_save_regs(®s); 217 regs.softe = IRQS_ALL_DISABLED; 218 219 again: 220 if (IS_ENABLED(CONFIG_PPC_IRQ_SOFT_MASK_DEBUG)) 221 WARN_ON_ONCE(mfmsr() & MSR_EE); 222 223 if (happened & PACA_IRQ_HARD_DIS) { 224 /* 225 * We may have missed a decrementer interrupt if hard disabled. 226 * Check the decrementer register in case we had a rollover 227 * while hard disabled. 228 */ 229 if (!(happened & PACA_IRQ_DEC)) { 230 if (decrementer_check_overflow()) 231 happened |= PACA_IRQ_DEC; 232 } 233 } 234 235 /* 236 * Force the delivery of pending soft-disabled interrupts on PS3. 237 * Any HV call will have this side effect. 238 */ 239 if (firmware_has_feature(FW_FEATURE_PS3_LV1)) { 240 u64 tmp, tmp2; 241 lv1_get_version_info(&tmp, &tmp2); 242 } 243 244 /* 245 * Check if an hypervisor Maintenance interrupt happened. 246 * This is a higher priority interrupt than the others, so 247 * replay it first. 248 */ 249 if (IS_ENABLED(CONFIG_PPC_BOOK3S) && (happened & PACA_IRQ_HMI)) { 250 local_paca->irq_happened &= ~PACA_IRQ_HMI; 251 regs.trap = 0xe60; 252 handle_hmi_exception(®s); 253 if (!(local_paca->irq_happened & PACA_IRQ_HARD_DIS)) 254 hard_irq_disable(); 255 } 256 257 if (happened & PACA_IRQ_DEC) { 258 local_paca->irq_happened &= ~PACA_IRQ_DEC; 259 regs.trap = 0x900; 260 timer_interrupt(®s); 261 if (!(local_paca->irq_happened & PACA_IRQ_HARD_DIS)) 262 hard_irq_disable(); 263 } 264 265 if (happened & PACA_IRQ_EE) { 266 local_paca->irq_happened &= ~PACA_IRQ_EE; 267 regs.trap = 0x500; 268 do_IRQ(®s); 269 if (!(local_paca->irq_happened & PACA_IRQ_HARD_DIS)) 270 hard_irq_disable(); 271 } 272 273 /* 274 * Check if an EPR external interrupt happened this bit is typically 275 * set if we need to handle another "edge" interrupt from within the 276 * MPIC "EPR" handler. 277 */ 278 if (IS_ENABLED(CONFIG_PPC_BOOK3E) && (happened & PACA_IRQ_EE_EDGE)) { 279 local_paca->irq_happened &= ~PACA_IRQ_EE_EDGE; 280 regs.trap = 0x500; 281 do_IRQ(®s); 282 if (!(local_paca->irq_happened & PACA_IRQ_HARD_DIS)) 283 hard_irq_disable(); 284 } 285 286 if (IS_ENABLED(CONFIG_PPC_DOORBELL) && (happened & PACA_IRQ_DBELL)) { 287 local_paca->irq_happened &= ~PACA_IRQ_DBELL; 288 if (IS_ENABLED(CONFIG_PPC_BOOK3E)) 289 regs.trap = 0x280; 290 else 291 regs.trap = 0xa00; 292 doorbell_exception(®s); 293 if (!(local_paca->irq_happened & PACA_IRQ_HARD_DIS)) 294 hard_irq_disable(); 295 } 296 297 /* Book3E does not support soft-masking PMI interrupts */ 298 if (IS_ENABLED(CONFIG_PPC_BOOK3S) && (happened & PACA_IRQ_PMI)) { 299 local_paca->irq_happened &= ~PACA_IRQ_PMI; 300 regs.trap = 0xf00; 301 performance_monitor_exception(®s); 302 if (!(local_paca->irq_happened & PACA_IRQ_HARD_DIS)) 303 hard_irq_disable(); 304 } 305 306 happened = local_paca->irq_happened; 307 if (happened & ~PACA_IRQ_HARD_DIS) { 308 /* 309 * We are responding to the next interrupt, so interrupt-off 310 * latencies should be reset here. 311 */ 312 trace_hardirqs_on(); 313 trace_hardirqs_off(); 314 goto again; 315 } 316 } 317 318 notrace void arch_local_irq_restore(unsigned long mask) 319 { 320 unsigned char irq_happened; 321 322 /* Write the new soft-enabled value */ 323 irq_soft_mask_set(mask); 324 if (mask) 325 return; 326 327 /* 328 * From this point onward, we can take interrupts, preempt, 329 * etc... unless we got hard-disabled. We check if an event 330 * happened. If none happened, we know we can just return. 331 * 332 * We may have preempted before the check below, in which case 333 * we are checking the "new" CPU instead of the old one. This 334 * is only a problem if an event happened on the "old" CPU. 335 * 336 * External interrupt events will have caused interrupts to 337 * be hard-disabled, so there is no problem, we 338 * cannot have preempted. 339 */ 340 irq_happened = get_irq_happened(); 341 if (!irq_happened) { 342 if (IS_ENABLED(CONFIG_PPC_IRQ_SOFT_MASK_DEBUG)) 343 WARN_ON_ONCE(!(mfmsr() & MSR_EE)); 344 return; 345 } 346 347 /* We need to hard disable to replay. */ 348 if (!(irq_happened & PACA_IRQ_HARD_DIS)) { 349 if (IS_ENABLED(CONFIG_PPC_IRQ_SOFT_MASK_DEBUG)) 350 WARN_ON_ONCE(!(mfmsr() & MSR_EE)); 351 __hard_irq_disable(); 352 } else { 353 /* 354 * We should already be hard disabled here. We had bugs 355 * where that wasn't the case so let's dbl check it and 356 * warn if we are wrong. Only do that when IRQ tracing 357 * is enabled as mfmsr() can be costly. 358 */ 359 if (IS_ENABLED(CONFIG_PPC_IRQ_SOFT_MASK_DEBUG)) { 360 if (WARN_ON_ONCE(mfmsr() & MSR_EE)) 361 __hard_irq_disable(); 362 } 363 364 if (irq_happened == PACA_IRQ_HARD_DIS) { 365 local_paca->irq_happened = 0; 366 __hard_irq_enable(); 367 return; 368 } 369 } 370 371 irq_soft_mask_set(IRQS_ALL_DISABLED); 372 trace_hardirqs_off(); 373 374 replay_soft_interrupts(); 375 local_paca->irq_happened = 0; 376 377 trace_hardirqs_on(); 378 irq_soft_mask_set(IRQS_ENABLED); 379 __hard_irq_enable(); 380 } 381 EXPORT_SYMBOL(arch_local_irq_restore); 382 383 /* 384 * This is specifically called by assembly code to re-enable interrupts 385 * if they are currently disabled. This is typically called before 386 * schedule() or do_signal() when returning to userspace. We do it 387 * in C to avoid the burden of dealing with lockdep etc... 388 * 389 * NOTE: This is called with interrupts hard disabled but not marked 390 * as such in paca->irq_happened, so we need to resync this. 391 */ 392 void notrace restore_interrupts(void) 393 { 394 if (irqs_disabled()) { 395 local_paca->irq_happened |= PACA_IRQ_HARD_DIS; 396 local_irq_enable(); 397 } else 398 __hard_irq_enable(); 399 } 400 401 /* 402 * This is a helper to use when about to go into idle low-power 403 * when the latter has the side effect of re-enabling interrupts 404 * (such as calling H_CEDE under pHyp). 405 * 406 * You call this function with interrupts soft-disabled (this is 407 * already the case when ppc_md.power_save is called). The function 408 * will return whether to enter power save or just return. 409 * 410 * In the former case, it will have notified lockdep of interrupts 411 * being re-enabled and generally sanitized the lazy irq state, 412 * and in the latter case it will leave with interrupts hard 413 * disabled and marked as such, so the local_irq_enable() call 414 * in arch_cpu_idle() will properly re-enable everything. 415 */ 416 bool prep_irq_for_idle(void) 417 { 418 /* 419 * First we need to hard disable to ensure no interrupt 420 * occurs before we effectively enter the low power state 421 */ 422 __hard_irq_disable(); 423 local_paca->irq_happened |= PACA_IRQ_HARD_DIS; 424 425 /* 426 * If anything happened while we were soft-disabled, 427 * we return now and do not enter the low power state. 428 */ 429 if (lazy_irq_pending()) 430 return false; 431 432 /* Tell lockdep we are about to re-enable */ 433 trace_hardirqs_on(); 434 435 /* 436 * Mark interrupts as soft-enabled and clear the 437 * PACA_IRQ_HARD_DIS from the pending mask since we 438 * are about to hard enable as well as a side effect 439 * of entering the low power state. 440 */ 441 local_paca->irq_happened &= ~PACA_IRQ_HARD_DIS; 442 irq_soft_mask_set(IRQS_ENABLED); 443 444 /* Tell the caller to enter the low power state */ 445 return true; 446 } 447 448 #ifdef CONFIG_PPC_BOOK3S 449 /* 450 * This is for idle sequences that return with IRQs off, but the 451 * idle state itself wakes on interrupt. Tell the irq tracer that 452 * IRQs are enabled for the duration of idle so it does not get long 453 * off times. Must be paired with fini_irq_for_idle_irqsoff. 454 */ 455 bool prep_irq_for_idle_irqsoff(void) 456 { 457 WARN_ON(!irqs_disabled()); 458 459 /* 460 * First we need to hard disable to ensure no interrupt 461 * occurs before we effectively enter the low power state 462 */ 463 __hard_irq_disable(); 464 local_paca->irq_happened |= PACA_IRQ_HARD_DIS; 465 466 /* 467 * If anything happened while we were soft-disabled, 468 * we return now and do not enter the low power state. 469 */ 470 if (lazy_irq_pending()) 471 return false; 472 473 /* Tell lockdep we are about to re-enable */ 474 trace_hardirqs_on(); 475 476 return true; 477 } 478 479 /* 480 * Take the SRR1 wakeup reason, index into this table to find the 481 * appropriate irq_happened bit. 482 * 483 * Sytem reset exceptions taken in idle state also come through here, 484 * but they are NMI interrupts so do not need to wait for IRQs to be 485 * restored, and should be taken as early as practical. These are marked 486 * with 0xff in the table. The Power ISA specifies 0100b as the system 487 * reset interrupt reason. 488 */ 489 #define IRQ_SYSTEM_RESET 0xff 490 491 static const u8 srr1_to_lazyirq[0x10] = { 492 0, 0, 0, 493 PACA_IRQ_DBELL, 494 IRQ_SYSTEM_RESET, 495 PACA_IRQ_DBELL, 496 PACA_IRQ_DEC, 497 0, 498 PACA_IRQ_EE, 499 PACA_IRQ_EE, 500 PACA_IRQ_HMI, 501 0, 0, 0, 0, 0 }; 502 503 void replay_system_reset(void) 504 { 505 struct pt_regs regs; 506 507 ppc_save_regs(®s); 508 regs.trap = 0x100; 509 get_paca()->in_nmi = 1; 510 system_reset_exception(®s); 511 get_paca()->in_nmi = 0; 512 } 513 EXPORT_SYMBOL_GPL(replay_system_reset); 514 515 void irq_set_pending_from_srr1(unsigned long srr1) 516 { 517 unsigned int idx = (srr1 & SRR1_WAKEMASK_P8) >> 18; 518 u8 reason = srr1_to_lazyirq[idx]; 519 520 /* 521 * Take the system reset now, which is immediately after registers 522 * are restored from idle. It's an NMI, so interrupts need not be 523 * re-enabled before it is taken. 524 */ 525 if (unlikely(reason == IRQ_SYSTEM_RESET)) { 526 replay_system_reset(); 527 return; 528 } 529 530 if (reason == PACA_IRQ_DBELL) { 531 /* 532 * When doorbell triggers a system reset wakeup, the message 533 * is not cleared, so if the doorbell interrupt is replayed 534 * and the IPI handled, the doorbell interrupt would still 535 * fire when EE is enabled. 536 * 537 * To avoid taking the superfluous doorbell interrupt, 538 * execute a msgclr here before the interrupt is replayed. 539 */ 540 ppc_msgclr(PPC_DBELL_MSGTYPE); 541 } 542 543 /* 544 * The 0 index (SRR1[42:45]=b0000) must always evaluate to 0, 545 * so this can be called unconditionally with the SRR1 wake 546 * reason as returned by the idle code, which uses 0 to mean no 547 * interrupt. 548 * 549 * If a future CPU was to designate this as an interrupt reason, 550 * then a new index for no interrupt must be assigned. 551 */ 552 local_paca->irq_happened |= reason; 553 } 554 #endif /* CONFIG_PPC_BOOK3S */ 555 556 /* 557 * Force a replay of the external interrupt handler on this CPU. 558 */ 559 void force_external_irq_replay(void) 560 { 561 /* 562 * This must only be called with interrupts soft-disabled, 563 * the replay will happen when re-enabling. 564 */ 565 WARN_ON(!arch_irqs_disabled()); 566 567 /* 568 * Interrupts must always be hard disabled before irq_happened is 569 * modified (to prevent lost update in case of interrupt between 570 * load and store). 571 */ 572 __hard_irq_disable(); 573 local_paca->irq_happened |= PACA_IRQ_HARD_DIS; 574 575 /* Indicate in the PACA that we have an interrupt to replay */ 576 local_paca->irq_happened |= PACA_IRQ_EE; 577 } 578 579 #endif /* CONFIG_PPC64 */ 580 581 int arch_show_interrupts(struct seq_file *p, int prec) 582 { 583 int j; 584 585 #if defined(CONFIG_PPC32) && defined(CONFIG_TAU_INT) 586 if (tau_initialized) { 587 seq_printf(p, "%*s: ", prec, "TAU"); 588 for_each_online_cpu(j) 589 seq_printf(p, "%10u ", tau_interrupts(j)); 590 seq_puts(p, " PowerPC Thermal Assist (cpu temp)\n"); 591 } 592 #endif /* CONFIG_PPC32 && CONFIG_TAU_INT */ 593 594 seq_printf(p, "%*s: ", prec, "LOC"); 595 for_each_online_cpu(j) 596 seq_printf(p, "%10u ", per_cpu(irq_stat, j).timer_irqs_event); 597 seq_printf(p, " Local timer interrupts for timer event device\n"); 598 599 seq_printf(p, "%*s: ", prec, "BCT"); 600 for_each_online_cpu(j) 601 seq_printf(p, "%10u ", per_cpu(irq_stat, j).broadcast_irqs_event); 602 seq_printf(p, " Broadcast timer interrupts for timer event device\n"); 603 604 seq_printf(p, "%*s: ", prec, "LOC"); 605 for_each_online_cpu(j) 606 seq_printf(p, "%10u ", per_cpu(irq_stat, j).timer_irqs_others); 607 seq_printf(p, " Local timer interrupts for others\n"); 608 609 seq_printf(p, "%*s: ", prec, "SPU"); 610 for_each_online_cpu(j) 611 seq_printf(p, "%10u ", per_cpu(irq_stat, j).spurious_irqs); 612 seq_printf(p, " Spurious interrupts\n"); 613 614 seq_printf(p, "%*s: ", prec, "PMI"); 615 for_each_online_cpu(j) 616 seq_printf(p, "%10u ", per_cpu(irq_stat, j).pmu_irqs); 617 seq_printf(p, " Performance monitoring interrupts\n"); 618 619 seq_printf(p, "%*s: ", prec, "MCE"); 620 for_each_online_cpu(j) 621 seq_printf(p, "%10u ", per_cpu(irq_stat, j).mce_exceptions); 622 seq_printf(p, " Machine check exceptions\n"); 623 624 if (cpu_has_feature(CPU_FTR_HVMODE)) { 625 seq_printf(p, "%*s: ", prec, "HMI"); 626 for_each_online_cpu(j) 627 seq_printf(p, "%10u ", 628 per_cpu(irq_stat, j).hmi_exceptions); 629 seq_printf(p, " Hypervisor Maintenance Interrupts\n"); 630 } 631 632 seq_printf(p, "%*s: ", prec, "NMI"); 633 for_each_online_cpu(j) 634 seq_printf(p, "%10u ", per_cpu(irq_stat, j).sreset_irqs); 635 seq_printf(p, " System Reset interrupts\n"); 636 637 #ifdef CONFIG_PPC_WATCHDOG 638 seq_printf(p, "%*s: ", prec, "WDG"); 639 for_each_online_cpu(j) 640 seq_printf(p, "%10u ", per_cpu(irq_stat, j).soft_nmi_irqs); 641 seq_printf(p, " Watchdog soft-NMI interrupts\n"); 642 #endif 643 644 #ifdef CONFIG_PPC_DOORBELL 645 if (cpu_has_feature(CPU_FTR_DBELL)) { 646 seq_printf(p, "%*s: ", prec, "DBL"); 647 for_each_online_cpu(j) 648 seq_printf(p, "%10u ", per_cpu(irq_stat, j).doorbell_irqs); 649 seq_printf(p, " Doorbell interrupts\n"); 650 } 651 #endif 652 653 return 0; 654 } 655 656 /* 657 * /proc/stat helpers 658 */ 659 u64 arch_irq_stat_cpu(unsigned int cpu) 660 { 661 u64 sum = per_cpu(irq_stat, cpu).timer_irqs_event; 662 663 sum += per_cpu(irq_stat, cpu).broadcast_irqs_event; 664 sum += per_cpu(irq_stat, cpu).pmu_irqs; 665 sum += per_cpu(irq_stat, cpu).mce_exceptions; 666 sum += per_cpu(irq_stat, cpu).spurious_irqs; 667 sum += per_cpu(irq_stat, cpu).timer_irqs_others; 668 sum += per_cpu(irq_stat, cpu).hmi_exceptions; 669 sum += per_cpu(irq_stat, cpu).sreset_irqs; 670 #ifdef CONFIG_PPC_WATCHDOG 671 sum += per_cpu(irq_stat, cpu).soft_nmi_irqs; 672 #endif 673 #ifdef CONFIG_PPC_DOORBELL 674 sum += per_cpu(irq_stat, cpu).doorbell_irqs; 675 #endif 676 677 return sum; 678 } 679 680 static inline void check_stack_overflow(void) 681 { 682 long sp; 683 684 if (!IS_ENABLED(CONFIG_DEBUG_STACKOVERFLOW)) 685 return; 686 687 sp = current_stack_pointer & (THREAD_SIZE - 1); 688 689 /* check for stack overflow: is there less than 2KB free? */ 690 if (unlikely(sp < 2048)) { 691 pr_err("do_IRQ: stack overflow: %ld\n", sp); 692 dump_stack(); 693 } 694 } 695 696 void __do_irq(struct pt_regs *regs) 697 { 698 unsigned int irq; 699 700 irq_enter(); 701 702 trace_irq_entry(regs); 703 704 /* 705 * Query the platform PIC for the interrupt & ack it. 706 * 707 * This will typically lower the interrupt line to the CPU 708 */ 709 irq = ppc_md.get_irq(); 710 711 /* We can hard enable interrupts now to allow perf interrupts */ 712 may_hard_irq_enable(); 713 714 /* And finally process it */ 715 if (unlikely(!irq)) 716 __this_cpu_inc(irq_stat.spurious_irqs); 717 else 718 generic_handle_irq(irq); 719 720 trace_irq_exit(regs); 721 722 irq_exit(); 723 } 724 725 void do_IRQ(struct pt_regs *regs) 726 { 727 struct pt_regs *old_regs = set_irq_regs(regs); 728 void *cursp, *irqsp, *sirqsp; 729 730 /* Switch to the irq stack to handle this */ 731 cursp = (void *)(current_stack_pointer & ~(THREAD_SIZE - 1)); 732 irqsp = hardirq_ctx[raw_smp_processor_id()]; 733 sirqsp = softirq_ctx[raw_smp_processor_id()]; 734 735 check_stack_overflow(); 736 737 /* Already there ? */ 738 if (unlikely(cursp == irqsp || cursp == sirqsp)) { 739 __do_irq(regs); 740 set_irq_regs(old_regs); 741 return; 742 } 743 /* Switch stack and call */ 744 call_do_irq(regs, irqsp); 745 746 set_irq_regs(old_regs); 747 } 748 749 static void *__init alloc_vm_stack(void) 750 { 751 return __vmalloc_node_range(THREAD_SIZE, THREAD_ALIGN, VMALLOC_START, 752 VMALLOC_END, THREADINFO_GFP, PAGE_KERNEL, 753 0, NUMA_NO_NODE, (void*)_RET_IP_); 754 } 755 756 static void __init vmap_irqstack_init(void) 757 { 758 int i; 759 760 for_each_possible_cpu(i) { 761 softirq_ctx[i] = alloc_vm_stack(); 762 hardirq_ctx[i] = alloc_vm_stack(); 763 } 764 } 765 766 767 void __init init_IRQ(void) 768 { 769 if (IS_ENABLED(CONFIG_VMAP_STACK)) 770 vmap_irqstack_init(); 771 772 if (ppc_md.init_IRQ) 773 ppc_md.init_IRQ(); 774 } 775 776 #if defined(CONFIG_BOOKE) || defined(CONFIG_40x) 777 void *critirq_ctx[NR_CPUS] __read_mostly; 778 void *dbgirq_ctx[NR_CPUS] __read_mostly; 779 void *mcheckirq_ctx[NR_CPUS] __read_mostly; 780 #endif 781 782 void *softirq_ctx[NR_CPUS] __read_mostly; 783 void *hardirq_ctx[NR_CPUS] __read_mostly; 784 785 void do_softirq_own_stack(void) 786 { 787 call_do_softirq(softirq_ctx[smp_processor_id()]); 788 } 789 790 irq_hw_number_t virq_to_hw(unsigned int virq) 791 { 792 struct irq_data *irq_data = irq_get_irq_data(virq); 793 return WARN_ON(!irq_data) ? 0 : irq_data->hwirq; 794 } 795 EXPORT_SYMBOL_GPL(virq_to_hw); 796 797 #ifdef CONFIG_SMP 798 int irq_choose_cpu(const struct cpumask *mask) 799 { 800 int cpuid; 801 802 if (cpumask_equal(mask, cpu_online_mask)) { 803 static int irq_rover; 804 static DEFINE_RAW_SPINLOCK(irq_rover_lock); 805 unsigned long flags; 806 807 /* Round-robin distribution... */ 808 do_round_robin: 809 raw_spin_lock_irqsave(&irq_rover_lock, flags); 810 811 irq_rover = cpumask_next(irq_rover, cpu_online_mask); 812 if (irq_rover >= nr_cpu_ids) 813 irq_rover = cpumask_first(cpu_online_mask); 814 815 cpuid = irq_rover; 816 817 raw_spin_unlock_irqrestore(&irq_rover_lock, flags); 818 } else { 819 cpuid = cpumask_first_and(mask, cpu_online_mask); 820 if (cpuid >= nr_cpu_ids) 821 goto do_round_robin; 822 } 823 824 return get_hard_smp_processor_id(cpuid); 825 } 826 #else 827 int irq_choose_cpu(const struct cpumask *mask) 828 { 829 return hard_smp_processor_id(); 830 } 831 #endif 832 833 #ifdef CONFIG_PPC64 834 static int __init setup_noirqdistrib(char *str) 835 { 836 distribute_irqs = 0; 837 return 1; 838 } 839 840 __setup("noirqdistrib", setup_noirqdistrib); 841 #endif /* CONFIG_PPC64 */ 842