1 /* 2 * I/O SAPIC support. 3 * 4 * Copyright (C) 1999 Intel Corp. 5 * Copyright (C) 1999 Asit Mallick <asit.k.mallick@intel.com> 6 * Copyright (C) 2000-2002 J.I. Lee <jung-ik.lee@intel.com> 7 * Copyright (C) 1999-2000, 2002-2003 Hewlett-Packard Co. 8 * David Mosberger-Tang <davidm@hpl.hp.com> 9 * Copyright (C) 1999 VA Linux Systems 10 * Copyright (C) 1999,2000 Walt Drummond <drummond@valinux.com> 11 * 12 * 00/04/19 D. Mosberger Rewritten to mirror more closely the x86 I/O 13 * APIC code. In particular, we now have separate 14 * handlers for edge and level triggered 15 * interrupts. 16 * 00/10/27 Asit Mallick, Goutham Rao <goutham.rao@intel.com> IRQ vector 17 * allocation PCI to vector mapping, shared PCI 18 * interrupts. 19 * 00/10/27 D. Mosberger Document things a bit more to make them more 20 * understandable. Clean up much of the old 21 * IOSAPIC cruft. 22 * 01/07/27 J.I. Lee PCI irq routing, Platform/Legacy interrupts 23 * and fixes for ACPI S5(SoftOff) support. 24 * 02/01/23 J.I. Lee iosapic pgm fixes for PCI irq routing from _PRT 25 * 02/01/07 E. Focht <efocht@ess.nec.de> Redirectable interrupt 26 * vectors in iosapic_set_affinity(), 27 * initializations for /proc/irq/#/smp_affinity 28 * 02/04/02 P. Diefenbaugh Cleaned up ACPI PCI IRQ routing. 29 * 02/04/18 J.I. Lee bug fix in iosapic_init_pci_irq 30 * 02/04/30 J.I. Lee bug fix in find_iosapic to fix ACPI PCI IRQ to 31 * IOSAPIC mapping error 32 * 02/07/29 T. Kochi Allocate interrupt vectors dynamically 33 * 02/08/04 T. Kochi Cleaned up terminology (irq, global system 34 * interrupt, vector, etc.) 35 * 02/09/20 D. Mosberger Simplified by taking advantage of ACPI's 36 * pci_irq code. 37 * 03/02/19 B. Helgaas Make pcat_compat system-wide, not per-IOSAPIC. 38 * Remove iosapic_address & gsi_base from 39 * external interfaces. Rationalize 40 * __init/__devinit attributes. 41 * 04/12/04 Ashok Raj <ashok.raj@intel.com> Intel Corporation 2004 42 * Updated to work with irq migration necessary 43 * for CPU Hotplug 44 */ 45 /* 46 * Here is what the interrupt logic between a PCI device and the kernel looks 47 * like: 48 * 49 * (1) A PCI device raises one of the four interrupt pins (INTA, INTB, INTC, 50 * INTD). The device is uniquely identified by its bus-, and slot-number 51 * (the function number does not matter here because all functions share 52 * the same interrupt lines). 53 * 54 * (2) The motherboard routes the interrupt line to a pin on a IOSAPIC 55 * controller. Multiple interrupt lines may have to share the same 56 * IOSAPIC pin (if they're level triggered and use the same polarity). 57 * Each interrupt line has a unique Global System Interrupt (GSI) number 58 * which can be calculated as the sum of the controller's base GSI number 59 * and the IOSAPIC pin number to which the line connects. 60 * 61 * (3) The IOSAPIC uses an internal routing table entries (RTEs) to map the 62 * IOSAPIC pin into the IA-64 interrupt vector. This interrupt vector is then 63 * sent to the CPU. 64 * 65 * (4) The kernel recognizes an interrupt as an IRQ. The IRQ interface is 66 * used as architecture-independent interrupt handling mechanism in Linux. 67 * As an IRQ is a number, we have to have 68 * IA-64 interrupt vector number <-> IRQ number mapping. On smaller 69 * systems, we use one-to-one mapping between IA-64 vector and IRQ. A 70 * platform can implement platform_irq_to_vector(irq) and 71 * platform_local_vector_to_irq(vector) APIs to differentiate the mapping. 72 * Please see also arch/ia64/include/asm/hw_irq.h for those APIs. 73 * 74 * To sum up, there are three levels of mappings involved: 75 * 76 * PCI pin -> global system interrupt (GSI) -> IA-64 vector <-> IRQ 77 * 78 * Note: The term "IRQ" is loosely used everywhere in Linux kernel to 79 * describeinterrupts. Now we use "IRQ" only for Linux IRQ's. ISA IRQ 80 * (isa_irq) is the only exception in this source code. 81 */ 82 83 #include <linux/acpi.h> 84 #include <linux/init.h> 85 #include <linux/irq.h> 86 #include <linux/kernel.h> 87 #include <linux/list.h> 88 #include <linux/pci.h> 89 #include <linux/slab.h> 90 #include <linux/smp.h> 91 #include <linux/string.h> 92 #include <linux/bootmem.h> 93 94 #include <asm/delay.h> 95 #include <asm/hw_irq.h> 96 #include <asm/io.h> 97 #include <asm/iosapic.h> 98 #include <asm/machvec.h> 99 #include <asm/processor.h> 100 #include <asm/ptrace.h> 101 #include <asm/system.h> 102 103 #undef DEBUG_INTERRUPT_ROUTING 104 105 #ifdef DEBUG_INTERRUPT_ROUTING 106 #define DBG(fmt...) printk(fmt) 107 #else 108 #define DBG(fmt...) 109 #endif 110 111 static DEFINE_SPINLOCK(iosapic_lock); 112 113 /* 114 * These tables map IA-64 vectors to the IOSAPIC pin that generates this 115 * vector. 116 */ 117 118 #define NO_REF_RTE 0 119 120 static struct iosapic { 121 char __iomem *addr; /* base address of IOSAPIC */ 122 unsigned int gsi_base; /* GSI base */ 123 unsigned short num_rte; /* # of RTEs on this IOSAPIC */ 124 int rtes_inuse; /* # of RTEs in use on this IOSAPIC */ 125 #ifdef CONFIG_NUMA 126 unsigned short node; /* numa node association via pxm */ 127 #endif 128 spinlock_t lock; /* lock for indirect reg access */ 129 } iosapic_lists[NR_IOSAPICS]; 130 131 struct iosapic_rte_info { 132 struct list_head rte_list; /* RTEs sharing the same vector */ 133 char rte_index; /* IOSAPIC RTE index */ 134 int refcnt; /* reference counter */ 135 struct iosapic *iosapic; 136 } ____cacheline_aligned; 137 138 static struct iosapic_intr_info { 139 struct list_head rtes; /* RTEs using this vector (empty => 140 * not an IOSAPIC interrupt) */ 141 int count; /* # of registered RTEs */ 142 u32 low32; /* current value of low word of 143 * Redirection table entry */ 144 unsigned int dest; /* destination CPU physical ID */ 145 unsigned char dmode : 3; /* delivery mode (see iosapic.h) */ 146 unsigned char polarity: 1; /* interrupt polarity 147 * (see iosapic.h) */ 148 unsigned char trigger : 1; /* trigger mode (see iosapic.h) */ 149 } iosapic_intr_info[NR_IRQS]; 150 151 static unsigned char pcat_compat __devinitdata; /* 8259 compatibility flag */ 152 153 static inline void 154 iosapic_write(struct iosapic *iosapic, unsigned int reg, u32 val) 155 { 156 unsigned long flags; 157 158 spin_lock_irqsave(&iosapic->lock, flags); 159 __iosapic_write(iosapic->addr, reg, val); 160 spin_unlock_irqrestore(&iosapic->lock, flags); 161 } 162 163 /* 164 * Find an IOSAPIC associated with a GSI 165 */ 166 static inline int 167 find_iosapic (unsigned int gsi) 168 { 169 int i; 170 171 for (i = 0; i < NR_IOSAPICS; i++) { 172 if ((unsigned) (gsi - iosapic_lists[i].gsi_base) < 173 iosapic_lists[i].num_rte) 174 return i; 175 } 176 177 return -1; 178 } 179 180 static inline int __gsi_to_irq(unsigned int gsi) 181 { 182 int irq; 183 struct iosapic_intr_info *info; 184 struct iosapic_rte_info *rte; 185 186 for (irq = 0; irq < NR_IRQS; irq++) { 187 info = &iosapic_intr_info[irq]; 188 list_for_each_entry(rte, &info->rtes, rte_list) 189 if (rte->iosapic->gsi_base + rte->rte_index == gsi) 190 return irq; 191 } 192 return -1; 193 } 194 195 int 196 gsi_to_irq (unsigned int gsi) 197 { 198 unsigned long flags; 199 int irq; 200 201 spin_lock_irqsave(&iosapic_lock, flags); 202 irq = __gsi_to_irq(gsi); 203 spin_unlock_irqrestore(&iosapic_lock, flags); 204 return irq; 205 } 206 207 static struct iosapic_rte_info *find_rte(unsigned int irq, unsigned int gsi) 208 { 209 struct iosapic_rte_info *rte; 210 211 list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list) 212 if (rte->iosapic->gsi_base + rte->rte_index == gsi) 213 return rte; 214 return NULL; 215 } 216 217 static void 218 set_rte (unsigned int gsi, unsigned int irq, unsigned int dest, int mask) 219 { 220 unsigned long pol, trigger, dmode; 221 u32 low32, high32; 222 int rte_index; 223 char redir; 224 struct iosapic_rte_info *rte; 225 ia64_vector vector = irq_to_vector(irq); 226 227 DBG(KERN_DEBUG"IOSAPIC: routing vector %d to 0x%x\n", vector, dest); 228 229 rte = find_rte(irq, gsi); 230 if (!rte) 231 return; /* not an IOSAPIC interrupt */ 232 233 rte_index = rte->rte_index; 234 pol = iosapic_intr_info[irq].polarity; 235 trigger = iosapic_intr_info[irq].trigger; 236 dmode = iosapic_intr_info[irq].dmode; 237 238 redir = (dmode == IOSAPIC_LOWEST_PRIORITY) ? 1 : 0; 239 240 #ifdef CONFIG_SMP 241 set_irq_affinity_info(irq, (int)(dest & 0xffff), redir); 242 #endif 243 244 low32 = ((pol << IOSAPIC_POLARITY_SHIFT) | 245 (trigger << IOSAPIC_TRIGGER_SHIFT) | 246 (dmode << IOSAPIC_DELIVERY_SHIFT) | 247 ((mask ? 1 : 0) << IOSAPIC_MASK_SHIFT) | 248 vector); 249 250 /* dest contains both id and eid */ 251 high32 = (dest << IOSAPIC_DEST_SHIFT); 252 253 iosapic_write(rte->iosapic, IOSAPIC_RTE_HIGH(rte_index), high32); 254 iosapic_write(rte->iosapic, IOSAPIC_RTE_LOW(rte_index), low32); 255 iosapic_intr_info[irq].low32 = low32; 256 iosapic_intr_info[irq].dest = dest; 257 } 258 259 static void 260 nop (unsigned int irq) 261 { 262 /* do nothing... */ 263 } 264 265 266 #ifdef CONFIG_KEXEC 267 void 268 kexec_disable_iosapic(void) 269 { 270 struct iosapic_intr_info *info; 271 struct iosapic_rte_info *rte; 272 ia64_vector vec; 273 int irq; 274 275 for (irq = 0; irq < NR_IRQS; irq++) { 276 info = &iosapic_intr_info[irq]; 277 vec = irq_to_vector(irq); 278 list_for_each_entry(rte, &info->rtes, 279 rte_list) { 280 iosapic_write(rte->iosapic, 281 IOSAPIC_RTE_LOW(rte->rte_index), 282 IOSAPIC_MASK|vec); 283 iosapic_eoi(rte->iosapic->addr, vec); 284 } 285 } 286 } 287 #endif 288 289 static void 290 mask_irq (unsigned int irq) 291 { 292 u32 low32; 293 int rte_index; 294 struct iosapic_rte_info *rte; 295 296 if (!iosapic_intr_info[irq].count) 297 return; /* not an IOSAPIC interrupt! */ 298 299 /* set only the mask bit */ 300 low32 = iosapic_intr_info[irq].low32 |= IOSAPIC_MASK; 301 list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list) { 302 rte_index = rte->rte_index; 303 iosapic_write(rte->iosapic, IOSAPIC_RTE_LOW(rte_index), low32); 304 } 305 } 306 307 static void 308 unmask_irq (unsigned int irq) 309 { 310 u32 low32; 311 int rte_index; 312 struct iosapic_rte_info *rte; 313 314 if (!iosapic_intr_info[irq].count) 315 return; /* not an IOSAPIC interrupt! */ 316 317 low32 = iosapic_intr_info[irq].low32 &= ~IOSAPIC_MASK; 318 list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list) { 319 rte_index = rte->rte_index; 320 iosapic_write(rte->iosapic, IOSAPIC_RTE_LOW(rte_index), low32); 321 } 322 } 323 324 325 static int 326 iosapic_set_affinity(unsigned int irq, const struct cpumask *mask) 327 { 328 #ifdef CONFIG_SMP 329 u32 high32, low32; 330 int cpu, dest, rte_index; 331 int redir = (irq & IA64_IRQ_REDIRECTED) ? 1 : 0; 332 struct iosapic_rte_info *rte; 333 struct iosapic *iosapic; 334 335 irq &= (~IA64_IRQ_REDIRECTED); 336 337 cpu = cpumask_first_and(cpu_online_mask, mask); 338 if (cpu >= nr_cpu_ids) 339 return -1; 340 341 if (irq_prepare_move(irq, cpu)) 342 return -1; 343 344 dest = cpu_physical_id(cpu); 345 346 if (!iosapic_intr_info[irq].count) 347 return -1; /* not an IOSAPIC interrupt */ 348 349 set_irq_affinity_info(irq, dest, redir); 350 351 /* dest contains both id and eid */ 352 high32 = dest << IOSAPIC_DEST_SHIFT; 353 354 low32 = iosapic_intr_info[irq].low32 & ~(7 << IOSAPIC_DELIVERY_SHIFT); 355 if (redir) 356 /* change delivery mode to lowest priority */ 357 low32 |= (IOSAPIC_LOWEST_PRIORITY << IOSAPIC_DELIVERY_SHIFT); 358 else 359 /* change delivery mode to fixed */ 360 low32 |= (IOSAPIC_FIXED << IOSAPIC_DELIVERY_SHIFT); 361 low32 &= IOSAPIC_VECTOR_MASK; 362 low32 |= irq_to_vector(irq); 363 364 iosapic_intr_info[irq].low32 = low32; 365 iosapic_intr_info[irq].dest = dest; 366 list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list) { 367 iosapic = rte->iosapic; 368 rte_index = rte->rte_index; 369 iosapic_write(iosapic, IOSAPIC_RTE_HIGH(rte_index), high32); 370 iosapic_write(iosapic, IOSAPIC_RTE_LOW(rte_index), low32); 371 } 372 373 #endif 374 return 0; 375 } 376 377 /* 378 * Handlers for level-triggered interrupts. 379 */ 380 381 static unsigned int 382 iosapic_startup_level_irq (unsigned int irq) 383 { 384 unmask_irq(irq); 385 return 0; 386 } 387 388 static void 389 iosapic_unmask_level_irq (unsigned int irq) 390 { 391 ia64_vector vec = irq_to_vector(irq); 392 struct iosapic_rte_info *rte; 393 int do_unmask_irq = 0; 394 395 irq_complete_move(irq); 396 if (unlikely(irq_desc[irq].status & IRQ_MOVE_PENDING)) { 397 do_unmask_irq = 1; 398 mask_irq(irq); 399 } else 400 unmask_irq(irq); 401 402 list_for_each_entry(rte, &iosapic_intr_info[irq].rtes, rte_list) 403 iosapic_eoi(rte->iosapic->addr, vec); 404 405 if (unlikely(do_unmask_irq)) { 406 move_masked_irq(irq); 407 unmask_irq(irq); 408 } 409 } 410 411 #define iosapic_shutdown_level_irq mask_irq 412 #define iosapic_enable_level_irq unmask_irq 413 #define iosapic_disable_level_irq mask_irq 414 #define iosapic_ack_level_irq nop 415 416 static struct irq_chip irq_type_iosapic_level = { 417 .name = "IO-SAPIC-level", 418 .startup = iosapic_startup_level_irq, 419 .shutdown = iosapic_shutdown_level_irq, 420 .enable = iosapic_enable_level_irq, 421 .disable = iosapic_disable_level_irq, 422 .ack = iosapic_ack_level_irq, 423 .mask = mask_irq, 424 .unmask = iosapic_unmask_level_irq, 425 .set_affinity = iosapic_set_affinity 426 }; 427 428 /* 429 * Handlers for edge-triggered interrupts. 430 */ 431 432 static unsigned int 433 iosapic_startup_edge_irq (unsigned int irq) 434 { 435 unmask_irq(irq); 436 /* 437 * IOSAPIC simply drops interrupts pended while the 438 * corresponding pin was masked, so we can't know if an 439 * interrupt is pending already. Let's hope not... 440 */ 441 return 0; 442 } 443 444 static void 445 iosapic_ack_edge_irq (unsigned int irq) 446 { 447 struct irq_desc *idesc = irq_desc + irq; 448 449 irq_complete_move(irq); 450 move_native_irq(irq); 451 /* 452 * Once we have recorded IRQ_PENDING already, we can mask the 453 * interrupt for real. This prevents IRQ storms from unhandled 454 * devices. 455 */ 456 if ((idesc->status & (IRQ_PENDING|IRQ_DISABLED)) == 457 (IRQ_PENDING|IRQ_DISABLED)) 458 mask_irq(irq); 459 } 460 461 #define iosapic_enable_edge_irq unmask_irq 462 #define iosapic_disable_edge_irq nop 463 #define iosapic_end_edge_irq nop 464 465 static struct irq_chip irq_type_iosapic_edge = { 466 .name = "IO-SAPIC-edge", 467 .startup = iosapic_startup_edge_irq, 468 .shutdown = iosapic_disable_edge_irq, 469 .enable = iosapic_enable_edge_irq, 470 .disable = iosapic_disable_edge_irq, 471 .ack = iosapic_ack_edge_irq, 472 .end = iosapic_end_edge_irq, 473 .mask = mask_irq, 474 .unmask = unmask_irq, 475 .set_affinity = iosapic_set_affinity 476 }; 477 478 static unsigned int 479 iosapic_version (char __iomem *addr) 480 { 481 /* 482 * IOSAPIC Version Register return 32 bit structure like: 483 * { 484 * unsigned int version : 8; 485 * unsigned int reserved1 : 8; 486 * unsigned int max_redir : 8; 487 * unsigned int reserved2 : 8; 488 * } 489 */ 490 return __iosapic_read(addr, IOSAPIC_VERSION); 491 } 492 493 static int iosapic_find_sharable_irq(unsigned long trigger, unsigned long pol) 494 { 495 int i, irq = -ENOSPC, min_count = -1; 496 struct iosapic_intr_info *info; 497 498 /* 499 * shared vectors for edge-triggered interrupts are not 500 * supported yet 501 */ 502 if (trigger == IOSAPIC_EDGE) 503 return -EINVAL; 504 505 for (i = 0; i < NR_IRQS; i++) { 506 info = &iosapic_intr_info[i]; 507 if (info->trigger == trigger && info->polarity == pol && 508 (info->dmode == IOSAPIC_FIXED || 509 info->dmode == IOSAPIC_LOWEST_PRIORITY) && 510 can_request_irq(i, IRQF_SHARED)) { 511 if (min_count == -1 || info->count < min_count) { 512 irq = i; 513 min_count = info->count; 514 } 515 } 516 } 517 return irq; 518 } 519 520 /* 521 * if the given vector is already owned by other, 522 * assign a new vector for the other and make the vector available 523 */ 524 static void __init 525 iosapic_reassign_vector (int irq) 526 { 527 int new_irq; 528 529 if (iosapic_intr_info[irq].count) { 530 new_irq = create_irq(); 531 if (new_irq < 0) 532 panic("%s: out of interrupt vectors!\n", __func__); 533 printk(KERN_INFO "Reassigning vector %d to %d\n", 534 irq_to_vector(irq), irq_to_vector(new_irq)); 535 memcpy(&iosapic_intr_info[new_irq], &iosapic_intr_info[irq], 536 sizeof(struct iosapic_intr_info)); 537 INIT_LIST_HEAD(&iosapic_intr_info[new_irq].rtes); 538 list_move(iosapic_intr_info[irq].rtes.next, 539 &iosapic_intr_info[new_irq].rtes); 540 memset(&iosapic_intr_info[irq], 0, 541 sizeof(struct iosapic_intr_info)); 542 iosapic_intr_info[irq].low32 = IOSAPIC_MASK; 543 INIT_LIST_HEAD(&iosapic_intr_info[irq].rtes); 544 } 545 } 546 547 static inline int irq_is_shared (int irq) 548 { 549 return (iosapic_intr_info[irq].count > 1); 550 } 551 552 struct irq_chip* 553 ia64_native_iosapic_get_irq_chip(unsigned long trigger) 554 { 555 if (trigger == IOSAPIC_EDGE) 556 return &irq_type_iosapic_edge; 557 else 558 return &irq_type_iosapic_level; 559 } 560 561 static int 562 register_intr (unsigned int gsi, int irq, unsigned char delivery, 563 unsigned long polarity, unsigned long trigger) 564 { 565 struct irq_desc *idesc; 566 struct irq_chip *irq_type; 567 int index; 568 struct iosapic_rte_info *rte; 569 570 index = find_iosapic(gsi); 571 if (index < 0) { 572 printk(KERN_WARNING "%s: No IOSAPIC for GSI %u\n", 573 __func__, gsi); 574 return -ENODEV; 575 } 576 577 rte = find_rte(irq, gsi); 578 if (!rte) { 579 rte = kzalloc(sizeof (*rte), GFP_ATOMIC); 580 if (!rte) { 581 printk(KERN_WARNING "%s: cannot allocate memory\n", 582 __func__); 583 return -ENOMEM; 584 } 585 586 rte->iosapic = &iosapic_lists[index]; 587 rte->rte_index = gsi - rte->iosapic->gsi_base; 588 rte->refcnt++; 589 list_add_tail(&rte->rte_list, &iosapic_intr_info[irq].rtes); 590 iosapic_intr_info[irq].count++; 591 iosapic_lists[index].rtes_inuse++; 592 } 593 else if (rte->refcnt == NO_REF_RTE) { 594 struct iosapic_intr_info *info = &iosapic_intr_info[irq]; 595 if (info->count > 0 && 596 (info->trigger != trigger || info->polarity != polarity)){ 597 printk (KERN_WARNING 598 "%s: cannot override the interrupt\n", 599 __func__); 600 return -EINVAL; 601 } 602 rte->refcnt++; 603 iosapic_intr_info[irq].count++; 604 iosapic_lists[index].rtes_inuse++; 605 } 606 607 iosapic_intr_info[irq].polarity = polarity; 608 iosapic_intr_info[irq].dmode = delivery; 609 iosapic_intr_info[irq].trigger = trigger; 610 611 irq_type = iosapic_get_irq_chip(trigger); 612 613 idesc = irq_desc + irq; 614 if (irq_type != NULL && idesc->chip != irq_type) { 615 if (idesc->chip != &no_irq_chip) 616 printk(KERN_WARNING 617 "%s: changing vector %d from %s to %s\n", 618 __func__, irq_to_vector(irq), 619 idesc->chip->name, irq_type->name); 620 idesc->chip = irq_type; 621 } 622 if (trigger == IOSAPIC_EDGE) 623 __set_irq_handler_unlocked(irq, handle_edge_irq); 624 else 625 __set_irq_handler_unlocked(irq, handle_level_irq); 626 return 0; 627 } 628 629 static unsigned int 630 get_target_cpu (unsigned int gsi, int irq) 631 { 632 #ifdef CONFIG_SMP 633 static int cpu = -1; 634 extern int cpe_vector; 635 cpumask_t domain = irq_to_domain(irq); 636 637 /* 638 * In case of vector shared by multiple RTEs, all RTEs that 639 * share the vector need to use the same destination CPU. 640 */ 641 if (iosapic_intr_info[irq].count) 642 return iosapic_intr_info[irq].dest; 643 644 /* 645 * If the platform supports redirection via XTP, let it 646 * distribute interrupts. 647 */ 648 if (smp_int_redirect & SMP_IRQ_REDIRECTION) 649 return cpu_physical_id(smp_processor_id()); 650 651 /* 652 * Some interrupts (ACPI SCI, for instance) are registered 653 * before the BSP is marked as online. 654 */ 655 if (!cpu_online(smp_processor_id())) 656 return cpu_physical_id(smp_processor_id()); 657 658 #ifdef CONFIG_ACPI 659 if (cpe_vector > 0 && irq_to_vector(irq) == IA64_CPEP_VECTOR) 660 return get_cpei_target_cpu(); 661 #endif 662 663 #ifdef CONFIG_NUMA 664 { 665 int num_cpus, cpu_index, iosapic_index, numa_cpu, i = 0; 666 const struct cpumask *cpu_mask; 667 668 iosapic_index = find_iosapic(gsi); 669 if (iosapic_index < 0 || 670 iosapic_lists[iosapic_index].node == MAX_NUMNODES) 671 goto skip_numa_setup; 672 673 cpu_mask = cpumask_of_node(iosapic_lists[iosapic_index].node); 674 num_cpus = 0; 675 for_each_cpu_and(numa_cpu, cpu_mask, &domain) { 676 if (cpu_online(numa_cpu)) 677 num_cpus++; 678 } 679 680 if (!num_cpus) 681 goto skip_numa_setup; 682 683 /* Use irq assignment to distribute across cpus in node */ 684 cpu_index = irq % num_cpus; 685 686 for_each_cpu_and(numa_cpu, cpu_mask, &domain) 687 if (cpu_online(numa_cpu) && i++ >= cpu_index) 688 break; 689 690 if (numa_cpu < nr_cpu_ids) 691 return cpu_physical_id(numa_cpu); 692 } 693 skip_numa_setup: 694 #endif 695 /* 696 * Otherwise, round-robin interrupt vectors across all the 697 * processors. (It'd be nice if we could be smarter in the 698 * case of NUMA.) 699 */ 700 do { 701 if (++cpu >= nr_cpu_ids) 702 cpu = 0; 703 } while (!cpu_online(cpu) || !cpu_isset(cpu, domain)); 704 705 return cpu_physical_id(cpu); 706 #else /* CONFIG_SMP */ 707 return cpu_physical_id(smp_processor_id()); 708 #endif 709 } 710 711 static inline unsigned char choose_dmode(void) 712 { 713 #ifdef CONFIG_SMP 714 if (smp_int_redirect & SMP_IRQ_REDIRECTION) 715 return IOSAPIC_LOWEST_PRIORITY; 716 #endif 717 return IOSAPIC_FIXED; 718 } 719 720 /* 721 * ACPI can describe IOSAPIC interrupts via static tables and namespace 722 * methods. This provides an interface to register those interrupts and 723 * program the IOSAPIC RTE. 724 */ 725 int 726 iosapic_register_intr (unsigned int gsi, 727 unsigned long polarity, unsigned long trigger) 728 { 729 int irq, mask = 1, err; 730 unsigned int dest; 731 unsigned long flags; 732 struct iosapic_rte_info *rte; 733 u32 low32; 734 unsigned char dmode; 735 736 /* 737 * If this GSI has already been registered (i.e., it's a 738 * shared interrupt, or we lost a race to register it), 739 * don't touch the RTE. 740 */ 741 spin_lock_irqsave(&iosapic_lock, flags); 742 irq = __gsi_to_irq(gsi); 743 if (irq > 0) { 744 rte = find_rte(irq, gsi); 745 if(iosapic_intr_info[irq].count == 0) { 746 assign_irq_vector(irq); 747 dynamic_irq_init(irq); 748 } else if (rte->refcnt != NO_REF_RTE) { 749 rte->refcnt++; 750 goto unlock_iosapic_lock; 751 } 752 } else 753 irq = create_irq(); 754 755 /* If vector is running out, we try to find a sharable vector */ 756 if (irq < 0) { 757 irq = iosapic_find_sharable_irq(trigger, polarity); 758 if (irq < 0) 759 goto unlock_iosapic_lock; 760 } 761 762 raw_spin_lock(&irq_desc[irq].lock); 763 dest = get_target_cpu(gsi, irq); 764 dmode = choose_dmode(); 765 err = register_intr(gsi, irq, dmode, polarity, trigger); 766 if (err < 0) { 767 raw_spin_unlock(&irq_desc[irq].lock); 768 irq = err; 769 goto unlock_iosapic_lock; 770 } 771 772 /* 773 * If the vector is shared and already unmasked for other 774 * interrupt sources, don't mask it. 775 */ 776 low32 = iosapic_intr_info[irq].low32; 777 if (irq_is_shared(irq) && !(low32 & IOSAPIC_MASK)) 778 mask = 0; 779 set_rte(gsi, irq, dest, mask); 780 781 printk(KERN_INFO "GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d\n", 782 gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"), 783 (polarity == IOSAPIC_POL_HIGH ? "high" : "low"), 784 cpu_logical_id(dest), dest, irq_to_vector(irq)); 785 786 raw_spin_unlock(&irq_desc[irq].lock); 787 unlock_iosapic_lock: 788 spin_unlock_irqrestore(&iosapic_lock, flags); 789 return irq; 790 } 791 792 void 793 iosapic_unregister_intr (unsigned int gsi) 794 { 795 unsigned long flags; 796 int irq, index; 797 struct irq_desc *idesc; 798 u32 low32; 799 unsigned long trigger, polarity; 800 unsigned int dest; 801 struct iosapic_rte_info *rte; 802 803 /* 804 * If the irq associated with the gsi is not found, 805 * iosapic_unregister_intr() is unbalanced. We need to check 806 * this again after getting locks. 807 */ 808 irq = gsi_to_irq(gsi); 809 if (irq < 0) { 810 printk(KERN_ERR "iosapic_unregister_intr(%u) unbalanced\n", 811 gsi); 812 WARN_ON(1); 813 return; 814 } 815 816 spin_lock_irqsave(&iosapic_lock, flags); 817 if ((rte = find_rte(irq, gsi)) == NULL) { 818 printk(KERN_ERR "iosapic_unregister_intr(%u) unbalanced\n", 819 gsi); 820 WARN_ON(1); 821 goto out; 822 } 823 824 if (--rte->refcnt > 0) 825 goto out; 826 827 idesc = irq_desc + irq; 828 rte->refcnt = NO_REF_RTE; 829 830 /* Mask the interrupt */ 831 low32 = iosapic_intr_info[irq].low32 | IOSAPIC_MASK; 832 iosapic_write(rte->iosapic, IOSAPIC_RTE_LOW(rte->rte_index), low32); 833 834 iosapic_intr_info[irq].count--; 835 index = find_iosapic(gsi); 836 iosapic_lists[index].rtes_inuse--; 837 WARN_ON(iosapic_lists[index].rtes_inuse < 0); 838 839 trigger = iosapic_intr_info[irq].trigger; 840 polarity = iosapic_intr_info[irq].polarity; 841 dest = iosapic_intr_info[irq].dest; 842 printk(KERN_INFO 843 "GSI %u (%s, %s) -> CPU %d (0x%04x) vector %d unregistered\n", 844 gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"), 845 (polarity == IOSAPIC_POL_HIGH ? "high" : "low"), 846 cpu_logical_id(dest), dest, irq_to_vector(irq)); 847 848 if (iosapic_intr_info[irq].count == 0) { 849 #ifdef CONFIG_SMP 850 /* Clear affinity */ 851 cpumask_setall(idesc->affinity); 852 #endif 853 /* Clear the interrupt information */ 854 iosapic_intr_info[irq].dest = 0; 855 iosapic_intr_info[irq].dmode = 0; 856 iosapic_intr_info[irq].polarity = 0; 857 iosapic_intr_info[irq].trigger = 0; 858 iosapic_intr_info[irq].low32 |= IOSAPIC_MASK; 859 860 /* Destroy and reserve IRQ */ 861 destroy_and_reserve_irq(irq); 862 } 863 out: 864 spin_unlock_irqrestore(&iosapic_lock, flags); 865 } 866 867 /* 868 * ACPI calls this when it finds an entry for a platform interrupt. 869 */ 870 int __init 871 iosapic_register_platform_intr (u32 int_type, unsigned int gsi, 872 int iosapic_vector, u16 eid, u16 id, 873 unsigned long polarity, unsigned long trigger) 874 { 875 static const char * const name[] = {"unknown", "PMI", "INIT", "CPEI"}; 876 unsigned char delivery; 877 int irq, vector, mask = 0; 878 unsigned int dest = ((id << 8) | eid) & 0xffff; 879 880 switch (int_type) { 881 case ACPI_INTERRUPT_PMI: 882 irq = vector = iosapic_vector; 883 bind_irq_vector(irq, vector, CPU_MASK_ALL); 884 /* 885 * since PMI vector is alloc'd by FW(ACPI) not by kernel, 886 * we need to make sure the vector is available 887 */ 888 iosapic_reassign_vector(irq); 889 delivery = IOSAPIC_PMI; 890 break; 891 case ACPI_INTERRUPT_INIT: 892 irq = create_irq(); 893 if (irq < 0) 894 panic("%s: out of interrupt vectors!\n", __func__); 895 vector = irq_to_vector(irq); 896 delivery = IOSAPIC_INIT; 897 break; 898 case ACPI_INTERRUPT_CPEI: 899 irq = vector = IA64_CPE_VECTOR; 900 BUG_ON(bind_irq_vector(irq, vector, CPU_MASK_ALL)); 901 delivery = IOSAPIC_FIXED; 902 mask = 1; 903 break; 904 default: 905 printk(KERN_ERR "%s: invalid int type 0x%x\n", __func__, 906 int_type); 907 return -1; 908 } 909 910 register_intr(gsi, irq, delivery, polarity, trigger); 911 912 printk(KERN_INFO 913 "PLATFORM int %s (0x%x): GSI %u (%s, %s) -> CPU %d (0x%04x)" 914 " vector %d\n", 915 int_type < ARRAY_SIZE(name) ? name[int_type] : "unknown", 916 int_type, gsi, (trigger == IOSAPIC_EDGE ? "edge" : "level"), 917 (polarity == IOSAPIC_POL_HIGH ? "high" : "low"), 918 cpu_logical_id(dest), dest, vector); 919 920 set_rte(gsi, irq, dest, mask); 921 return vector; 922 } 923 924 /* 925 * ACPI calls this when it finds an entry for a legacy ISA IRQ override. 926 */ 927 void __devinit 928 iosapic_override_isa_irq (unsigned int isa_irq, unsigned int gsi, 929 unsigned long polarity, 930 unsigned long trigger) 931 { 932 int vector, irq; 933 unsigned int dest = cpu_physical_id(smp_processor_id()); 934 unsigned char dmode; 935 936 irq = vector = isa_irq_to_vector(isa_irq); 937 BUG_ON(bind_irq_vector(irq, vector, CPU_MASK_ALL)); 938 dmode = choose_dmode(); 939 register_intr(gsi, irq, dmode, polarity, trigger); 940 941 DBG("ISA: IRQ %u -> GSI %u (%s,%s) -> CPU %d (0x%04x) vector %d\n", 942 isa_irq, gsi, trigger == IOSAPIC_EDGE ? "edge" : "level", 943 polarity == IOSAPIC_POL_HIGH ? "high" : "low", 944 cpu_logical_id(dest), dest, vector); 945 946 set_rte(gsi, irq, dest, 1); 947 } 948 949 void __init 950 ia64_native_iosapic_pcat_compat_init(void) 951 { 952 if (pcat_compat) { 953 /* 954 * Disable the compatibility mode interrupts (8259 style), 955 * needs IN/OUT support enabled. 956 */ 957 printk(KERN_INFO 958 "%s: Disabling PC-AT compatible 8259 interrupts\n", 959 __func__); 960 outb(0xff, 0xA1); 961 outb(0xff, 0x21); 962 } 963 } 964 965 void __init 966 iosapic_system_init (int system_pcat_compat) 967 { 968 int irq; 969 970 for (irq = 0; irq < NR_IRQS; ++irq) { 971 iosapic_intr_info[irq].low32 = IOSAPIC_MASK; 972 /* mark as unused */ 973 INIT_LIST_HEAD(&iosapic_intr_info[irq].rtes); 974 975 iosapic_intr_info[irq].count = 0; 976 } 977 978 pcat_compat = system_pcat_compat; 979 if (pcat_compat) 980 iosapic_pcat_compat_init(); 981 } 982 983 static inline int 984 iosapic_alloc (void) 985 { 986 int index; 987 988 for (index = 0; index < NR_IOSAPICS; index++) 989 if (!iosapic_lists[index].addr) 990 return index; 991 992 printk(KERN_WARNING "%s: failed to allocate iosapic\n", __func__); 993 return -1; 994 } 995 996 static inline void 997 iosapic_free (int index) 998 { 999 memset(&iosapic_lists[index], 0, sizeof(iosapic_lists[0])); 1000 } 1001 1002 static inline int 1003 iosapic_check_gsi_range (unsigned int gsi_base, unsigned int ver) 1004 { 1005 int index; 1006 unsigned int gsi_end, base, end; 1007 1008 /* check gsi range */ 1009 gsi_end = gsi_base + ((ver >> 16) & 0xff); 1010 for (index = 0; index < NR_IOSAPICS; index++) { 1011 if (!iosapic_lists[index].addr) 1012 continue; 1013 1014 base = iosapic_lists[index].gsi_base; 1015 end = base + iosapic_lists[index].num_rte - 1; 1016 1017 if (gsi_end < base || end < gsi_base) 1018 continue; /* OK */ 1019 1020 return -EBUSY; 1021 } 1022 return 0; 1023 } 1024 1025 int __devinit 1026 iosapic_init (unsigned long phys_addr, unsigned int gsi_base) 1027 { 1028 int num_rte, err, index; 1029 unsigned int isa_irq, ver; 1030 char __iomem *addr; 1031 unsigned long flags; 1032 1033 spin_lock_irqsave(&iosapic_lock, flags); 1034 index = find_iosapic(gsi_base); 1035 if (index >= 0) { 1036 spin_unlock_irqrestore(&iosapic_lock, flags); 1037 return -EBUSY; 1038 } 1039 1040 addr = ioremap(phys_addr, 0); 1041 if (addr == NULL) { 1042 spin_unlock_irqrestore(&iosapic_lock, flags); 1043 return -ENOMEM; 1044 } 1045 ver = iosapic_version(addr); 1046 if ((err = iosapic_check_gsi_range(gsi_base, ver))) { 1047 iounmap(addr); 1048 spin_unlock_irqrestore(&iosapic_lock, flags); 1049 return err; 1050 } 1051 1052 /* 1053 * The MAX_REDIR register holds the highest input pin number 1054 * (starting from 0). We add 1 so that we can use it for 1055 * number of pins (= RTEs) 1056 */ 1057 num_rte = ((ver >> 16) & 0xff) + 1; 1058 1059 index = iosapic_alloc(); 1060 iosapic_lists[index].addr = addr; 1061 iosapic_lists[index].gsi_base = gsi_base; 1062 iosapic_lists[index].num_rte = num_rte; 1063 #ifdef CONFIG_NUMA 1064 iosapic_lists[index].node = MAX_NUMNODES; 1065 #endif 1066 spin_lock_init(&iosapic_lists[index].lock); 1067 spin_unlock_irqrestore(&iosapic_lock, flags); 1068 1069 if ((gsi_base == 0) && pcat_compat) { 1070 /* 1071 * Map the legacy ISA devices into the IOSAPIC data. Some of 1072 * these may get reprogrammed later on with data from the ACPI 1073 * Interrupt Source Override table. 1074 */ 1075 for (isa_irq = 0; isa_irq < 16; ++isa_irq) 1076 iosapic_override_isa_irq(isa_irq, isa_irq, 1077 IOSAPIC_POL_HIGH, 1078 IOSAPIC_EDGE); 1079 } 1080 return 0; 1081 } 1082 1083 #ifdef CONFIG_HOTPLUG 1084 int 1085 iosapic_remove (unsigned int gsi_base) 1086 { 1087 int index, err = 0; 1088 unsigned long flags; 1089 1090 spin_lock_irqsave(&iosapic_lock, flags); 1091 index = find_iosapic(gsi_base); 1092 if (index < 0) { 1093 printk(KERN_WARNING "%s: No IOSAPIC for GSI base %u\n", 1094 __func__, gsi_base); 1095 goto out; 1096 } 1097 1098 if (iosapic_lists[index].rtes_inuse) { 1099 err = -EBUSY; 1100 printk(KERN_WARNING "%s: IOSAPIC for GSI base %u is busy\n", 1101 __func__, gsi_base); 1102 goto out; 1103 } 1104 1105 iounmap(iosapic_lists[index].addr); 1106 iosapic_free(index); 1107 out: 1108 spin_unlock_irqrestore(&iosapic_lock, flags); 1109 return err; 1110 } 1111 #endif /* CONFIG_HOTPLUG */ 1112 1113 #ifdef CONFIG_NUMA 1114 void __devinit 1115 map_iosapic_to_node(unsigned int gsi_base, int node) 1116 { 1117 int index; 1118 1119 index = find_iosapic(gsi_base); 1120 if (index < 0) { 1121 printk(KERN_WARNING "%s: No IOSAPIC for GSI %u\n", 1122 __func__, gsi_base); 1123 return; 1124 } 1125 iosapic_lists[index].node = node; 1126 return; 1127 } 1128 #endif 1129