1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Xen event channels 4 * 5 * Xen models interrupts with abstract event channels. Because each 6 * domain gets 1024 event channels, but NR_IRQ is not that large, we 7 * must dynamically map irqs<->event channels. The event channels 8 * interface with the rest of the kernel by defining a xen interrupt 9 * chip. When an event is received, it is mapped to an irq and sent 10 * through the normal interrupt processing path. 11 * 12 * There are four kinds of events which can be mapped to an event 13 * channel: 14 * 15 * 1. Inter-domain notifications. This includes all the virtual 16 * device events, since they're driven by front-ends in another domain 17 * (typically dom0). 18 * 2. VIRQs, typically used for timers. These are per-cpu events. 19 * 3. IPIs. 20 * 4. PIRQs - Hardware interrupts. 21 * 22 * Jeremy Fitzhardinge <jeremy@xensource.com>, XenSource Inc, 2007 23 */ 24 25 #define pr_fmt(fmt) "xen:" KBUILD_MODNAME ": " fmt 26 27 #include <linux/linkage.h> 28 #include <linux/interrupt.h> 29 #include <linux/irq.h> 30 #include <linux/moduleparam.h> 31 #include <linux/string.h> 32 #include <linux/memblock.h> 33 #include <linux/slab.h> 34 #include <linux/irqnr.h> 35 #include <linux/pci.h> 36 37 #ifdef CONFIG_X86 38 #include <asm/desc.h> 39 #include <asm/ptrace.h> 40 #include <asm/idtentry.h> 41 #include <asm/irq.h> 42 #include <asm/io_apic.h> 43 #include <asm/i8259.h> 44 #include <asm/xen/pci.h> 45 #endif 46 #include <asm/sync_bitops.h> 47 #include <asm/xen/hypercall.h> 48 #include <asm/xen/hypervisor.h> 49 #include <xen/page.h> 50 51 #include <xen/xen.h> 52 #include <xen/hvm.h> 53 #include <xen/xen-ops.h> 54 #include <xen/events.h> 55 #include <xen/interface/xen.h> 56 #include <xen/interface/event_channel.h> 57 #include <xen/interface/hvm/hvm_op.h> 58 #include <xen/interface/hvm/params.h> 59 #include <xen/interface/physdev.h> 60 #include <xen/interface/sched.h> 61 #include <xen/interface/vcpu.h> 62 #include <asm/hw_irq.h> 63 64 #include "events_internal.h" 65 66 const struct evtchn_ops *evtchn_ops; 67 68 /* 69 * This lock protects updates to the following mapping and reference-count 70 * arrays. The lock does not need to be acquired to read the mapping tables. 71 */ 72 static DEFINE_MUTEX(irq_mapping_update_lock); 73 74 static LIST_HEAD(xen_irq_list_head); 75 76 /* IRQ <-> VIRQ mapping. */ 77 static DEFINE_PER_CPU(int [NR_VIRQS], virq_to_irq) = {[0 ... NR_VIRQS-1] = -1}; 78 79 /* IRQ <-> IPI mapping */ 80 static DEFINE_PER_CPU(int [XEN_NR_IPIS], ipi_to_irq) = {[0 ... XEN_NR_IPIS-1] = -1}; 81 82 int **evtchn_to_irq; 83 #ifdef CONFIG_X86 84 static unsigned long *pirq_eoi_map; 85 #endif 86 static bool (*pirq_needs_eoi)(unsigned irq); 87 88 #define EVTCHN_ROW(e) (e / (PAGE_SIZE/sizeof(**evtchn_to_irq))) 89 #define EVTCHN_COL(e) (e % (PAGE_SIZE/sizeof(**evtchn_to_irq))) 90 #define EVTCHN_PER_ROW (PAGE_SIZE / sizeof(**evtchn_to_irq)) 91 92 /* Xen will never allocate port zero for any purpose. */ 93 #define VALID_EVTCHN(chn) ((chn) != 0) 94 95 static struct irq_chip xen_dynamic_chip; 96 static struct irq_chip xen_percpu_chip; 97 static struct irq_chip xen_pirq_chip; 98 static void enable_dynirq(struct irq_data *data); 99 static void disable_dynirq(struct irq_data *data); 100 101 static void clear_evtchn_to_irq_row(unsigned row) 102 { 103 unsigned col; 104 105 for (col = 0; col < EVTCHN_PER_ROW; col++) 106 evtchn_to_irq[row][col] = -1; 107 } 108 109 static void clear_evtchn_to_irq_all(void) 110 { 111 unsigned row; 112 113 for (row = 0; row < EVTCHN_ROW(xen_evtchn_max_channels()); row++) { 114 if (evtchn_to_irq[row] == NULL) 115 continue; 116 clear_evtchn_to_irq_row(row); 117 } 118 } 119 120 static int set_evtchn_to_irq(evtchn_port_t evtchn, unsigned int irq) 121 { 122 unsigned row; 123 unsigned col; 124 125 if (evtchn >= xen_evtchn_max_channels()) 126 return -EINVAL; 127 128 row = EVTCHN_ROW(evtchn); 129 col = EVTCHN_COL(evtchn); 130 131 if (evtchn_to_irq[row] == NULL) { 132 /* Unallocated irq entries return -1 anyway */ 133 if (irq == -1) 134 return 0; 135 136 evtchn_to_irq[row] = (int *)get_zeroed_page(GFP_KERNEL); 137 if (evtchn_to_irq[row] == NULL) 138 return -ENOMEM; 139 140 clear_evtchn_to_irq_row(row); 141 } 142 143 evtchn_to_irq[row][col] = irq; 144 return 0; 145 } 146 147 int get_evtchn_to_irq(evtchn_port_t evtchn) 148 { 149 if (evtchn >= xen_evtchn_max_channels()) 150 return -1; 151 if (evtchn_to_irq[EVTCHN_ROW(evtchn)] == NULL) 152 return -1; 153 return evtchn_to_irq[EVTCHN_ROW(evtchn)][EVTCHN_COL(evtchn)]; 154 } 155 156 /* Get info for IRQ */ 157 struct irq_info *info_for_irq(unsigned irq) 158 { 159 return irq_get_handler_data(irq); 160 } 161 162 /* Constructors for packed IRQ information. */ 163 static int xen_irq_info_common_setup(struct irq_info *info, 164 unsigned irq, 165 enum xen_irq_type type, 166 evtchn_port_t evtchn, 167 unsigned short cpu) 168 { 169 int ret; 170 171 BUG_ON(info->type != IRQT_UNBOUND && info->type != type); 172 173 info->type = type; 174 info->irq = irq; 175 info->evtchn = evtchn; 176 info->cpu = cpu; 177 178 ret = set_evtchn_to_irq(evtchn, irq); 179 if (ret < 0) 180 return ret; 181 182 irq_clear_status_flags(irq, IRQ_NOREQUEST|IRQ_NOAUTOEN); 183 184 return xen_evtchn_port_setup(info); 185 } 186 187 static int xen_irq_info_evtchn_setup(unsigned irq, 188 evtchn_port_t evtchn) 189 { 190 struct irq_info *info = info_for_irq(irq); 191 192 return xen_irq_info_common_setup(info, irq, IRQT_EVTCHN, evtchn, 0); 193 } 194 195 static int xen_irq_info_ipi_setup(unsigned cpu, 196 unsigned irq, 197 evtchn_port_t evtchn, 198 enum ipi_vector ipi) 199 { 200 struct irq_info *info = info_for_irq(irq); 201 202 info->u.ipi = ipi; 203 204 per_cpu(ipi_to_irq, cpu)[ipi] = irq; 205 206 return xen_irq_info_common_setup(info, irq, IRQT_IPI, evtchn, 0); 207 } 208 209 static int xen_irq_info_virq_setup(unsigned cpu, 210 unsigned irq, 211 evtchn_port_t evtchn, 212 unsigned virq) 213 { 214 struct irq_info *info = info_for_irq(irq); 215 216 info->u.virq = virq; 217 218 per_cpu(virq_to_irq, cpu)[virq] = irq; 219 220 return xen_irq_info_common_setup(info, irq, IRQT_VIRQ, evtchn, 0); 221 } 222 223 static int xen_irq_info_pirq_setup(unsigned irq, 224 evtchn_port_t evtchn, 225 unsigned pirq, 226 unsigned gsi, 227 uint16_t domid, 228 unsigned char flags) 229 { 230 struct irq_info *info = info_for_irq(irq); 231 232 info->u.pirq.pirq = pirq; 233 info->u.pirq.gsi = gsi; 234 info->u.pirq.domid = domid; 235 info->u.pirq.flags = flags; 236 237 return xen_irq_info_common_setup(info, irq, IRQT_PIRQ, evtchn, 0); 238 } 239 240 static void xen_irq_info_cleanup(struct irq_info *info) 241 { 242 set_evtchn_to_irq(info->evtchn, -1); 243 info->evtchn = 0; 244 } 245 246 /* 247 * Accessors for packed IRQ information. 248 */ 249 evtchn_port_t evtchn_from_irq(unsigned irq) 250 { 251 if (WARN(irq >= nr_irqs, "Invalid irq %d!\n", irq)) 252 return 0; 253 254 return info_for_irq(irq)->evtchn; 255 } 256 257 unsigned int irq_from_evtchn(evtchn_port_t evtchn) 258 { 259 return get_evtchn_to_irq(evtchn); 260 } 261 EXPORT_SYMBOL_GPL(irq_from_evtchn); 262 263 int irq_from_virq(unsigned int cpu, unsigned int virq) 264 { 265 return per_cpu(virq_to_irq, cpu)[virq]; 266 } 267 268 static enum ipi_vector ipi_from_irq(unsigned irq) 269 { 270 struct irq_info *info = info_for_irq(irq); 271 272 BUG_ON(info == NULL); 273 BUG_ON(info->type != IRQT_IPI); 274 275 return info->u.ipi; 276 } 277 278 static unsigned virq_from_irq(unsigned irq) 279 { 280 struct irq_info *info = info_for_irq(irq); 281 282 BUG_ON(info == NULL); 283 BUG_ON(info->type != IRQT_VIRQ); 284 285 return info->u.virq; 286 } 287 288 static unsigned pirq_from_irq(unsigned irq) 289 { 290 struct irq_info *info = info_for_irq(irq); 291 292 BUG_ON(info == NULL); 293 BUG_ON(info->type != IRQT_PIRQ); 294 295 return info->u.pirq.pirq; 296 } 297 298 static enum xen_irq_type type_from_irq(unsigned irq) 299 { 300 return info_for_irq(irq)->type; 301 } 302 303 unsigned cpu_from_irq(unsigned irq) 304 { 305 return info_for_irq(irq)->cpu; 306 } 307 308 unsigned int cpu_from_evtchn(evtchn_port_t evtchn) 309 { 310 int irq = get_evtchn_to_irq(evtchn); 311 unsigned ret = 0; 312 313 if (irq != -1) 314 ret = cpu_from_irq(irq); 315 316 return ret; 317 } 318 319 #ifdef CONFIG_X86 320 static bool pirq_check_eoi_map(unsigned irq) 321 { 322 return test_bit(pirq_from_irq(irq), pirq_eoi_map); 323 } 324 #endif 325 326 static bool pirq_needs_eoi_flag(unsigned irq) 327 { 328 struct irq_info *info = info_for_irq(irq); 329 BUG_ON(info->type != IRQT_PIRQ); 330 331 return info->u.pirq.flags & PIRQ_NEEDS_EOI; 332 } 333 334 static void bind_evtchn_to_cpu(evtchn_port_t evtchn, unsigned int cpu) 335 { 336 int irq = get_evtchn_to_irq(evtchn); 337 struct irq_info *info = info_for_irq(irq); 338 339 BUG_ON(irq == -1); 340 #ifdef CONFIG_SMP 341 cpumask_copy(irq_get_affinity_mask(irq), cpumask_of(cpu)); 342 #endif 343 xen_evtchn_port_bind_to_cpu(info, cpu); 344 345 info->cpu = cpu; 346 } 347 348 /** 349 * notify_remote_via_irq - send event to remote end of event channel via irq 350 * @irq: irq of event channel to send event to 351 * 352 * Unlike notify_remote_via_evtchn(), this is safe to use across 353 * save/restore. Notifications on a broken connection are silently 354 * dropped. 355 */ 356 void notify_remote_via_irq(int irq) 357 { 358 evtchn_port_t evtchn = evtchn_from_irq(irq); 359 360 if (VALID_EVTCHN(evtchn)) 361 notify_remote_via_evtchn(evtchn); 362 } 363 EXPORT_SYMBOL_GPL(notify_remote_via_irq); 364 365 static void xen_irq_init(unsigned irq) 366 { 367 struct irq_info *info; 368 #ifdef CONFIG_SMP 369 /* By default all event channels notify CPU#0. */ 370 cpumask_copy(irq_get_affinity_mask(irq), cpumask_of(0)); 371 #endif 372 373 info = kzalloc(sizeof(*info), GFP_KERNEL); 374 if (info == NULL) 375 panic("Unable to allocate metadata for IRQ%d\n", irq); 376 377 info->type = IRQT_UNBOUND; 378 info->refcnt = -1; 379 380 irq_set_handler_data(irq, info); 381 382 list_add_tail(&info->list, &xen_irq_list_head); 383 } 384 385 static int __must_check xen_allocate_irqs_dynamic(int nvec) 386 { 387 int i, irq = irq_alloc_descs(-1, 0, nvec, -1); 388 389 if (irq >= 0) { 390 for (i = 0; i < nvec; i++) 391 xen_irq_init(irq + i); 392 } 393 394 return irq; 395 } 396 397 static inline int __must_check xen_allocate_irq_dynamic(void) 398 { 399 400 return xen_allocate_irqs_dynamic(1); 401 } 402 403 static int __must_check xen_allocate_irq_gsi(unsigned gsi) 404 { 405 int irq; 406 407 /* 408 * A PV guest has no concept of a GSI (since it has no ACPI 409 * nor access to/knowledge of the physical APICs). Therefore 410 * all IRQs are dynamically allocated from the entire IRQ 411 * space. 412 */ 413 if (xen_pv_domain() && !xen_initial_domain()) 414 return xen_allocate_irq_dynamic(); 415 416 /* Legacy IRQ descriptors are already allocated by the arch. */ 417 if (gsi < nr_legacy_irqs()) 418 irq = gsi; 419 else 420 irq = irq_alloc_desc_at(gsi, -1); 421 422 xen_irq_init(irq); 423 424 return irq; 425 } 426 427 static void xen_free_irq(unsigned irq) 428 { 429 struct irq_info *info = irq_get_handler_data(irq); 430 431 if (WARN_ON(!info)) 432 return; 433 434 list_del(&info->list); 435 436 irq_set_handler_data(irq, NULL); 437 438 WARN_ON(info->refcnt > 0); 439 440 kfree(info); 441 442 /* Legacy IRQ descriptors are managed by the arch. */ 443 if (irq < nr_legacy_irqs()) 444 return; 445 446 irq_free_desc(irq); 447 } 448 449 static void xen_evtchn_close(evtchn_port_t port) 450 { 451 struct evtchn_close close; 452 453 close.port = port; 454 if (HYPERVISOR_event_channel_op(EVTCHNOP_close, &close) != 0) 455 BUG(); 456 } 457 458 static void pirq_query_unmask(int irq) 459 { 460 struct physdev_irq_status_query irq_status; 461 struct irq_info *info = info_for_irq(irq); 462 463 BUG_ON(info->type != IRQT_PIRQ); 464 465 irq_status.irq = pirq_from_irq(irq); 466 if (HYPERVISOR_physdev_op(PHYSDEVOP_irq_status_query, &irq_status)) 467 irq_status.flags = 0; 468 469 info->u.pirq.flags &= ~PIRQ_NEEDS_EOI; 470 if (irq_status.flags & XENIRQSTAT_needs_eoi) 471 info->u.pirq.flags |= PIRQ_NEEDS_EOI; 472 } 473 474 static void eoi_pirq(struct irq_data *data) 475 { 476 evtchn_port_t evtchn = evtchn_from_irq(data->irq); 477 struct physdev_eoi eoi = { .irq = pirq_from_irq(data->irq) }; 478 int rc = 0; 479 480 if (!VALID_EVTCHN(evtchn)) 481 return; 482 483 if (unlikely(irqd_is_setaffinity_pending(data)) && 484 likely(!irqd_irq_disabled(data))) { 485 int masked = test_and_set_mask(evtchn); 486 487 clear_evtchn(evtchn); 488 489 irq_move_masked_irq(data); 490 491 if (!masked) 492 unmask_evtchn(evtchn); 493 } else 494 clear_evtchn(evtchn); 495 496 if (pirq_needs_eoi(data->irq)) { 497 rc = HYPERVISOR_physdev_op(PHYSDEVOP_eoi, &eoi); 498 WARN_ON(rc); 499 } 500 } 501 502 static void mask_ack_pirq(struct irq_data *data) 503 { 504 disable_dynirq(data); 505 eoi_pirq(data); 506 } 507 508 static unsigned int __startup_pirq(unsigned int irq) 509 { 510 struct evtchn_bind_pirq bind_pirq; 511 struct irq_info *info = info_for_irq(irq); 512 evtchn_port_t evtchn = evtchn_from_irq(irq); 513 int rc; 514 515 BUG_ON(info->type != IRQT_PIRQ); 516 517 if (VALID_EVTCHN(evtchn)) 518 goto out; 519 520 bind_pirq.pirq = pirq_from_irq(irq); 521 /* NB. We are happy to share unless we are probing. */ 522 bind_pirq.flags = info->u.pirq.flags & PIRQ_SHAREABLE ? 523 BIND_PIRQ__WILL_SHARE : 0; 524 rc = HYPERVISOR_event_channel_op(EVTCHNOP_bind_pirq, &bind_pirq); 525 if (rc != 0) { 526 pr_warn("Failed to obtain physical IRQ %d\n", irq); 527 return 0; 528 } 529 evtchn = bind_pirq.port; 530 531 pirq_query_unmask(irq); 532 533 rc = set_evtchn_to_irq(evtchn, irq); 534 if (rc) 535 goto err; 536 537 info->evtchn = evtchn; 538 bind_evtchn_to_cpu(evtchn, 0); 539 540 rc = xen_evtchn_port_setup(info); 541 if (rc) 542 goto err; 543 544 out: 545 unmask_evtchn(evtchn); 546 eoi_pirq(irq_get_irq_data(irq)); 547 548 return 0; 549 550 err: 551 pr_err("irq%d: Failed to set port to irq mapping (%d)\n", irq, rc); 552 xen_evtchn_close(evtchn); 553 return 0; 554 } 555 556 static unsigned int startup_pirq(struct irq_data *data) 557 { 558 return __startup_pirq(data->irq); 559 } 560 561 static void shutdown_pirq(struct irq_data *data) 562 { 563 unsigned int irq = data->irq; 564 struct irq_info *info = info_for_irq(irq); 565 evtchn_port_t evtchn = evtchn_from_irq(irq); 566 567 BUG_ON(info->type != IRQT_PIRQ); 568 569 if (!VALID_EVTCHN(evtchn)) 570 return; 571 572 mask_evtchn(evtchn); 573 xen_evtchn_close(evtchn); 574 xen_irq_info_cleanup(info); 575 } 576 577 static void enable_pirq(struct irq_data *data) 578 { 579 enable_dynirq(data); 580 } 581 582 static void disable_pirq(struct irq_data *data) 583 { 584 disable_dynirq(data); 585 } 586 587 int xen_irq_from_gsi(unsigned gsi) 588 { 589 struct irq_info *info; 590 591 list_for_each_entry(info, &xen_irq_list_head, list) { 592 if (info->type != IRQT_PIRQ) 593 continue; 594 595 if (info->u.pirq.gsi == gsi) 596 return info->irq; 597 } 598 599 return -1; 600 } 601 EXPORT_SYMBOL_GPL(xen_irq_from_gsi); 602 603 static void __unbind_from_irq(unsigned int irq) 604 { 605 evtchn_port_t evtchn = evtchn_from_irq(irq); 606 struct irq_info *info = irq_get_handler_data(irq); 607 608 if (info->refcnt > 0) { 609 info->refcnt--; 610 if (info->refcnt != 0) 611 return; 612 } 613 614 if (VALID_EVTCHN(evtchn)) { 615 unsigned int cpu = cpu_from_irq(irq); 616 617 xen_evtchn_close(evtchn); 618 619 switch (type_from_irq(irq)) { 620 case IRQT_VIRQ: 621 per_cpu(virq_to_irq, cpu)[virq_from_irq(irq)] = -1; 622 break; 623 case IRQT_IPI: 624 per_cpu(ipi_to_irq, cpu)[ipi_from_irq(irq)] = -1; 625 break; 626 default: 627 break; 628 } 629 630 xen_irq_info_cleanup(info); 631 } 632 633 xen_free_irq(irq); 634 } 635 636 /* 637 * Do not make any assumptions regarding the relationship between the 638 * IRQ number returned here and the Xen pirq argument. 639 * 640 * Note: We don't assign an event channel until the irq actually started 641 * up. Return an existing irq if we've already got one for the gsi. 642 * 643 * Shareable implies level triggered, not shareable implies edge 644 * triggered here. 645 */ 646 int xen_bind_pirq_gsi_to_irq(unsigned gsi, 647 unsigned pirq, int shareable, char *name) 648 { 649 int irq = -1; 650 struct physdev_irq irq_op; 651 int ret; 652 653 mutex_lock(&irq_mapping_update_lock); 654 655 irq = xen_irq_from_gsi(gsi); 656 if (irq != -1) { 657 pr_info("%s: returning irq %d for gsi %u\n", 658 __func__, irq, gsi); 659 goto out; 660 } 661 662 irq = xen_allocate_irq_gsi(gsi); 663 if (irq < 0) 664 goto out; 665 666 irq_op.irq = irq; 667 irq_op.vector = 0; 668 669 /* Only the privileged domain can do this. For non-priv, the pcifront 670 * driver provides a PCI bus that does the call to do exactly 671 * this in the priv domain. */ 672 if (xen_initial_domain() && 673 HYPERVISOR_physdev_op(PHYSDEVOP_alloc_irq_vector, &irq_op)) { 674 xen_free_irq(irq); 675 irq = -ENOSPC; 676 goto out; 677 } 678 679 ret = xen_irq_info_pirq_setup(irq, 0, pirq, gsi, DOMID_SELF, 680 shareable ? PIRQ_SHAREABLE : 0); 681 if (ret < 0) { 682 __unbind_from_irq(irq); 683 irq = ret; 684 goto out; 685 } 686 687 pirq_query_unmask(irq); 688 /* We try to use the handler with the appropriate semantic for the 689 * type of interrupt: if the interrupt is an edge triggered 690 * interrupt we use handle_edge_irq. 691 * 692 * On the other hand if the interrupt is level triggered we use 693 * handle_fasteoi_irq like the native code does for this kind of 694 * interrupts. 695 * 696 * Depending on the Xen version, pirq_needs_eoi might return true 697 * not only for level triggered interrupts but for edge triggered 698 * interrupts too. In any case Xen always honors the eoi mechanism, 699 * not injecting any more pirqs of the same kind if the first one 700 * hasn't received an eoi yet. Therefore using the fasteoi handler 701 * is the right choice either way. 702 */ 703 if (shareable) 704 irq_set_chip_and_handler_name(irq, &xen_pirq_chip, 705 handle_fasteoi_irq, name); 706 else 707 irq_set_chip_and_handler_name(irq, &xen_pirq_chip, 708 handle_edge_irq, name); 709 710 out: 711 mutex_unlock(&irq_mapping_update_lock); 712 713 return irq; 714 } 715 716 #ifdef CONFIG_PCI_MSI 717 int xen_allocate_pirq_msi(struct pci_dev *dev, struct msi_desc *msidesc) 718 { 719 int rc; 720 struct physdev_get_free_pirq op_get_free_pirq; 721 722 op_get_free_pirq.type = MAP_PIRQ_TYPE_MSI; 723 rc = HYPERVISOR_physdev_op(PHYSDEVOP_get_free_pirq, &op_get_free_pirq); 724 725 WARN_ONCE(rc == -ENOSYS, 726 "hypervisor does not support the PHYSDEVOP_get_free_pirq interface\n"); 727 728 return rc ? -1 : op_get_free_pirq.pirq; 729 } 730 731 int xen_bind_pirq_msi_to_irq(struct pci_dev *dev, struct msi_desc *msidesc, 732 int pirq, int nvec, const char *name, domid_t domid) 733 { 734 int i, irq, ret; 735 736 mutex_lock(&irq_mapping_update_lock); 737 738 irq = xen_allocate_irqs_dynamic(nvec); 739 if (irq < 0) 740 goto out; 741 742 for (i = 0; i < nvec; i++) { 743 irq_set_chip_and_handler_name(irq + i, &xen_pirq_chip, handle_edge_irq, name); 744 745 ret = xen_irq_info_pirq_setup(irq + i, 0, pirq + i, 0, domid, 746 i == 0 ? 0 : PIRQ_MSI_GROUP); 747 if (ret < 0) 748 goto error_irq; 749 } 750 751 ret = irq_set_msi_desc(irq, msidesc); 752 if (ret < 0) 753 goto error_irq; 754 out: 755 mutex_unlock(&irq_mapping_update_lock); 756 return irq; 757 error_irq: 758 while (nvec--) 759 __unbind_from_irq(irq + nvec); 760 mutex_unlock(&irq_mapping_update_lock); 761 return ret; 762 } 763 #endif 764 765 int xen_destroy_irq(int irq) 766 { 767 struct physdev_unmap_pirq unmap_irq; 768 struct irq_info *info = info_for_irq(irq); 769 int rc = -ENOENT; 770 771 mutex_lock(&irq_mapping_update_lock); 772 773 /* 774 * If trying to remove a vector in a MSI group different 775 * than the first one skip the PIRQ unmap unless this vector 776 * is the first one in the group. 777 */ 778 if (xen_initial_domain() && !(info->u.pirq.flags & PIRQ_MSI_GROUP)) { 779 unmap_irq.pirq = info->u.pirq.pirq; 780 unmap_irq.domid = info->u.pirq.domid; 781 rc = HYPERVISOR_physdev_op(PHYSDEVOP_unmap_pirq, &unmap_irq); 782 /* If another domain quits without making the pci_disable_msix 783 * call, the Xen hypervisor takes care of freeing the PIRQs 784 * (free_domain_pirqs). 785 */ 786 if ((rc == -ESRCH && info->u.pirq.domid != DOMID_SELF)) 787 pr_info("domain %d does not have %d anymore\n", 788 info->u.pirq.domid, info->u.pirq.pirq); 789 else if (rc) { 790 pr_warn("unmap irq failed %d\n", rc); 791 goto out; 792 } 793 } 794 795 xen_free_irq(irq); 796 797 out: 798 mutex_unlock(&irq_mapping_update_lock); 799 return rc; 800 } 801 802 int xen_irq_from_pirq(unsigned pirq) 803 { 804 int irq; 805 806 struct irq_info *info; 807 808 mutex_lock(&irq_mapping_update_lock); 809 810 list_for_each_entry(info, &xen_irq_list_head, list) { 811 if (info->type != IRQT_PIRQ) 812 continue; 813 irq = info->irq; 814 if (info->u.pirq.pirq == pirq) 815 goto out; 816 } 817 irq = -1; 818 out: 819 mutex_unlock(&irq_mapping_update_lock); 820 821 return irq; 822 } 823 824 825 int xen_pirq_from_irq(unsigned irq) 826 { 827 return pirq_from_irq(irq); 828 } 829 EXPORT_SYMBOL_GPL(xen_pirq_from_irq); 830 831 int bind_evtchn_to_irq(evtchn_port_t evtchn) 832 { 833 int irq; 834 int ret; 835 836 if (evtchn >= xen_evtchn_max_channels()) 837 return -ENOMEM; 838 839 mutex_lock(&irq_mapping_update_lock); 840 841 irq = get_evtchn_to_irq(evtchn); 842 843 if (irq == -1) { 844 irq = xen_allocate_irq_dynamic(); 845 if (irq < 0) 846 goto out; 847 848 irq_set_chip_and_handler_name(irq, &xen_dynamic_chip, 849 handle_edge_irq, "event"); 850 851 ret = xen_irq_info_evtchn_setup(irq, evtchn); 852 if (ret < 0) { 853 __unbind_from_irq(irq); 854 irq = ret; 855 goto out; 856 } 857 /* New interdomain events are bound to VCPU 0. */ 858 bind_evtchn_to_cpu(evtchn, 0); 859 } else { 860 struct irq_info *info = info_for_irq(irq); 861 WARN_ON(info == NULL || info->type != IRQT_EVTCHN); 862 } 863 864 out: 865 mutex_unlock(&irq_mapping_update_lock); 866 867 return irq; 868 } 869 EXPORT_SYMBOL_GPL(bind_evtchn_to_irq); 870 871 static int bind_ipi_to_irq(unsigned int ipi, unsigned int cpu) 872 { 873 struct evtchn_bind_ipi bind_ipi; 874 evtchn_port_t evtchn; 875 int ret, irq; 876 877 mutex_lock(&irq_mapping_update_lock); 878 879 irq = per_cpu(ipi_to_irq, cpu)[ipi]; 880 881 if (irq == -1) { 882 irq = xen_allocate_irq_dynamic(); 883 if (irq < 0) 884 goto out; 885 886 irq_set_chip_and_handler_name(irq, &xen_percpu_chip, 887 handle_percpu_irq, "ipi"); 888 889 bind_ipi.vcpu = xen_vcpu_nr(cpu); 890 if (HYPERVISOR_event_channel_op(EVTCHNOP_bind_ipi, 891 &bind_ipi) != 0) 892 BUG(); 893 evtchn = bind_ipi.port; 894 895 ret = xen_irq_info_ipi_setup(cpu, irq, evtchn, ipi); 896 if (ret < 0) { 897 __unbind_from_irq(irq); 898 irq = ret; 899 goto out; 900 } 901 bind_evtchn_to_cpu(evtchn, cpu); 902 } else { 903 struct irq_info *info = info_for_irq(irq); 904 WARN_ON(info == NULL || info->type != IRQT_IPI); 905 } 906 907 out: 908 mutex_unlock(&irq_mapping_update_lock); 909 return irq; 910 } 911 912 int bind_interdomain_evtchn_to_irq(unsigned int remote_domain, 913 evtchn_port_t remote_port) 914 { 915 struct evtchn_bind_interdomain bind_interdomain; 916 int err; 917 918 bind_interdomain.remote_dom = remote_domain; 919 bind_interdomain.remote_port = remote_port; 920 921 err = HYPERVISOR_event_channel_op(EVTCHNOP_bind_interdomain, 922 &bind_interdomain); 923 924 return err ? : bind_evtchn_to_irq(bind_interdomain.local_port); 925 } 926 EXPORT_SYMBOL_GPL(bind_interdomain_evtchn_to_irq); 927 928 static int find_virq(unsigned int virq, unsigned int cpu, evtchn_port_t *evtchn) 929 { 930 struct evtchn_status status; 931 evtchn_port_t port; 932 int rc = -ENOENT; 933 934 memset(&status, 0, sizeof(status)); 935 for (port = 0; port < xen_evtchn_max_channels(); port++) { 936 status.dom = DOMID_SELF; 937 status.port = port; 938 rc = HYPERVISOR_event_channel_op(EVTCHNOP_status, &status); 939 if (rc < 0) 940 continue; 941 if (status.status != EVTCHNSTAT_virq) 942 continue; 943 if (status.u.virq == virq && status.vcpu == xen_vcpu_nr(cpu)) { 944 *evtchn = port; 945 break; 946 } 947 } 948 return rc; 949 } 950 951 /** 952 * xen_evtchn_nr_channels - number of usable event channel ports 953 * 954 * This may be less than the maximum supported by the current 955 * hypervisor ABI. Use xen_evtchn_max_channels() for the maximum 956 * supported. 957 */ 958 unsigned xen_evtchn_nr_channels(void) 959 { 960 return evtchn_ops->nr_channels(); 961 } 962 EXPORT_SYMBOL_GPL(xen_evtchn_nr_channels); 963 964 int bind_virq_to_irq(unsigned int virq, unsigned int cpu, bool percpu) 965 { 966 struct evtchn_bind_virq bind_virq; 967 evtchn_port_t evtchn = 0; 968 int irq, ret; 969 970 mutex_lock(&irq_mapping_update_lock); 971 972 irq = per_cpu(virq_to_irq, cpu)[virq]; 973 974 if (irq == -1) { 975 irq = xen_allocate_irq_dynamic(); 976 if (irq < 0) 977 goto out; 978 979 if (percpu) 980 irq_set_chip_and_handler_name(irq, &xen_percpu_chip, 981 handle_percpu_irq, "virq"); 982 else 983 irq_set_chip_and_handler_name(irq, &xen_dynamic_chip, 984 handle_edge_irq, "virq"); 985 986 bind_virq.virq = virq; 987 bind_virq.vcpu = xen_vcpu_nr(cpu); 988 ret = HYPERVISOR_event_channel_op(EVTCHNOP_bind_virq, 989 &bind_virq); 990 if (ret == 0) 991 evtchn = bind_virq.port; 992 else { 993 if (ret == -EEXIST) 994 ret = find_virq(virq, cpu, &evtchn); 995 BUG_ON(ret < 0); 996 } 997 998 ret = xen_irq_info_virq_setup(cpu, irq, evtchn, virq); 999 if (ret < 0) { 1000 __unbind_from_irq(irq); 1001 irq = ret; 1002 goto out; 1003 } 1004 1005 bind_evtchn_to_cpu(evtchn, cpu); 1006 } else { 1007 struct irq_info *info = info_for_irq(irq); 1008 WARN_ON(info == NULL || info->type != IRQT_VIRQ); 1009 } 1010 1011 out: 1012 mutex_unlock(&irq_mapping_update_lock); 1013 1014 return irq; 1015 } 1016 1017 static void unbind_from_irq(unsigned int irq) 1018 { 1019 mutex_lock(&irq_mapping_update_lock); 1020 __unbind_from_irq(irq); 1021 mutex_unlock(&irq_mapping_update_lock); 1022 } 1023 1024 int bind_evtchn_to_irqhandler(evtchn_port_t evtchn, 1025 irq_handler_t handler, 1026 unsigned long irqflags, 1027 const char *devname, void *dev_id) 1028 { 1029 int irq, retval; 1030 1031 irq = bind_evtchn_to_irq(evtchn); 1032 if (irq < 0) 1033 return irq; 1034 retval = request_irq(irq, handler, irqflags, devname, dev_id); 1035 if (retval != 0) { 1036 unbind_from_irq(irq); 1037 return retval; 1038 } 1039 1040 return irq; 1041 } 1042 EXPORT_SYMBOL_GPL(bind_evtchn_to_irqhandler); 1043 1044 int bind_interdomain_evtchn_to_irqhandler(unsigned int remote_domain, 1045 evtchn_port_t remote_port, 1046 irq_handler_t handler, 1047 unsigned long irqflags, 1048 const char *devname, 1049 void *dev_id) 1050 { 1051 int irq, retval; 1052 1053 irq = bind_interdomain_evtchn_to_irq(remote_domain, remote_port); 1054 if (irq < 0) 1055 return irq; 1056 1057 retval = request_irq(irq, handler, irqflags, devname, dev_id); 1058 if (retval != 0) { 1059 unbind_from_irq(irq); 1060 return retval; 1061 } 1062 1063 return irq; 1064 } 1065 EXPORT_SYMBOL_GPL(bind_interdomain_evtchn_to_irqhandler); 1066 1067 int bind_virq_to_irqhandler(unsigned int virq, unsigned int cpu, 1068 irq_handler_t handler, 1069 unsigned long irqflags, const char *devname, void *dev_id) 1070 { 1071 int irq, retval; 1072 1073 irq = bind_virq_to_irq(virq, cpu, irqflags & IRQF_PERCPU); 1074 if (irq < 0) 1075 return irq; 1076 retval = request_irq(irq, handler, irqflags, devname, dev_id); 1077 if (retval != 0) { 1078 unbind_from_irq(irq); 1079 return retval; 1080 } 1081 1082 return irq; 1083 } 1084 EXPORT_SYMBOL_GPL(bind_virq_to_irqhandler); 1085 1086 int bind_ipi_to_irqhandler(enum ipi_vector ipi, 1087 unsigned int cpu, 1088 irq_handler_t handler, 1089 unsigned long irqflags, 1090 const char *devname, 1091 void *dev_id) 1092 { 1093 int irq, retval; 1094 1095 irq = bind_ipi_to_irq(ipi, cpu); 1096 if (irq < 0) 1097 return irq; 1098 1099 irqflags |= IRQF_NO_SUSPEND | IRQF_FORCE_RESUME | IRQF_EARLY_RESUME; 1100 retval = request_irq(irq, handler, irqflags, devname, dev_id); 1101 if (retval != 0) { 1102 unbind_from_irq(irq); 1103 return retval; 1104 } 1105 1106 return irq; 1107 } 1108 1109 void unbind_from_irqhandler(unsigned int irq, void *dev_id) 1110 { 1111 struct irq_info *info = irq_get_handler_data(irq); 1112 1113 if (WARN_ON(!info)) 1114 return; 1115 free_irq(irq, dev_id); 1116 unbind_from_irq(irq); 1117 } 1118 EXPORT_SYMBOL_GPL(unbind_from_irqhandler); 1119 1120 /** 1121 * xen_set_irq_priority() - set an event channel priority. 1122 * @irq:irq bound to an event channel. 1123 * @priority: priority between XEN_IRQ_PRIORITY_MAX and XEN_IRQ_PRIORITY_MIN. 1124 */ 1125 int xen_set_irq_priority(unsigned irq, unsigned priority) 1126 { 1127 struct evtchn_set_priority set_priority; 1128 1129 set_priority.port = evtchn_from_irq(irq); 1130 set_priority.priority = priority; 1131 1132 return HYPERVISOR_event_channel_op(EVTCHNOP_set_priority, 1133 &set_priority); 1134 } 1135 EXPORT_SYMBOL_GPL(xen_set_irq_priority); 1136 1137 int evtchn_make_refcounted(evtchn_port_t evtchn) 1138 { 1139 int irq = get_evtchn_to_irq(evtchn); 1140 struct irq_info *info; 1141 1142 if (irq == -1) 1143 return -ENOENT; 1144 1145 info = irq_get_handler_data(irq); 1146 1147 if (!info) 1148 return -ENOENT; 1149 1150 WARN_ON(info->refcnt != -1); 1151 1152 info->refcnt = 1; 1153 1154 return 0; 1155 } 1156 EXPORT_SYMBOL_GPL(evtchn_make_refcounted); 1157 1158 int evtchn_get(evtchn_port_t evtchn) 1159 { 1160 int irq; 1161 struct irq_info *info; 1162 int err = -ENOENT; 1163 1164 if (evtchn >= xen_evtchn_max_channels()) 1165 return -EINVAL; 1166 1167 mutex_lock(&irq_mapping_update_lock); 1168 1169 irq = get_evtchn_to_irq(evtchn); 1170 if (irq == -1) 1171 goto done; 1172 1173 info = irq_get_handler_data(irq); 1174 1175 if (!info) 1176 goto done; 1177 1178 err = -EINVAL; 1179 if (info->refcnt <= 0) 1180 goto done; 1181 1182 info->refcnt++; 1183 err = 0; 1184 done: 1185 mutex_unlock(&irq_mapping_update_lock); 1186 1187 return err; 1188 } 1189 EXPORT_SYMBOL_GPL(evtchn_get); 1190 1191 void evtchn_put(evtchn_port_t evtchn) 1192 { 1193 int irq = get_evtchn_to_irq(evtchn); 1194 if (WARN_ON(irq == -1)) 1195 return; 1196 unbind_from_irq(irq); 1197 } 1198 EXPORT_SYMBOL_GPL(evtchn_put); 1199 1200 void xen_send_IPI_one(unsigned int cpu, enum ipi_vector vector) 1201 { 1202 int irq; 1203 1204 #ifdef CONFIG_X86 1205 if (unlikely(vector == XEN_NMI_VECTOR)) { 1206 int rc = HYPERVISOR_vcpu_op(VCPUOP_send_nmi, xen_vcpu_nr(cpu), 1207 NULL); 1208 if (rc < 0) 1209 printk(KERN_WARNING "Sending nmi to CPU%d failed (rc:%d)\n", cpu, rc); 1210 return; 1211 } 1212 #endif 1213 irq = per_cpu(ipi_to_irq, cpu)[vector]; 1214 BUG_ON(irq < 0); 1215 notify_remote_via_irq(irq); 1216 } 1217 1218 static void __xen_evtchn_do_upcall(void) 1219 { 1220 struct vcpu_info *vcpu_info = __this_cpu_read(xen_vcpu); 1221 int cpu = smp_processor_id(); 1222 1223 do { 1224 vcpu_info->evtchn_upcall_pending = 0; 1225 1226 xen_evtchn_handle_events(cpu); 1227 1228 BUG_ON(!irqs_disabled()); 1229 1230 virt_rmb(); /* Hypervisor can set upcall pending. */ 1231 1232 } while (vcpu_info->evtchn_upcall_pending); 1233 } 1234 1235 void xen_evtchn_do_upcall(struct pt_regs *regs) 1236 { 1237 struct pt_regs *old_regs = set_irq_regs(regs); 1238 1239 irq_enter(); 1240 1241 __xen_evtchn_do_upcall(); 1242 1243 irq_exit(); 1244 set_irq_regs(old_regs); 1245 } 1246 1247 void xen_hvm_evtchn_do_upcall(void) 1248 { 1249 __xen_evtchn_do_upcall(); 1250 } 1251 EXPORT_SYMBOL_GPL(xen_hvm_evtchn_do_upcall); 1252 1253 /* Rebind a new event channel to an existing irq. */ 1254 void rebind_evtchn_irq(evtchn_port_t evtchn, int irq) 1255 { 1256 struct irq_info *info = info_for_irq(irq); 1257 1258 if (WARN_ON(!info)) 1259 return; 1260 1261 /* Make sure the irq is masked, since the new event channel 1262 will also be masked. */ 1263 disable_irq(irq); 1264 1265 mutex_lock(&irq_mapping_update_lock); 1266 1267 /* After resume the irq<->evtchn mappings are all cleared out */ 1268 BUG_ON(get_evtchn_to_irq(evtchn) != -1); 1269 /* Expect irq to have been bound before, 1270 so there should be a proper type */ 1271 BUG_ON(info->type == IRQT_UNBOUND); 1272 1273 (void)xen_irq_info_evtchn_setup(irq, evtchn); 1274 1275 mutex_unlock(&irq_mapping_update_lock); 1276 1277 bind_evtchn_to_cpu(evtchn, info->cpu); 1278 /* This will be deferred until interrupt is processed */ 1279 irq_set_affinity(irq, cpumask_of(info->cpu)); 1280 1281 /* Unmask the event channel. */ 1282 enable_irq(irq); 1283 } 1284 1285 /* Rebind an evtchn so that it gets delivered to a specific cpu */ 1286 static int xen_rebind_evtchn_to_cpu(evtchn_port_t evtchn, unsigned int tcpu) 1287 { 1288 struct evtchn_bind_vcpu bind_vcpu; 1289 int masked; 1290 1291 if (!VALID_EVTCHN(evtchn)) 1292 return -1; 1293 1294 if (!xen_support_evtchn_rebind()) 1295 return -1; 1296 1297 /* Send future instances of this interrupt to other vcpu. */ 1298 bind_vcpu.port = evtchn; 1299 bind_vcpu.vcpu = xen_vcpu_nr(tcpu); 1300 1301 /* 1302 * Mask the event while changing the VCPU binding to prevent 1303 * it being delivered on an unexpected VCPU. 1304 */ 1305 masked = test_and_set_mask(evtchn); 1306 1307 /* 1308 * If this fails, it usually just indicates that we're dealing with a 1309 * virq or IPI channel, which don't actually need to be rebound. Ignore 1310 * it, but don't do the xenlinux-level rebind in that case. 1311 */ 1312 if (HYPERVISOR_event_channel_op(EVTCHNOP_bind_vcpu, &bind_vcpu) >= 0) 1313 bind_evtchn_to_cpu(evtchn, tcpu); 1314 1315 if (!masked) 1316 unmask_evtchn(evtchn); 1317 1318 return 0; 1319 } 1320 1321 static int set_affinity_irq(struct irq_data *data, const struct cpumask *dest, 1322 bool force) 1323 { 1324 unsigned tcpu = cpumask_first_and(dest, cpu_online_mask); 1325 int ret = xen_rebind_evtchn_to_cpu(evtchn_from_irq(data->irq), tcpu); 1326 1327 if (!ret) 1328 irq_data_update_effective_affinity(data, cpumask_of(tcpu)); 1329 1330 return ret; 1331 } 1332 1333 /* To be called with desc->lock held. */ 1334 int xen_set_affinity_evtchn(struct irq_desc *desc, unsigned int tcpu) 1335 { 1336 struct irq_data *d = irq_desc_get_irq_data(desc); 1337 1338 return set_affinity_irq(d, cpumask_of(tcpu), false); 1339 } 1340 EXPORT_SYMBOL_GPL(xen_set_affinity_evtchn); 1341 1342 static void enable_dynirq(struct irq_data *data) 1343 { 1344 evtchn_port_t evtchn = evtchn_from_irq(data->irq); 1345 1346 if (VALID_EVTCHN(evtchn)) 1347 unmask_evtchn(evtchn); 1348 } 1349 1350 static void disable_dynirq(struct irq_data *data) 1351 { 1352 evtchn_port_t evtchn = evtchn_from_irq(data->irq); 1353 1354 if (VALID_EVTCHN(evtchn)) 1355 mask_evtchn(evtchn); 1356 } 1357 1358 static void ack_dynirq(struct irq_data *data) 1359 { 1360 evtchn_port_t evtchn = evtchn_from_irq(data->irq); 1361 1362 if (!VALID_EVTCHN(evtchn)) 1363 return; 1364 1365 if (unlikely(irqd_is_setaffinity_pending(data)) && 1366 likely(!irqd_irq_disabled(data))) { 1367 int masked = test_and_set_mask(evtchn); 1368 1369 clear_evtchn(evtchn); 1370 1371 irq_move_masked_irq(data); 1372 1373 if (!masked) 1374 unmask_evtchn(evtchn); 1375 } else 1376 clear_evtchn(evtchn); 1377 } 1378 1379 static void mask_ack_dynirq(struct irq_data *data) 1380 { 1381 disable_dynirq(data); 1382 ack_dynirq(data); 1383 } 1384 1385 static int retrigger_dynirq(struct irq_data *data) 1386 { 1387 evtchn_port_t evtchn = evtchn_from_irq(data->irq); 1388 int masked; 1389 1390 if (!VALID_EVTCHN(evtchn)) 1391 return 0; 1392 1393 masked = test_and_set_mask(evtchn); 1394 set_evtchn(evtchn); 1395 if (!masked) 1396 unmask_evtchn(evtchn); 1397 1398 return 1; 1399 } 1400 1401 static void restore_pirqs(void) 1402 { 1403 int pirq, rc, irq, gsi; 1404 struct physdev_map_pirq map_irq; 1405 struct irq_info *info; 1406 1407 list_for_each_entry(info, &xen_irq_list_head, list) { 1408 if (info->type != IRQT_PIRQ) 1409 continue; 1410 1411 pirq = info->u.pirq.pirq; 1412 gsi = info->u.pirq.gsi; 1413 irq = info->irq; 1414 1415 /* save/restore of PT devices doesn't work, so at this point the 1416 * only devices present are GSI based emulated devices */ 1417 if (!gsi) 1418 continue; 1419 1420 map_irq.domid = DOMID_SELF; 1421 map_irq.type = MAP_PIRQ_TYPE_GSI; 1422 map_irq.index = gsi; 1423 map_irq.pirq = pirq; 1424 1425 rc = HYPERVISOR_physdev_op(PHYSDEVOP_map_pirq, &map_irq); 1426 if (rc) { 1427 pr_warn("xen map irq failed gsi=%d irq=%d pirq=%d rc=%d\n", 1428 gsi, irq, pirq, rc); 1429 xen_free_irq(irq); 1430 continue; 1431 } 1432 1433 printk(KERN_DEBUG "xen: --> irq=%d, pirq=%d\n", irq, map_irq.pirq); 1434 1435 __startup_pirq(irq); 1436 } 1437 } 1438 1439 static void restore_cpu_virqs(unsigned int cpu) 1440 { 1441 struct evtchn_bind_virq bind_virq; 1442 evtchn_port_t evtchn; 1443 int virq, irq; 1444 1445 for (virq = 0; virq < NR_VIRQS; virq++) { 1446 if ((irq = per_cpu(virq_to_irq, cpu)[virq]) == -1) 1447 continue; 1448 1449 BUG_ON(virq_from_irq(irq) != virq); 1450 1451 /* Get a new binding from Xen. */ 1452 bind_virq.virq = virq; 1453 bind_virq.vcpu = xen_vcpu_nr(cpu); 1454 if (HYPERVISOR_event_channel_op(EVTCHNOP_bind_virq, 1455 &bind_virq) != 0) 1456 BUG(); 1457 evtchn = bind_virq.port; 1458 1459 /* Record the new mapping. */ 1460 (void)xen_irq_info_virq_setup(cpu, irq, evtchn, virq); 1461 bind_evtchn_to_cpu(evtchn, cpu); 1462 } 1463 } 1464 1465 static void restore_cpu_ipis(unsigned int cpu) 1466 { 1467 struct evtchn_bind_ipi bind_ipi; 1468 evtchn_port_t evtchn; 1469 int ipi, irq; 1470 1471 for (ipi = 0; ipi < XEN_NR_IPIS; ipi++) { 1472 if ((irq = per_cpu(ipi_to_irq, cpu)[ipi]) == -1) 1473 continue; 1474 1475 BUG_ON(ipi_from_irq(irq) != ipi); 1476 1477 /* Get a new binding from Xen. */ 1478 bind_ipi.vcpu = xen_vcpu_nr(cpu); 1479 if (HYPERVISOR_event_channel_op(EVTCHNOP_bind_ipi, 1480 &bind_ipi) != 0) 1481 BUG(); 1482 evtchn = bind_ipi.port; 1483 1484 /* Record the new mapping. */ 1485 (void)xen_irq_info_ipi_setup(cpu, irq, evtchn, ipi); 1486 bind_evtchn_to_cpu(evtchn, cpu); 1487 } 1488 } 1489 1490 /* Clear an irq's pending state, in preparation for polling on it */ 1491 void xen_clear_irq_pending(int irq) 1492 { 1493 evtchn_port_t evtchn = evtchn_from_irq(irq); 1494 1495 if (VALID_EVTCHN(evtchn)) 1496 clear_evtchn(evtchn); 1497 } 1498 EXPORT_SYMBOL(xen_clear_irq_pending); 1499 void xen_set_irq_pending(int irq) 1500 { 1501 evtchn_port_t evtchn = evtchn_from_irq(irq); 1502 1503 if (VALID_EVTCHN(evtchn)) 1504 set_evtchn(evtchn); 1505 } 1506 1507 bool xen_test_irq_pending(int irq) 1508 { 1509 evtchn_port_t evtchn = evtchn_from_irq(irq); 1510 bool ret = false; 1511 1512 if (VALID_EVTCHN(evtchn)) 1513 ret = test_evtchn(evtchn); 1514 1515 return ret; 1516 } 1517 1518 /* Poll waiting for an irq to become pending with timeout. In the usual case, 1519 * the irq will be disabled so it won't deliver an interrupt. */ 1520 void xen_poll_irq_timeout(int irq, u64 timeout) 1521 { 1522 evtchn_port_t evtchn = evtchn_from_irq(irq); 1523 1524 if (VALID_EVTCHN(evtchn)) { 1525 struct sched_poll poll; 1526 1527 poll.nr_ports = 1; 1528 poll.timeout = timeout; 1529 set_xen_guest_handle(poll.ports, &evtchn); 1530 1531 if (HYPERVISOR_sched_op(SCHEDOP_poll, &poll) != 0) 1532 BUG(); 1533 } 1534 } 1535 EXPORT_SYMBOL(xen_poll_irq_timeout); 1536 /* Poll waiting for an irq to become pending. In the usual case, the 1537 * irq will be disabled so it won't deliver an interrupt. */ 1538 void xen_poll_irq(int irq) 1539 { 1540 xen_poll_irq_timeout(irq, 0 /* no timeout */); 1541 } 1542 1543 /* Check whether the IRQ line is shared with other guests. */ 1544 int xen_test_irq_shared(int irq) 1545 { 1546 struct irq_info *info = info_for_irq(irq); 1547 struct physdev_irq_status_query irq_status; 1548 1549 if (WARN_ON(!info)) 1550 return -ENOENT; 1551 1552 irq_status.irq = info->u.pirq.pirq; 1553 1554 if (HYPERVISOR_physdev_op(PHYSDEVOP_irq_status_query, &irq_status)) 1555 return 0; 1556 return !(irq_status.flags & XENIRQSTAT_shared); 1557 } 1558 EXPORT_SYMBOL_GPL(xen_test_irq_shared); 1559 1560 void xen_irq_resume(void) 1561 { 1562 unsigned int cpu; 1563 struct irq_info *info; 1564 1565 /* New event-channel space is not 'live' yet. */ 1566 xen_evtchn_resume(); 1567 1568 /* No IRQ <-> event-channel mappings. */ 1569 list_for_each_entry(info, &xen_irq_list_head, list) 1570 info->evtchn = 0; /* zap event-channel binding */ 1571 1572 clear_evtchn_to_irq_all(); 1573 1574 for_each_possible_cpu(cpu) { 1575 restore_cpu_virqs(cpu); 1576 restore_cpu_ipis(cpu); 1577 } 1578 1579 restore_pirqs(); 1580 } 1581 1582 static struct irq_chip xen_dynamic_chip __read_mostly = { 1583 .name = "xen-dyn", 1584 1585 .irq_disable = disable_dynirq, 1586 .irq_mask = disable_dynirq, 1587 .irq_unmask = enable_dynirq, 1588 1589 .irq_ack = ack_dynirq, 1590 .irq_mask_ack = mask_ack_dynirq, 1591 1592 .irq_set_affinity = set_affinity_irq, 1593 .irq_retrigger = retrigger_dynirq, 1594 }; 1595 1596 static struct irq_chip xen_pirq_chip __read_mostly = { 1597 .name = "xen-pirq", 1598 1599 .irq_startup = startup_pirq, 1600 .irq_shutdown = shutdown_pirq, 1601 .irq_enable = enable_pirq, 1602 .irq_disable = disable_pirq, 1603 1604 .irq_mask = disable_dynirq, 1605 .irq_unmask = enable_dynirq, 1606 1607 .irq_ack = eoi_pirq, 1608 .irq_eoi = eoi_pirq, 1609 .irq_mask_ack = mask_ack_pirq, 1610 1611 .irq_set_affinity = set_affinity_irq, 1612 1613 .irq_retrigger = retrigger_dynirq, 1614 }; 1615 1616 static struct irq_chip xen_percpu_chip __read_mostly = { 1617 .name = "xen-percpu", 1618 1619 .irq_disable = disable_dynirq, 1620 .irq_mask = disable_dynirq, 1621 .irq_unmask = enable_dynirq, 1622 1623 .irq_ack = ack_dynirq, 1624 }; 1625 1626 int xen_set_callback_via(uint64_t via) 1627 { 1628 struct xen_hvm_param a; 1629 a.domid = DOMID_SELF; 1630 a.index = HVM_PARAM_CALLBACK_IRQ; 1631 a.value = via; 1632 return HYPERVISOR_hvm_op(HVMOP_set_param, &a); 1633 } 1634 EXPORT_SYMBOL_GPL(xen_set_callback_via); 1635 1636 #ifdef CONFIG_XEN_PVHVM 1637 /* Vector callbacks are better than PCI interrupts to receive event 1638 * channel notifications because we can receive vector callbacks on any 1639 * vcpu and we don't need PCI support or APIC interactions. */ 1640 void xen_setup_callback_vector(void) 1641 { 1642 uint64_t callback_via; 1643 1644 if (xen_have_vector_callback) { 1645 callback_via = HVM_CALLBACK_VECTOR(HYPERVISOR_CALLBACK_VECTOR); 1646 if (xen_set_callback_via(callback_via)) { 1647 pr_err("Request for Xen HVM callback vector failed\n"); 1648 xen_have_vector_callback = 0; 1649 } 1650 } 1651 } 1652 1653 static __init void xen_alloc_callback_vector(void) 1654 { 1655 if (!xen_have_vector_callback) 1656 return; 1657 1658 pr_info("Xen HVM callback vector for event delivery is enabled\n"); 1659 alloc_intr_gate(HYPERVISOR_CALLBACK_VECTOR, asm_sysvec_xen_hvm_callback); 1660 } 1661 #else 1662 void xen_setup_callback_vector(void) {} 1663 static inline void xen_alloc_callback_vector(void) {} 1664 #endif 1665 1666 #undef MODULE_PARAM_PREFIX 1667 #define MODULE_PARAM_PREFIX "xen." 1668 1669 static bool fifo_events = true; 1670 module_param(fifo_events, bool, 0); 1671 1672 void __init xen_init_IRQ(void) 1673 { 1674 int ret = -EINVAL; 1675 evtchn_port_t evtchn; 1676 1677 if (fifo_events) 1678 ret = xen_evtchn_fifo_init(); 1679 if (ret < 0) 1680 xen_evtchn_2l_init(); 1681 1682 evtchn_to_irq = kcalloc(EVTCHN_ROW(xen_evtchn_max_channels()), 1683 sizeof(*evtchn_to_irq), GFP_KERNEL); 1684 BUG_ON(!evtchn_to_irq); 1685 1686 /* No event channels are 'live' right now. */ 1687 for (evtchn = 0; evtchn < xen_evtchn_nr_channels(); evtchn++) 1688 mask_evtchn(evtchn); 1689 1690 pirq_needs_eoi = pirq_needs_eoi_flag; 1691 1692 #ifdef CONFIG_X86 1693 if (xen_pv_domain()) { 1694 if (xen_initial_domain()) 1695 pci_xen_initial_domain(); 1696 } 1697 if (xen_feature(XENFEAT_hvm_callback_vector)) { 1698 xen_setup_callback_vector(); 1699 xen_alloc_callback_vector(); 1700 } 1701 1702 if (xen_hvm_domain()) { 1703 native_init_IRQ(); 1704 /* pci_xen_hvm_init must be called after native_init_IRQ so that 1705 * __acpi_register_gsi can point at the right function */ 1706 pci_xen_hvm_init(); 1707 } else { 1708 int rc; 1709 struct physdev_pirq_eoi_gmfn eoi_gmfn; 1710 1711 pirq_eoi_map = (void *)__get_free_page(GFP_KERNEL|__GFP_ZERO); 1712 eoi_gmfn.gmfn = virt_to_gfn(pirq_eoi_map); 1713 rc = HYPERVISOR_physdev_op(PHYSDEVOP_pirq_eoi_gmfn_v2, &eoi_gmfn); 1714 if (rc != 0) { 1715 free_page((unsigned long) pirq_eoi_map); 1716 pirq_eoi_map = NULL; 1717 } else 1718 pirq_needs_eoi = pirq_check_eoi_map; 1719 } 1720 #endif 1721 } 1722