1*f33f5fe2SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later 25f4c9760SMichael S. Tsirkin /* 35f4c9760SMichael S. Tsirkin * Virtio PCI driver - common functionality for all device versions 45f4c9760SMichael S. Tsirkin * 55f4c9760SMichael S. Tsirkin * This module allows virtio devices to be used over a virtual PCI device. 65f4c9760SMichael S. Tsirkin * This can be used with QEMU based VMMs like KVM or Xen. 75f4c9760SMichael S. Tsirkin * 85f4c9760SMichael S. Tsirkin * Copyright IBM Corp. 2007 95f4c9760SMichael S. Tsirkin * Copyright Red Hat, Inc. 2014 105f4c9760SMichael S. Tsirkin * 115f4c9760SMichael S. Tsirkin * Authors: 125f4c9760SMichael S. Tsirkin * Anthony Liguori <aliguori@us.ibm.com> 135f4c9760SMichael S. Tsirkin * Rusty Russell <rusty@rustcorp.com.au> 145f4c9760SMichael S. Tsirkin * Michael S. Tsirkin <mst@redhat.com> 155f4c9760SMichael S. Tsirkin */ 165f4c9760SMichael S. Tsirkin 175f4c9760SMichael S. Tsirkin #include "virtio_pci_common.h" 185f4c9760SMichael S. Tsirkin 19ac399d8fSMichael S. Tsirkin static bool force_legacy = false; 20ac399d8fSMichael S. Tsirkin 21ac399d8fSMichael S. Tsirkin #if IS_ENABLED(CONFIG_VIRTIO_PCI_LEGACY) 22ac399d8fSMichael S. Tsirkin module_param(force_legacy, bool, 0444); 23ac399d8fSMichael S. Tsirkin MODULE_PARM_DESC(force_legacy, 24ac399d8fSMichael S. Tsirkin "Force legacy mode for transitional virtio 1 devices"); 25ac399d8fSMichael S. Tsirkin #endif 26ac399d8fSMichael S. Tsirkin 275f4c9760SMichael S. Tsirkin /* wait for pending irq handlers */ 285f4c9760SMichael S. Tsirkin void vp_synchronize_vectors(struct virtio_device *vdev) 295f4c9760SMichael S. Tsirkin { 305f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vdev); 315f4c9760SMichael S. Tsirkin int i; 325f4c9760SMichael S. Tsirkin 330b0f9dc5SMichael S. Tsirkin if (vp_dev->intx_enabled) 340b0f9dc5SMichael S. Tsirkin synchronize_irq(vp_dev->pci_dev->irq); 350b0f9dc5SMichael S. Tsirkin 360b0f9dc5SMichael S. Tsirkin for (i = 0; i < vp_dev->msix_vectors; ++i) 37fa3a3279SChristoph Hellwig synchronize_irq(pci_irq_vector(vp_dev->pci_dev, i)); 385f4c9760SMichael S. Tsirkin } 395f4c9760SMichael S. Tsirkin 405f4c9760SMichael S. Tsirkin /* the notify function used when creating a virt queue */ 415f4c9760SMichael S. Tsirkin bool vp_notify(struct virtqueue *vq) 425f4c9760SMichael S. Tsirkin { 435f4c9760SMichael S. Tsirkin /* we write the queue's selector into the notification register to 445f4c9760SMichael S. Tsirkin * signal the other end */ 455f4c9760SMichael S. Tsirkin iowrite16(vq->index, (void __iomem *)vq->priv); 465f4c9760SMichael S. Tsirkin return true; 475f4c9760SMichael S. Tsirkin } 485f4c9760SMichael S. Tsirkin 495f4c9760SMichael S. Tsirkin /* Handle a configuration change: Tell driver if it wants to know. */ 505f4c9760SMichael S. Tsirkin static irqreturn_t vp_config_changed(int irq, void *opaque) 515f4c9760SMichael S. Tsirkin { 525f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = opaque; 535f4c9760SMichael S. Tsirkin 545f4c9760SMichael S. Tsirkin virtio_config_changed(&vp_dev->vdev); 555f4c9760SMichael S. Tsirkin return IRQ_HANDLED; 565f4c9760SMichael S. Tsirkin } 575f4c9760SMichael S. Tsirkin 585f4c9760SMichael S. Tsirkin /* Notify all virtqueues on an interrupt. */ 595f4c9760SMichael S. Tsirkin static irqreturn_t vp_vring_interrupt(int irq, void *opaque) 605f4c9760SMichael S. Tsirkin { 615f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = opaque; 620a9b3f47SMichael S. Tsirkin struct virtio_pci_vq_info *info; 635f4c9760SMichael S. Tsirkin irqreturn_t ret = IRQ_NONE; 640a9b3f47SMichael S. Tsirkin unsigned long flags; 655f4c9760SMichael S. Tsirkin 660a9b3f47SMichael S. Tsirkin spin_lock_irqsave(&vp_dev->lock, flags); 670a9b3f47SMichael S. Tsirkin list_for_each_entry(info, &vp_dev->virtqueues, node) { 680a9b3f47SMichael S. Tsirkin if (vring_interrupt(irq, info->vq) == IRQ_HANDLED) 695f4c9760SMichael S. Tsirkin ret = IRQ_HANDLED; 705f4c9760SMichael S. Tsirkin } 710a9b3f47SMichael S. Tsirkin spin_unlock_irqrestore(&vp_dev->lock, flags); 725f4c9760SMichael S. Tsirkin 735f4c9760SMichael S. Tsirkin return ret; 745f4c9760SMichael S. Tsirkin } 755f4c9760SMichael S. Tsirkin 765f4c9760SMichael S. Tsirkin /* A small wrapper to also acknowledge the interrupt when it's handled. 775f4c9760SMichael S. Tsirkin * I really need an EIO hook for the vring so I can ack the interrupt once we 785f4c9760SMichael S. Tsirkin * know that we'll be handling the IRQ but before we invoke the callback since 795f4c9760SMichael S. Tsirkin * the callback may notify the host which results in the host attempting to 805f4c9760SMichael S. Tsirkin * raise an interrupt that we would then mask once we acknowledged the 815f4c9760SMichael S. Tsirkin * interrupt. */ 825f4c9760SMichael S. Tsirkin static irqreturn_t vp_interrupt(int irq, void *opaque) 835f4c9760SMichael S. Tsirkin { 845f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = opaque; 855f4c9760SMichael S. Tsirkin u8 isr; 865f4c9760SMichael S. Tsirkin 875f4c9760SMichael S. Tsirkin /* reading the ISR has the effect of also clearing it so it's very 885f4c9760SMichael S. Tsirkin * important to save off the value. */ 895f4c9760SMichael S. Tsirkin isr = ioread8(vp_dev->isr); 905f4c9760SMichael S. Tsirkin 915f4c9760SMichael S. Tsirkin /* It's definitely not us if the ISR was not high */ 925f4c9760SMichael S. Tsirkin if (!isr) 935f4c9760SMichael S. Tsirkin return IRQ_NONE; 945f4c9760SMichael S. Tsirkin 955f4c9760SMichael S. Tsirkin /* Configuration change? Tell driver if it wants to know. */ 965f4c9760SMichael S. Tsirkin if (isr & VIRTIO_PCI_ISR_CONFIG) 975f4c9760SMichael S. Tsirkin vp_config_changed(irq, opaque); 985f4c9760SMichael S. Tsirkin 995f4c9760SMichael S. Tsirkin return vp_vring_interrupt(irq, opaque); 1005f4c9760SMichael S. Tsirkin } 1015f4c9760SMichael S. Tsirkin 1020b0f9dc5SMichael S. Tsirkin static int vp_request_msix_vectors(struct virtio_device *vdev, int nvectors, 1030b0f9dc5SMichael S. Tsirkin bool per_vq_vectors, struct irq_affinity *desc) 1040b0f9dc5SMichael S. Tsirkin { 1050b0f9dc5SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vdev); 1060b0f9dc5SMichael S. Tsirkin const char *name = dev_name(&vp_dev->vdev.dev); 107ba74b6f7SChristoph Hellwig unsigned flags = PCI_IRQ_MSIX; 1080b0f9dc5SMichael S. Tsirkin unsigned i, v; 1090b0f9dc5SMichael S. Tsirkin int err = -ENOMEM; 1100b0f9dc5SMichael S. Tsirkin 1110b0f9dc5SMichael S. Tsirkin vp_dev->msix_vectors = nvectors; 1120b0f9dc5SMichael S. Tsirkin 1136da2ec56SKees Cook vp_dev->msix_names = kmalloc_array(nvectors, 1146da2ec56SKees Cook sizeof(*vp_dev->msix_names), 1150b0f9dc5SMichael S. Tsirkin GFP_KERNEL); 1160b0f9dc5SMichael S. Tsirkin if (!vp_dev->msix_names) 1170b0f9dc5SMichael S. Tsirkin goto error; 1180b0f9dc5SMichael S. Tsirkin vp_dev->msix_affinity_masks 1196396bb22SKees Cook = kcalloc(nvectors, sizeof(*vp_dev->msix_affinity_masks), 1200b0f9dc5SMichael S. Tsirkin GFP_KERNEL); 1210b0f9dc5SMichael S. Tsirkin if (!vp_dev->msix_affinity_masks) 1220b0f9dc5SMichael S. Tsirkin goto error; 1230b0f9dc5SMichael S. Tsirkin for (i = 0; i < nvectors; ++i) 1240b0f9dc5SMichael S. Tsirkin if (!alloc_cpumask_var(&vp_dev->msix_affinity_masks[i], 1250b0f9dc5SMichael S. Tsirkin GFP_KERNEL)) 1260b0f9dc5SMichael S. Tsirkin goto error; 1270b0f9dc5SMichael S. Tsirkin 128ba74b6f7SChristoph Hellwig if (desc) { 129ba74b6f7SChristoph Hellwig flags |= PCI_IRQ_AFFINITY; 130ba74b6f7SChristoph Hellwig desc->pre_vectors++; /* virtio config vector */ 131ba74b6f7SChristoph Hellwig } 132ba74b6f7SChristoph Hellwig 1330b0f9dc5SMichael S. Tsirkin err = pci_alloc_irq_vectors_affinity(vp_dev->pci_dev, nvectors, 134ba74b6f7SChristoph Hellwig nvectors, flags, desc); 1350b0f9dc5SMichael S. Tsirkin if (err < 0) 1360b0f9dc5SMichael S. Tsirkin goto error; 1370b0f9dc5SMichael S. Tsirkin vp_dev->msix_enabled = 1; 1380b0f9dc5SMichael S. Tsirkin 1390b0f9dc5SMichael S. Tsirkin /* Set the vector used for configuration */ 1400b0f9dc5SMichael S. Tsirkin v = vp_dev->msix_used_vectors; 1410b0f9dc5SMichael S. Tsirkin snprintf(vp_dev->msix_names[v], sizeof *vp_dev->msix_names, 1420b0f9dc5SMichael S. Tsirkin "%s-config", name); 1430b0f9dc5SMichael S. Tsirkin err = request_irq(pci_irq_vector(vp_dev->pci_dev, v), 1440b0f9dc5SMichael S. Tsirkin vp_config_changed, 0, vp_dev->msix_names[v], 1450b0f9dc5SMichael S. Tsirkin vp_dev); 1460b0f9dc5SMichael S. Tsirkin if (err) 1470b0f9dc5SMichael S. Tsirkin goto error; 1480b0f9dc5SMichael S. Tsirkin ++vp_dev->msix_used_vectors; 1490b0f9dc5SMichael S. Tsirkin 1500b0f9dc5SMichael S. Tsirkin v = vp_dev->config_vector(vp_dev, v); 1510b0f9dc5SMichael S. Tsirkin /* Verify we had enough resources to assign the vector */ 1520b0f9dc5SMichael S. Tsirkin if (v == VIRTIO_MSI_NO_VECTOR) { 1530b0f9dc5SMichael S. Tsirkin err = -EBUSY; 1540b0f9dc5SMichael S. Tsirkin goto error; 1550b0f9dc5SMichael S. Tsirkin } 1560b0f9dc5SMichael S. Tsirkin 1570b0f9dc5SMichael S. Tsirkin if (!per_vq_vectors) { 1580b0f9dc5SMichael S. Tsirkin /* Shared vector for all VQs */ 1590b0f9dc5SMichael S. Tsirkin v = vp_dev->msix_used_vectors; 1600b0f9dc5SMichael S. Tsirkin snprintf(vp_dev->msix_names[v], sizeof *vp_dev->msix_names, 1610b0f9dc5SMichael S. Tsirkin "%s-virtqueues", name); 1620b0f9dc5SMichael S. Tsirkin err = request_irq(pci_irq_vector(vp_dev->pci_dev, v), 1630b0f9dc5SMichael S. Tsirkin vp_vring_interrupt, 0, vp_dev->msix_names[v], 1640b0f9dc5SMichael S. Tsirkin vp_dev); 1650b0f9dc5SMichael S. Tsirkin if (err) 1660b0f9dc5SMichael S. Tsirkin goto error; 1670b0f9dc5SMichael S. Tsirkin ++vp_dev->msix_used_vectors; 1680b0f9dc5SMichael S. Tsirkin } 1690b0f9dc5SMichael S. Tsirkin return 0; 1700b0f9dc5SMichael S. Tsirkin error: 1710b0f9dc5SMichael S. Tsirkin return err; 1720b0f9dc5SMichael S. Tsirkin } 1730b0f9dc5SMichael S. Tsirkin 1740a9b3f47SMichael S. Tsirkin static struct virtqueue *vp_setup_vq(struct virtio_device *vdev, unsigned index, 1750a9b3f47SMichael S. Tsirkin void (*callback)(struct virtqueue *vq), 1760a9b3f47SMichael S. Tsirkin const char *name, 177f94682ddSMichael S. Tsirkin bool ctx, 1780a9b3f47SMichael S. Tsirkin u16 msix_vec) 1790a9b3f47SMichael S. Tsirkin { 1800a9b3f47SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vdev); 1810a9b3f47SMichael S. Tsirkin struct virtio_pci_vq_info *info = kmalloc(sizeof *info, GFP_KERNEL); 1820a9b3f47SMichael S. Tsirkin struct virtqueue *vq; 1830a9b3f47SMichael S. Tsirkin unsigned long flags; 1840a9b3f47SMichael S. Tsirkin 1850a9b3f47SMichael S. Tsirkin /* fill out our structure that represents an active queue */ 1860a9b3f47SMichael S. Tsirkin if (!info) 1870a9b3f47SMichael S. Tsirkin return ERR_PTR(-ENOMEM); 1880a9b3f47SMichael S. Tsirkin 189f94682ddSMichael S. Tsirkin vq = vp_dev->setup_vq(vp_dev, info, index, callback, name, ctx, 1900a9b3f47SMichael S. Tsirkin msix_vec); 1910a9b3f47SMichael S. Tsirkin if (IS_ERR(vq)) 1920a9b3f47SMichael S. Tsirkin goto out_info; 1930a9b3f47SMichael S. Tsirkin 1940a9b3f47SMichael S. Tsirkin info->vq = vq; 1950a9b3f47SMichael S. Tsirkin if (callback) { 1960a9b3f47SMichael S. Tsirkin spin_lock_irqsave(&vp_dev->lock, flags); 1970a9b3f47SMichael S. Tsirkin list_add(&info->node, &vp_dev->virtqueues); 1980a9b3f47SMichael S. Tsirkin spin_unlock_irqrestore(&vp_dev->lock, flags); 1990a9b3f47SMichael S. Tsirkin } else { 2000a9b3f47SMichael S. Tsirkin INIT_LIST_HEAD(&info->node); 2010a9b3f47SMichael S. Tsirkin } 2020a9b3f47SMichael S. Tsirkin 2030a9b3f47SMichael S. Tsirkin vp_dev->vqs[index] = info; 2040a9b3f47SMichael S. Tsirkin return vq; 2050a9b3f47SMichael S. Tsirkin 2060a9b3f47SMichael S. Tsirkin out_info: 2070a9b3f47SMichael S. Tsirkin kfree(info); 2080a9b3f47SMichael S. Tsirkin return vq; 2090a9b3f47SMichael S. Tsirkin } 2100a9b3f47SMichael S. Tsirkin 2110a9b3f47SMichael S. Tsirkin static void vp_del_vq(struct virtqueue *vq) 2120a9b3f47SMichael S. Tsirkin { 2130a9b3f47SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vq->vdev); 2140a9b3f47SMichael S. Tsirkin struct virtio_pci_vq_info *info = vp_dev->vqs[vq->index]; 2150a9b3f47SMichael S. Tsirkin unsigned long flags; 2160a9b3f47SMichael S. Tsirkin 2170a9b3f47SMichael S. Tsirkin spin_lock_irqsave(&vp_dev->lock, flags); 2180a9b3f47SMichael S. Tsirkin list_del(&info->node); 2190a9b3f47SMichael S. Tsirkin spin_unlock_irqrestore(&vp_dev->lock, flags); 2200a9b3f47SMichael S. Tsirkin 2210a9b3f47SMichael S. Tsirkin vp_dev->del_vq(info); 2220a9b3f47SMichael S. Tsirkin kfree(info); 2230a9b3f47SMichael S. Tsirkin } 2240a9b3f47SMichael S. Tsirkin 2250b0f9dc5SMichael S. Tsirkin /* the config->del_vqs() implementation */ 2260b0f9dc5SMichael S. Tsirkin void vp_del_vqs(struct virtio_device *vdev) 2275f4c9760SMichael S. Tsirkin { 2285f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vdev); 2295f4c9760SMichael S. Tsirkin struct virtqueue *vq, *n; 2300b0f9dc5SMichael S. Tsirkin int i; 2315f4c9760SMichael S. Tsirkin 2325f4c9760SMichael S. Tsirkin list_for_each_entry_safe(vq, n, &vdev->vqs, list) { 2330a9b3f47SMichael S. Tsirkin if (vp_dev->per_vq_vectors) { 2340a9b3f47SMichael S. Tsirkin int v = vp_dev->vqs[vq->index]->msix_vector; 235fa3a3279SChristoph Hellwig 2362f8dc3a0SMarc Zyngier if (v != VIRTIO_MSI_NO_VECTOR) { 2372f8dc3a0SMarc Zyngier int irq = pci_irq_vector(vp_dev->pci_dev, v); 2382f8dc3a0SMarc Zyngier 2392f8dc3a0SMarc Zyngier irq_set_affinity_hint(irq, NULL); 2402f8dc3a0SMarc Zyngier free_irq(irq, vq); 2412f8dc3a0SMarc Zyngier } 242fa3a3279SChristoph Hellwig } 2430a9b3f47SMichael S. Tsirkin vp_del_vq(vq); 2445f4c9760SMichael S. Tsirkin } 2450a9b3f47SMichael S. Tsirkin vp_dev->per_vq_vectors = false; 2460b0f9dc5SMichael S. Tsirkin 2470b0f9dc5SMichael S. Tsirkin if (vp_dev->intx_enabled) { 2480b0f9dc5SMichael S. Tsirkin free_irq(vp_dev->pci_dev->irq, vp_dev); 2490b0f9dc5SMichael S. Tsirkin vp_dev->intx_enabled = 0; 25066f2f555SChristoph Hellwig } 25166f2f555SChristoph Hellwig 2520b0f9dc5SMichael S. Tsirkin for (i = 0; i < vp_dev->msix_used_vectors; ++i) 2530b0f9dc5SMichael S. Tsirkin free_irq(pci_irq_vector(vp_dev->pci_dev, i), vp_dev); 25466f2f555SChristoph Hellwig 2556a8aae68SLongpeng if (vp_dev->msix_affinity_masks) { 25607ec5148SChristoph Hellwig for (i = 0; i < vp_dev->msix_vectors; i++) 2570b0f9dc5SMichael S. Tsirkin if (vp_dev->msix_affinity_masks[i]) 25807ec5148SChristoph Hellwig free_cpumask_var(vp_dev->msix_affinity_masks[i]); 2596a8aae68SLongpeng } 26007ec5148SChristoph Hellwig 2610b0f9dc5SMichael S. Tsirkin if (vp_dev->msix_enabled) { 26266f2f555SChristoph Hellwig /* Disable the vector used for configuration */ 26366f2f555SChristoph Hellwig vp_dev->config_vector(vp_dev, VIRTIO_MSI_NO_VECTOR); 26466f2f555SChristoph Hellwig 2650b0f9dc5SMichael S. Tsirkin pci_free_irq_vectors(vp_dev->pci_dev); 2660b0f9dc5SMichael S. Tsirkin vp_dev->msix_enabled = 0; 26766f2f555SChristoph Hellwig } 26866f2f555SChristoph Hellwig 2690b0f9dc5SMichael S. Tsirkin vp_dev->msix_vectors = 0; 2700b0f9dc5SMichael S. Tsirkin vp_dev->msix_used_vectors = 0; 2710b0f9dc5SMichael S. Tsirkin kfree(vp_dev->msix_names); 2720b0f9dc5SMichael S. Tsirkin vp_dev->msix_names = NULL; 2730b0f9dc5SMichael S. Tsirkin kfree(vp_dev->msix_affinity_masks); 2740b0f9dc5SMichael S. Tsirkin vp_dev->msix_affinity_masks = NULL; 2750a9b3f47SMichael S. Tsirkin kfree(vp_dev->vqs); 2760a9b3f47SMichael S. Tsirkin vp_dev->vqs = NULL; 2775f4c9760SMichael S. Tsirkin } 2785f4c9760SMichael S. Tsirkin 279a3cbec69SChristoph Hellwig static int vp_find_vqs_msix(struct virtio_device *vdev, unsigned nvqs, 28052a61516SChristoph Hellwig struct virtqueue *vqs[], vq_callback_t *callbacks[], 281bf951b10SMichael S. Tsirkin const char * const names[], bool per_vq_vectors, 282f94682ddSMichael S. Tsirkin const bool *ctx, 283bf951b10SMichael S. Tsirkin struct irq_affinity *desc) 2845f4c9760SMichael S. Tsirkin { 2855f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vdev); 2865f4c9760SMichael S. Tsirkin u16 msix_vec; 287ddbeac07SWei Wang int i, err, nvectors, allocated_vectors, queue_idx = 0; 2885f4c9760SMichael S. Tsirkin 2890a9b3f47SMichael S. Tsirkin vp_dev->vqs = kcalloc(nvqs, sizeof(*vp_dev->vqs), GFP_KERNEL); 2900a9b3f47SMichael S. Tsirkin if (!vp_dev->vqs) 2910a9b3f47SMichael S. Tsirkin return -ENOMEM; 2920a9b3f47SMichael S. Tsirkin 293bf951b10SMichael S. Tsirkin if (per_vq_vectors) { 2940b0f9dc5SMichael S. Tsirkin /* Best option: one for change interrupt, one per vq. */ 2950b0f9dc5SMichael S. Tsirkin nvectors = 1; 2960b0f9dc5SMichael S. Tsirkin for (i = 0; i < nvqs; ++i) 2970b0f9dc5SMichael S. Tsirkin if (callbacks[i]) 2980b0f9dc5SMichael S. Tsirkin ++nvectors; 299bf951b10SMichael S. Tsirkin } else { 3000b0f9dc5SMichael S. Tsirkin /* Second best: one for change, shared for all vqs. */ 3010b0f9dc5SMichael S. Tsirkin nvectors = 2; 3025f4c9760SMichael S. Tsirkin } 3035f4c9760SMichael S. Tsirkin 3040b0f9dc5SMichael S. Tsirkin err = vp_request_msix_vectors(vdev, nvectors, per_vq_vectors, 3050b0f9dc5SMichael S. Tsirkin per_vq_vectors ? desc : NULL); 3065f4c9760SMichael S. Tsirkin if (err) 3070b0f9dc5SMichael S. Tsirkin goto error_find; 3085f4c9760SMichael S. Tsirkin 3090a9b3f47SMichael S. Tsirkin vp_dev->per_vq_vectors = per_vq_vectors; 3100b0f9dc5SMichael S. Tsirkin allocated_vectors = vp_dev->msix_used_vectors; 3115f4c9760SMichael S. Tsirkin for (i = 0; i < nvqs; ++i) { 3125f4c9760SMichael S. Tsirkin if (!names[i]) { 3135f4c9760SMichael S. Tsirkin vqs[i] = NULL; 3145f4c9760SMichael S. Tsirkin continue; 315a3cbec69SChristoph Hellwig } 316a3cbec69SChristoph Hellwig 3170b0f9dc5SMichael S. Tsirkin if (!callbacks[i]) 31807ec5148SChristoph Hellwig msix_vec = VIRTIO_MSI_NO_VECTOR; 3190a9b3f47SMichael S. Tsirkin else if (vp_dev->per_vq_vectors) 3200b0f9dc5SMichael S. Tsirkin msix_vec = allocated_vectors++; 3210b0f9dc5SMichael S. Tsirkin else 3220b0f9dc5SMichael S. Tsirkin msix_vec = VP_MSIX_VQ_VECTOR; 323ddbeac07SWei Wang vqs[i] = vp_setup_vq(vdev, queue_idx++, callbacks[i], names[i], 324f94682ddSMichael S. Tsirkin ctx ? ctx[i] : false, 3255c34d002SChristoph Hellwig msix_vec); 3265f4c9760SMichael S. Tsirkin if (IS_ERR(vqs[i])) { 3275f4c9760SMichael S. Tsirkin err = PTR_ERR(vqs[i]); 3280b0f9dc5SMichael S. Tsirkin goto error_find; 3295f4c9760SMichael S. Tsirkin } 3305f4c9760SMichael S. Tsirkin 3310a9b3f47SMichael S. Tsirkin if (!vp_dev->per_vq_vectors || msix_vec == VIRTIO_MSI_NO_VECTOR) 3320b0f9dc5SMichael S. Tsirkin continue; 3330b0f9dc5SMichael S. Tsirkin 3340b0f9dc5SMichael S. Tsirkin /* allocate per-vq irq if available and necessary */ 3350b0f9dc5SMichael S. Tsirkin snprintf(vp_dev->msix_names[msix_vec], 3360b0f9dc5SMichael S. Tsirkin sizeof *vp_dev->msix_names, 3370b0f9dc5SMichael S. Tsirkin "%s-%s", 3385f4c9760SMichael S. Tsirkin dev_name(&vp_dev->vdev.dev), names[i]); 339fa3a3279SChristoph Hellwig err = request_irq(pci_irq_vector(vp_dev->pci_dev, msix_vec), 3400b0f9dc5SMichael S. Tsirkin vring_interrupt, 0, 3410b0f9dc5SMichael S. Tsirkin vp_dev->msix_names[msix_vec], 3420b0f9dc5SMichael S. Tsirkin vqs[i]); 3430a9b3f47SMichael S. Tsirkin if (err) 3440b0f9dc5SMichael S. Tsirkin goto error_find; 3455f4c9760SMichael S. Tsirkin } 3465f4c9760SMichael S. Tsirkin return 0; 3475f4c9760SMichael S. Tsirkin 3480b0f9dc5SMichael S. Tsirkin error_find: 3490b0f9dc5SMichael S. Tsirkin vp_del_vqs(vdev); 3505f4c9760SMichael S. Tsirkin return err; 3515f4c9760SMichael S. Tsirkin } 3525f4c9760SMichael S. Tsirkin 353a3cbec69SChristoph Hellwig static int vp_find_vqs_intx(struct virtio_device *vdev, unsigned nvqs, 354a3cbec69SChristoph Hellwig struct virtqueue *vqs[], vq_callback_t *callbacks[], 355f94682ddSMichael S. Tsirkin const char * const names[], const bool *ctx) 356a3cbec69SChristoph Hellwig { 357a3cbec69SChristoph Hellwig struct virtio_pci_device *vp_dev = to_vp_device(vdev); 358ddbeac07SWei Wang int i, err, queue_idx = 0; 359a3cbec69SChristoph Hellwig 3600a9b3f47SMichael S. Tsirkin vp_dev->vqs = kcalloc(nvqs, sizeof(*vp_dev->vqs), GFP_KERNEL); 3610a9b3f47SMichael S. Tsirkin if (!vp_dev->vqs) 3620a9b3f47SMichael S. Tsirkin return -ENOMEM; 3630a9b3f47SMichael S. Tsirkin 364a3cbec69SChristoph Hellwig err = request_irq(vp_dev->pci_dev->irq, vp_interrupt, IRQF_SHARED, 365a3cbec69SChristoph Hellwig dev_name(&vdev->dev), vp_dev); 366a3cbec69SChristoph Hellwig if (err) 3670b0f9dc5SMichael S. Tsirkin goto out_del_vqs; 368a3cbec69SChristoph Hellwig 3690b0f9dc5SMichael S. Tsirkin vp_dev->intx_enabled = 1; 3700a9b3f47SMichael S. Tsirkin vp_dev->per_vq_vectors = false; 371a3cbec69SChristoph Hellwig for (i = 0; i < nvqs; ++i) { 372a3cbec69SChristoph Hellwig if (!names[i]) { 373a3cbec69SChristoph Hellwig vqs[i] = NULL; 374a3cbec69SChristoph Hellwig continue; 375a3cbec69SChristoph Hellwig } 376ddbeac07SWei Wang vqs[i] = vp_setup_vq(vdev, queue_idx++, callbacks[i], names[i], 377f94682ddSMichael S. Tsirkin ctx ? ctx[i] : false, 378a3cbec69SChristoph Hellwig VIRTIO_MSI_NO_VECTOR); 379a3cbec69SChristoph Hellwig if (IS_ERR(vqs[i])) { 380a3cbec69SChristoph Hellwig err = PTR_ERR(vqs[i]); 3810b0f9dc5SMichael S. Tsirkin goto out_del_vqs; 382a3cbec69SChristoph Hellwig } 383a3cbec69SChristoph Hellwig } 384a3cbec69SChristoph Hellwig 385a3cbec69SChristoph Hellwig return 0; 3860b0f9dc5SMichael S. Tsirkin out_del_vqs: 3870b0f9dc5SMichael S. Tsirkin vp_del_vqs(vdev); 388a3cbec69SChristoph Hellwig return err; 389a3cbec69SChristoph Hellwig } 390a3cbec69SChristoph Hellwig 3915f4c9760SMichael S. Tsirkin /* the config->find_vqs() implementation */ 3925f4c9760SMichael S. Tsirkin int vp_find_vqs(struct virtio_device *vdev, unsigned nvqs, 393fb5e31d9SChristoph Hellwig struct virtqueue *vqs[], vq_callback_t *callbacks[], 394f94682ddSMichael S. Tsirkin const char * const names[], const bool *ctx, 395f94682ddSMichael S. Tsirkin struct irq_affinity *desc) 3965f4c9760SMichael S. Tsirkin { 3975f4c9760SMichael S. Tsirkin int err; 3985f4c9760SMichael S. Tsirkin 399bf951b10SMichael S. Tsirkin /* Try MSI-X with one vector per queue. */ 400f94682ddSMichael S. Tsirkin err = vp_find_vqs_msix(vdev, nvqs, vqs, callbacks, names, true, ctx, desc); 4015f4c9760SMichael S. Tsirkin if (!err) 4025f4c9760SMichael S. Tsirkin return 0; 403bf951b10SMichael S. Tsirkin /* Fallback: MSI-X with one vector for config, one shared for queues. */ 404f94682ddSMichael S. Tsirkin err = vp_find_vqs_msix(vdev, nvqs, vqs, callbacks, names, false, ctx, desc); 405bf951b10SMichael S. Tsirkin if (!err) 406bf951b10SMichael S. Tsirkin return 0; 407bf951b10SMichael S. Tsirkin /* Finally fall back to regular interrupts. */ 408f94682ddSMichael S. Tsirkin return vp_find_vqs_intx(vdev, nvqs, vqs, callbacks, names, ctx); 4095f4c9760SMichael S. Tsirkin } 4105f4c9760SMichael S. Tsirkin 4115f4c9760SMichael S. Tsirkin const char *vp_bus_name(struct virtio_device *vdev) 4125f4c9760SMichael S. Tsirkin { 4135f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vdev); 4145f4c9760SMichael S. Tsirkin 4155f4c9760SMichael S. Tsirkin return pci_name(vp_dev->pci_dev); 4165f4c9760SMichael S. Tsirkin } 4175f4c9760SMichael S. Tsirkin 4185f4c9760SMichael S. Tsirkin /* Setup the affinity for a virtqueue: 4195f4c9760SMichael S. Tsirkin * - force the affinity for per vq vector 4205f4c9760SMichael S. Tsirkin * - OR over all affinities for shared MSI 4215f4c9760SMichael S. Tsirkin * - ignore the affinity request if we're using INTX 4225f4c9760SMichael S. Tsirkin */ 42319e226e8SCaleb Raitto int vp_set_vq_affinity(struct virtqueue *vq, const struct cpumask *cpu_mask) 4245f4c9760SMichael S. Tsirkin { 4255f4c9760SMichael S. Tsirkin struct virtio_device *vdev = vq->vdev; 4265f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vdev); 4270a9b3f47SMichael S. Tsirkin struct virtio_pci_vq_info *info = vp_dev->vqs[vq->index]; 4280a9b3f47SMichael S. Tsirkin struct cpumask *mask; 4290a9b3f47SMichael S. Tsirkin unsigned int irq; 4305f4c9760SMichael S. Tsirkin 4315f4c9760SMichael S. Tsirkin if (!vq->callback) 4325f4c9760SMichael S. Tsirkin return -EINVAL; 4335f4c9760SMichael S. Tsirkin 4342008c154SMichael S. Tsirkin if (vp_dev->msix_enabled) { 4350a9b3f47SMichael S. Tsirkin mask = vp_dev->msix_affinity_masks[info->msix_vector]; 4360a9b3f47SMichael S. Tsirkin irq = pci_irq_vector(vp_dev->pci_dev, info->msix_vector); 43719e226e8SCaleb Raitto if (!cpu_mask) 4385f4c9760SMichael S. Tsirkin irq_set_affinity_hint(irq, NULL); 4395f4c9760SMichael S. Tsirkin else { 44019e226e8SCaleb Raitto cpumask_copy(mask, cpu_mask); 4415f4c9760SMichael S. Tsirkin irq_set_affinity_hint(irq, mask); 4425f4c9760SMichael S. Tsirkin } 4435f4c9760SMichael S. Tsirkin } 4445f4c9760SMichael S. Tsirkin return 0; 4455f4c9760SMichael S. Tsirkin } 4465f4c9760SMichael S. Tsirkin 447bbaba479SChristoph Hellwig const struct cpumask *vp_get_vq_affinity(struct virtio_device *vdev, int index) 448bbaba479SChristoph Hellwig { 449bbaba479SChristoph Hellwig struct virtio_pci_device *vp_dev = to_vp_device(vdev); 450bbaba479SChristoph Hellwig 4510a9b3f47SMichael S. Tsirkin if (!vp_dev->per_vq_vectors || 4520a9b3f47SMichael S. Tsirkin vp_dev->vqs[index]->msix_vector == VIRTIO_MSI_NO_VECTOR) 453bbaba479SChristoph Hellwig return NULL; 454bbaba479SChristoph Hellwig 4550a9b3f47SMichael S. Tsirkin return pci_irq_get_affinity(vp_dev->pci_dev, 4560a9b3f47SMichael S. Tsirkin vp_dev->vqs[index]->msix_vector); 457bbaba479SChristoph Hellwig } 458bbaba479SChristoph Hellwig 4595f4c9760SMichael S. Tsirkin #ifdef CONFIG_PM_SLEEP 4605f4c9760SMichael S. Tsirkin static int virtio_pci_freeze(struct device *dev) 4615f4c9760SMichael S. Tsirkin { 4625f4c9760SMichael S. Tsirkin struct pci_dev *pci_dev = to_pci_dev(dev); 4635f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = pci_get_drvdata(pci_dev); 4645f4c9760SMichael S. Tsirkin int ret; 4655f4c9760SMichael S. Tsirkin 4665f4c9760SMichael S. Tsirkin ret = virtio_device_freeze(&vp_dev->vdev); 4675f4c9760SMichael S. Tsirkin 4685f4c9760SMichael S. Tsirkin if (!ret) 4695f4c9760SMichael S. Tsirkin pci_disable_device(pci_dev); 4705f4c9760SMichael S. Tsirkin return ret; 4715f4c9760SMichael S. Tsirkin } 4725f4c9760SMichael S. Tsirkin 4735f4c9760SMichael S. Tsirkin static int virtio_pci_restore(struct device *dev) 4745f4c9760SMichael S. Tsirkin { 4755f4c9760SMichael S. Tsirkin struct pci_dev *pci_dev = to_pci_dev(dev); 4765f4c9760SMichael S. Tsirkin struct virtio_pci_device *vp_dev = pci_get_drvdata(pci_dev); 4775f4c9760SMichael S. Tsirkin int ret; 4785f4c9760SMichael S. Tsirkin 4795f4c9760SMichael S. Tsirkin ret = pci_enable_device(pci_dev); 4805f4c9760SMichael S. Tsirkin if (ret) 4815f4c9760SMichael S. Tsirkin return ret; 4825f4c9760SMichael S. Tsirkin 4835f4c9760SMichael S. Tsirkin pci_set_master(pci_dev); 4845f4c9760SMichael S. Tsirkin return virtio_device_restore(&vp_dev->vdev); 4855f4c9760SMichael S. Tsirkin } 4865f4c9760SMichael S. Tsirkin 4879a4253dbSMichael S. Tsirkin static const struct dev_pm_ops virtio_pci_pm_ops = { 4885f4c9760SMichael S. Tsirkin SET_SYSTEM_SLEEP_PM_OPS(virtio_pci_freeze, virtio_pci_restore) 4895f4c9760SMichael S. Tsirkin }; 4905f4c9760SMichael S. Tsirkin #endif 4919a4253dbSMichael S. Tsirkin 4929a4253dbSMichael S. Tsirkin 4939a4253dbSMichael S. Tsirkin /* Qumranet donated their vendor ID for devices 0x1000 thru 0x10FF. */ 4949a4253dbSMichael S. Tsirkin static const struct pci_device_id virtio_pci_id_table[] = { 495caf02abfSRobin H. Johnson { PCI_DEVICE(PCI_VENDOR_ID_REDHAT_QUMRANET, PCI_ANY_ID) }, 4969a4253dbSMichael S. Tsirkin { 0 } 4979a4253dbSMichael S. Tsirkin }; 4989a4253dbSMichael S. Tsirkin 4999a4253dbSMichael S. Tsirkin MODULE_DEVICE_TABLE(pci, virtio_pci_id_table); 5009a4253dbSMichael S. Tsirkin 501ff31d2e2SMichael S. Tsirkin static void virtio_pci_release_dev(struct device *_d) 502ff31d2e2SMichael S. Tsirkin { 503ff31d2e2SMichael S. Tsirkin struct virtio_device *vdev = dev_to_virtio(_d); 504ff31d2e2SMichael S. Tsirkin struct virtio_pci_device *vp_dev = to_vp_device(vdev); 505ff31d2e2SMichael S. Tsirkin 506ff31d2e2SMichael S. Tsirkin /* As struct device is a kobject, it's not safe to 507ff31d2e2SMichael S. Tsirkin * free the memory (including the reference counter itself) 508ff31d2e2SMichael S. Tsirkin * until it's release callback. */ 509ff31d2e2SMichael S. Tsirkin kfree(vp_dev); 510ff31d2e2SMichael S. Tsirkin } 511ff31d2e2SMichael S. Tsirkin 5129a4253dbSMichael S. Tsirkin static int virtio_pci_probe(struct pci_dev *pci_dev, 5139a4253dbSMichael S. Tsirkin const struct pci_device_id *id) 5149a4253dbSMichael S. Tsirkin { 51533635bd9Sweiping zhang struct virtio_pci_device *vp_dev, *reg_dev = NULL; 516ff31d2e2SMichael S. Tsirkin int rc; 517ff31d2e2SMichael S. Tsirkin 518ff31d2e2SMichael S. Tsirkin /* allocate our structure and fill it out */ 519ff31d2e2SMichael S. Tsirkin vp_dev = kzalloc(sizeof(struct virtio_pci_device), GFP_KERNEL); 520ff31d2e2SMichael S. Tsirkin if (!vp_dev) 521ff31d2e2SMichael S. Tsirkin return -ENOMEM; 522ff31d2e2SMichael S. Tsirkin 523ff31d2e2SMichael S. Tsirkin pci_set_drvdata(pci_dev, vp_dev); 524ff31d2e2SMichael S. Tsirkin vp_dev->vdev.dev.parent = &pci_dev->dev; 525ff31d2e2SMichael S. Tsirkin vp_dev->vdev.dev.release = virtio_pci_release_dev; 526ff31d2e2SMichael S. Tsirkin vp_dev->pci_dev = pci_dev; 5270a9b3f47SMichael S. Tsirkin INIT_LIST_HEAD(&vp_dev->virtqueues); 5280a9b3f47SMichael S. Tsirkin spin_lock_init(&vp_dev->lock); 529ff31d2e2SMichael S. Tsirkin 530ff31d2e2SMichael S. Tsirkin /* enable the device */ 531ff31d2e2SMichael S. Tsirkin rc = pci_enable_device(pci_dev); 532ff31d2e2SMichael S. Tsirkin if (rc) 533ff31d2e2SMichael S. Tsirkin goto err_enable_device; 534ff31d2e2SMichael S. Tsirkin 535ac399d8fSMichael S. Tsirkin if (force_legacy) { 536ac399d8fSMichael S. Tsirkin rc = virtio_pci_legacy_probe(vp_dev); 537ac399d8fSMichael S. Tsirkin /* Also try modern mode if we can't map BAR0 (no IO space). */ 538ac399d8fSMichael S. Tsirkin if (rc == -ENODEV || rc == -ENOMEM) 539ac399d8fSMichael S. Tsirkin rc = virtio_pci_modern_probe(vp_dev); 540ac399d8fSMichael S. Tsirkin if (rc) 541ac399d8fSMichael S. Tsirkin goto err_probe; 542ac399d8fSMichael S. Tsirkin } else { 5431fcf0512SMichael S. Tsirkin rc = virtio_pci_modern_probe(vp_dev); 5441fcf0512SMichael S. Tsirkin if (rc == -ENODEV) 545ff31d2e2SMichael S. Tsirkin rc = virtio_pci_legacy_probe(vp_dev); 546ff31d2e2SMichael S. Tsirkin if (rc) 547ff31d2e2SMichael S. Tsirkin goto err_probe; 548ac399d8fSMichael S. Tsirkin } 549ff31d2e2SMichael S. Tsirkin 550ff31d2e2SMichael S. Tsirkin pci_set_master(pci_dev); 551ff31d2e2SMichael S. Tsirkin 552ff31d2e2SMichael S. Tsirkin rc = register_virtio_device(&vp_dev->vdev); 55333635bd9Sweiping zhang reg_dev = vp_dev; 554ff31d2e2SMichael S. Tsirkin if (rc) 555ff31d2e2SMichael S. Tsirkin goto err_register; 556ff31d2e2SMichael S. Tsirkin 557ff31d2e2SMichael S. Tsirkin return 0; 558ff31d2e2SMichael S. Tsirkin 559ff31d2e2SMichael S. Tsirkin err_register: 5601fcf0512SMichael S. Tsirkin if (vp_dev->ioaddr) 561ff31d2e2SMichael S. Tsirkin virtio_pci_legacy_remove(vp_dev); 5621fcf0512SMichael S. Tsirkin else 5631fcf0512SMichael S. Tsirkin virtio_pci_modern_remove(vp_dev); 564ff31d2e2SMichael S. Tsirkin err_probe: 565ff31d2e2SMichael S. Tsirkin pci_disable_device(pci_dev); 566ff31d2e2SMichael S. Tsirkin err_enable_device: 56733635bd9Sweiping zhang if (reg_dev) 56833635bd9Sweiping zhang put_device(&vp_dev->vdev.dev); 56933635bd9Sweiping zhang else 570ff31d2e2SMichael S. Tsirkin kfree(vp_dev); 571ff31d2e2SMichael S. Tsirkin return rc; 5729a4253dbSMichael S. Tsirkin } 5739a4253dbSMichael S. Tsirkin 5749a4253dbSMichael S. Tsirkin static void virtio_pci_remove(struct pci_dev *pci_dev) 5759a4253dbSMichael S. Tsirkin { 576ff31d2e2SMichael S. Tsirkin struct virtio_pci_device *vp_dev = pci_get_drvdata(pci_dev); 5772989be09SMichael S. Tsirkin struct device *dev = get_device(&vp_dev->vdev.dev); 578ff31d2e2SMichael S. Tsirkin 579cfecc291STiwei Bie pci_disable_sriov(pci_dev); 580cfecc291STiwei Bie 581ff31d2e2SMichael S. Tsirkin unregister_virtio_device(&vp_dev->vdev); 582ff31d2e2SMichael S. Tsirkin 5831fcf0512SMichael S. Tsirkin if (vp_dev->ioaddr) 5841fcf0512SMichael S. Tsirkin virtio_pci_legacy_remove(vp_dev); 5851fcf0512SMichael S. Tsirkin else 5861fcf0512SMichael S. Tsirkin virtio_pci_modern_remove(vp_dev); 587ff31d2e2SMichael S. Tsirkin 588ff31d2e2SMichael S. Tsirkin pci_disable_device(pci_dev); 5892989be09SMichael S. Tsirkin put_device(dev); 5909a4253dbSMichael S. Tsirkin } 5919a4253dbSMichael S. Tsirkin 592cfecc291STiwei Bie static int virtio_pci_sriov_configure(struct pci_dev *pci_dev, int num_vfs) 593cfecc291STiwei Bie { 594cfecc291STiwei Bie struct virtio_pci_device *vp_dev = pci_get_drvdata(pci_dev); 595cfecc291STiwei Bie struct virtio_device *vdev = &vp_dev->vdev; 596cfecc291STiwei Bie int ret; 597cfecc291STiwei Bie 598cfecc291STiwei Bie if (!(vdev->config->get_status(vdev) & VIRTIO_CONFIG_S_DRIVER_OK)) 599cfecc291STiwei Bie return -EBUSY; 600cfecc291STiwei Bie 601cfecc291STiwei Bie if (!__virtio_test_bit(vdev, VIRTIO_F_SR_IOV)) 602cfecc291STiwei Bie return -EINVAL; 603cfecc291STiwei Bie 604cfecc291STiwei Bie if (pci_vfs_assigned(pci_dev)) 605cfecc291STiwei Bie return -EPERM; 606cfecc291STiwei Bie 607cfecc291STiwei Bie if (num_vfs == 0) { 608cfecc291STiwei Bie pci_disable_sriov(pci_dev); 609cfecc291STiwei Bie return 0; 610cfecc291STiwei Bie } 611cfecc291STiwei Bie 612cfecc291STiwei Bie ret = pci_enable_sriov(pci_dev, num_vfs); 613cfecc291STiwei Bie if (ret < 0) 614cfecc291STiwei Bie return ret; 615cfecc291STiwei Bie 616cfecc291STiwei Bie return num_vfs; 617cfecc291STiwei Bie } 618cfecc291STiwei Bie 6199a4253dbSMichael S. Tsirkin static struct pci_driver virtio_pci_driver = { 6209a4253dbSMichael S. Tsirkin .name = "virtio-pci", 6219a4253dbSMichael S. Tsirkin .id_table = virtio_pci_id_table, 6229a4253dbSMichael S. Tsirkin .probe = virtio_pci_probe, 6239a4253dbSMichael S. Tsirkin .remove = virtio_pci_remove, 6249a4253dbSMichael S. Tsirkin #ifdef CONFIG_PM_SLEEP 6259a4253dbSMichael S. Tsirkin .driver.pm = &virtio_pci_pm_ops, 6269a4253dbSMichael S. Tsirkin #endif 627cfecc291STiwei Bie .sriov_configure = virtio_pci_sriov_configure, 6289a4253dbSMichael S. Tsirkin }; 6299a4253dbSMichael S. Tsirkin 6309a4253dbSMichael S. Tsirkin module_pci_driver(virtio_pci_driver); 6315ff16110SHerbert Xu 6325ff16110SHerbert Xu MODULE_AUTHOR("Anthony Liguori <aliguori@us.ibm.com>"); 6335ff16110SHerbert Xu MODULE_DESCRIPTION("virtio-pci"); 6345ff16110SHerbert Xu MODULE_LICENSE("GPL"); 6355ff16110SHerbert Xu MODULE_VERSION("1"); 636