10a8a69ddSRusty Russell /* Virtio ring implementation. 20a8a69ddSRusty Russell * 30a8a69ddSRusty Russell * Copyright 2007 Rusty Russell IBM Corporation 40a8a69ddSRusty Russell * 50a8a69ddSRusty Russell * This program is free software; you can redistribute it and/or modify 60a8a69ddSRusty Russell * it under the terms of the GNU General Public License as published by 70a8a69ddSRusty Russell * the Free Software Foundation; either version 2 of the License, or 80a8a69ddSRusty Russell * (at your option) any later version. 90a8a69ddSRusty Russell * 100a8a69ddSRusty Russell * This program is distributed in the hope that it will be useful, 110a8a69ddSRusty Russell * but WITHOUT ANY WARRANTY; without even the implied warranty of 120a8a69ddSRusty Russell * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 130a8a69ddSRusty Russell * GNU General Public License for more details. 140a8a69ddSRusty Russell * 150a8a69ddSRusty Russell * You should have received a copy of the GNU General Public License 160a8a69ddSRusty Russell * along with this program; if not, write to the Free Software 170a8a69ddSRusty Russell * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA 180a8a69ddSRusty Russell */ 190a8a69ddSRusty Russell #include <linux/virtio.h> 200a8a69ddSRusty Russell #include <linux/virtio_ring.h> 21e34f8725SRusty Russell #include <linux/virtio_config.h> 220a8a69ddSRusty Russell #include <linux/device.h> 235a0e3ad6STejun Heo #include <linux/slab.h> 240a8a69ddSRusty Russell 25d57ed95dSMichael S. Tsirkin /* virtio guest is communicating with a virtual "device" that actually runs on 26d57ed95dSMichael S. Tsirkin * a host processor. Memory barriers are used to control SMP effects. */ 27d57ed95dSMichael S. Tsirkin #ifdef CONFIG_SMP 28d57ed95dSMichael S. Tsirkin /* Where possible, use SMP barriers which are more lightweight than mandatory 29d57ed95dSMichael S. Tsirkin * barriers, because mandatory barriers control MMIO effects on accesses 30d57ed95dSMichael S. Tsirkin * through relaxed memory I/O windows (which virtio does not use). */ 31d57ed95dSMichael S. Tsirkin #define virtio_mb() smp_mb() 32d57ed95dSMichael S. Tsirkin #define virtio_rmb() smp_rmb() 33d57ed95dSMichael S. Tsirkin #define virtio_wmb() smp_wmb() 34d57ed95dSMichael S. Tsirkin #else 35d57ed95dSMichael S. Tsirkin /* We must force memory ordering even if guest is UP since host could be 36d57ed95dSMichael S. Tsirkin * running on another CPU, but SMP barriers are defined to barrier() in that 37d57ed95dSMichael S. Tsirkin * configuration. So fall back to mandatory barriers instead. */ 38d57ed95dSMichael S. Tsirkin #define virtio_mb() mb() 39d57ed95dSMichael S. Tsirkin #define virtio_rmb() rmb() 40d57ed95dSMichael S. Tsirkin #define virtio_wmb() wmb() 41d57ed95dSMichael S. Tsirkin #endif 42d57ed95dSMichael S. Tsirkin 430a8a69ddSRusty Russell #ifdef DEBUG 440a8a69ddSRusty Russell /* For development, we want to crash whenever the ring is screwed. */ 459499f5e7SRusty Russell #define BAD_RING(_vq, fmt, args...) \ 469499f5e7SRusty Russell do { \ 479499f5e7SRusty Russell dev_err(&(_vq)->vq.vdev->dev, \ 489499f5e7SRusty Russell "%s:"fmt, (_vq)->vq.name, ##args); \ 499499f5e7SRusty Russell BUG(); \ 509499f5e7SRusty Russell } while (0) 51c5f841f1SRusty Russell /* Caller is supposed to guarantee no reentry. */ 523a35ce7dSRoel Kluin #define START_USE(_vq) \ 53c5f841f1SRusty Russell do { \ 54c5f841f1SRusty Russell if ((_vq)->in_use) \ 559499f5e7SRusty Russell panic("%s:in_use = %i\n", \ 569499f5e7SRusty Russell (_vq)->vq.name, (_vq)->in_use); \ 57c5f841f1SRusty Russell (_vq)->in_use = __LINE__; \ 58c5f841f1SRusty Russell } while (0) 593a35ce7dSRoel Kluin #define END_USE(_vq) \ 6097a545abSRusty Russell do { BUG_ON(!(_vq)->in_use); (_vq)->in_use = 0; } while(0) 610a8a69ddSRusty Russell #else 629499f5e7SRusty Russell #define BAD_RING(_vq, fmt, args...) \ 639499f5e7SRusty Russell do { \ 649499f5e7SRusty Russell dev_err(&_vq->vq.vdev->dev, \ 659499f5e7SRusty Russell "%s:"fmt, (_vq)->vq.name, ##args); \ 669499f5e7SRusty Russell (_vq)->broken = true; \ 679499f5e7SRusty Russell } while (0) 680a8a69ddSRusty Russell #define START_USE(vq) 690a8a69ddSRusty Russell #define END_USE(vq) 700a8a69ddSRusty Russell #endif 710a8a69ddSRusty Russell 720a8a69ddSRusty Russell struct vring_virtqueue 730a8a69ddSRusty Russell { 740a8a69ddSRusty Russell struct virtqueue vq; 750a8a69ddSRusty Russell 760a8a69ddSRusty Russell /* Actual memory layout for this queue */ 770a8a69ddSRusty Russell struct vring vring; 780a8a69ddSRusty Russell 790a8a69ddSRusty Russell /* Other side has made a mess, don't try any more. */ 800a8a69ddSRusty Russell bool broken; 810a8a69ddSRusty Russell 829fa29b9dSMark McLoughlin /* Host supports indirect buffers */ 839fa29b9dSMark McLoughlin bool indirect; 849fa29b9dSMark McLoughlin 850a8a69ddSRusty Russell /* Number of free buffers */ 860a8a69ddSRusty Russell unsigned int num_free; 870a8a69ddSRusty Russell /* Head of free buffer list. */ 880a8a69ddSRusty Russell unsigned int free_head; 890a8a69ddSRusty Russell /* Number we've added since last sync. */ 900a8a69ddSRusty Russell unsigned int num_added; 910a8a69ddSRusty Russell 920a8a69ddSRusty Russell /* Last used index we've seen. */ 931bc4953eSAnthony Liguori u16 last_used_idx; 940a8a69ddSRusty Russell 950a8a69ddSRusty Russell /* How to notify other side. FIXME: commonalize hcalls! */ 960a8a69ddSRusty Russell void (*notify)(struct virtqueue *vq); 970a8a69ddSRusty Russell 980a8a69ddSRusty Russell #ifdef DEBUG 990a8a69ddSRusty Russell /* They're supposed to lock for us. */ 1000a8a69ddSRusty Russell unsigned int in_use; 1010a8a69ddSRusty Russell #endif 1020a8a69ddSRusty Russell 1030a8a69ddSRusty Russell /* Tokens for callbacks. */ 1040a8a69ddSRusty Russell void *data[]; 1050a8a69ddSRusty Russell }; 1060a8a69ddSRusty Russell 1070a8a69ddSRusty Russell #define to_vvq(_vq) container_of(_vq, struct vring_virtqueue, vq) 1080a8a69ddSRusty Russell 1099fa29b9dSMark McLoughlin /* Set up an indirect table of descriptors and add it to the queue. */ 1109fa29b9dSMark McLoughlin static int vring_add_indirect(struct vring_virtqueue *vq, 1119fa29b9dSMark McLoughlin struct scatterlist sg[], 1129fa29b9dSMark McLoughlin unsigned int out, 113bbd603efSMichael S. Tsirkin unsigned int in, 114bbd603efSMichael S. Tsirkin gfp_t gfp) 1159fa29b9dSMark McLoughlin { 1169fa29b9dSMark McLoughlin struct vring_desc *desc; 1179fa29b9dSMark McLoughlin unsigned head; 1189fa29b9dSMark McLoughlin int i; 1199fa29b9dSMark McLoughlin 120bbd603efSMichael S. Tsirkin desc = kmalloc((out + in) * sizeof(struct vring_desc), gfp); 1219fa29b9dSMark McLoughlin if (!desc) 122*686d3637SMichael S. Tsirkin return -ENOMEM; 1239fa29b9dSMark McLoughlin 1249fa29b9dSMark McLoughlin /* Transfer entries from the sg list into the indirect page */ 1259fa29b9dSMark McLoughlin for (i = 0; i < out; i++) { 1269fa29b9dSMark McLoughlin desc[i].flags = VRING_DESC_F_NEXT; 1279fa29b9dSMark McLoughlin desc[i].addr = sg_phys(sg); 1289fa29b9dSMark McLoughlin desc[i].len = sg->length; 1299fa29b9dSMark McLoughlin desc[i].next = i+1; 1309fa29b9dSMark McLoughlin sg++; 1319fa29b9dSMark McLoughlin } 1329fa29b9dSMark McLoughlin for (; i < (out + in); i++) { 1339fa29b9dSMark McLoughlin desc[i].flags = VRING_DESC_F_NEXT|VRING_DESC_F_WRITE; 1349fa29b9dSMark McLoughlin desc[i].addr = sg_phys(sg); 1359fa29b9dSMark McLoughlin desc[i].len = sg->length; 1369fa29b9dSMark McLoughlin desc[i].next = i+1; 1379fa29b9dSMark McLoughlin sg++; 1389fa29b9dSMark McLoughlin } 1399fa29b9dSMark McLoughlin 1409fa29b9dSMark McLoughlin /* Last one doesn't continue. */ 1419fa29b9dSMark McLoughlin desc[i-1].flags &= ~VRING_DESC_F_NEXT; 1429fa29b9dSMark McLoughlin desc[i-1].next = 0; 1439fa29b9dSMark McLoughlin 1449fa29b9dSMark McLoughlin /* We're about to use a buffer */ 1459fa29b9dSMark McLoughlin vq->num_free--; 1469fa29b9dSMark McLoughlin 1479fa29b9dSMark McLoughlin /* Use a single buffer which doesn't continue */ 1489fa29b9dSMark McLoughlin head = vq->free_head; 1499fa29b9dSMark McLoughlin vq->vring.desc[head].flags = VRING_DESC_F_INDIRECT; 1509fa29b9dSMark McLoughlin vq->vring.desc[head].addr = virt_to_phys(desc); 1519fa29b9dSMark McLoughlin vq->vring.desc[head].len = i * sizeof(struct vring_desc); 1529fa29b9dSMark McLoughlin 1539fa29b9dSMark McLoughlin /* Update free pointer */ 1549fa29b9dSMark McLoughlin vq->free_head = vq->vring.desc[head].next; 1559fa29b9dSMark McLoughlin 1569fa29b9dSMark McLoughlin return head; 1579fa29b9dSMark McLoughlin } 1589fa29b9dSMark McLoughlin 159bbd603efSMichael S. Tsirkin int virtqueue_add_buf_gfp(struct virtqueue *_vq, 1600a8a69ddSRusty Russell struct scatterlist sg[], 1610a8a69ddSRusty Russell unsigned int out, 1620a8a69ddSRusty Russell unsigned int in, 163bbd603efSMichael S. Tsirkin void *data, 164bbd603efSMichael S. Tsirkin gfp_t gfp) 1650a8a69ddSRusty Russell { 1660a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 1670a8a69ddSRusty Russell unsigned int i, avail, head, uninitialized_var(prev); 1680a8a69ddSRusty Russell 1699fa29b9dSMark McLoughlin START_USE(vq); 1709fa29b9dSMark McLoughlin 1710a8a69ddSRusty Russell BUG_ON(data == NULL); 1729fa29b9dSMark McLoughlin 1739fa29b9dSMark McLoughlin /* If the host supports indirect descriptor tables, and we have multiple 1749fa29b9dSMark McLoughlin * buffers, then go indirect. FIXME: tune this threshold */ 1759fa29b9dSMark McLoughlin if (vq->indirect && (out + in) > 1 && vq->num_free) { 176bbd603efSMichael S. Tsirkin head = vring_add_indirect(vq, sg, out, in, gfp); 1779fa29b9dSMark McLoughlin if (head != vq->vring.num) 1789fa29b9dSMark McLoughlin goto add_head; 1799fa29b9dSMark McLoughlin } 1809fa29b9dSMark McLoughlin 1810a8a69ddSRusty Russell BUG_ON(out + in > vq->vring.num); 1820a8a69ddSRusty Russell BUG_ON(out + in == 0); 1830a8a69ddSRusty Russell 1840a8a69ddSRusty Russell if (vq->num_free < out + in) { 1850a8a69ddSRusty Russell pr_debug("Can't add buf len %i - avail = %i\n", 1860a8a69ddSRusty Russell out + in, vq->num_free); 18744653eaeSRusty Russell /* FIXME: for historical reasons, we force a notify here if 18844653eaeSRusty Russell * there are outgoing parts to the buffer. Presumably the 18944653eaeSRusty Russell * host should service the ring ASAP. */ 19044653eaeSRusty Russell if (out) 191426e3e0aSRusty Russell vq->notify(&vq->vq); 1920a8a69ddSRusty Russell END_USE(vq); 1930a8a69ddSRusty Russell return -ENOSPC; 1940a8a69ddSRusty Russell } 1950a8a69ddSRusty Russell 1960a8a69ddSRusty Russell /* We're about to use some buffers from the free list. */ 1970a8a69ddSRusty Russell vq->num_free -= out + in; 1980a8a69ddSRusty Russell 1990a8a69ddSRusty Russell head = vq->free_head; 2000a8a69ddSRusty Russell for (i = vq->free_head; out; i = vq->vring.desc[i].next, out--) { 2010a8a69ddSRusty Russell vq->vring.desc[i].flags = VRING_DESC_F_NEXT; 20215f9c890SRusty Russell vq->vring.desc[i].addr = sg_phys(sg); 2030a8a69ddSRusty Russell vq->vring.desc[i].len = sg->length; 2040a8a69ddSRusty Russell prev = i; 2050a8a69ddSRusty Russell sg++; 2060a8a69ddSRusty Russell } 2070a8a69ddSRusty Russell for (; in; i = vq->vring.desc[i].next, in--) { 2080a8a69ddSRusty Russell vq->vring.desc[i].flags = VRING_DESC_F_NEXT|VRING_DESC_F_WRITE; 20915f9c890SRusty Russell vq->vring.desc[i].addr = sg_phys(sg); 2100a8a69ddSRusty Russell vq->vring.desc[i].len = sg->length; 2110a8a69ddSRusty Russell prev = i; 2120a8a69ddSRusty Russell sg++; 2130a8a69ddSRusty Russell } 2140a8a69ddSRusty Russell /* Last one doesn't continue. */ 2150a8a69ddSRusty Russell vq->vring.desc[prev].flags &= ~VRING_DESC_F_NEXT; 2160a8a69ddSRusty Russell 2170a8a69ddSRusty Russell /* Update free pointer */ 2180a8a69ddSRusty Russell vq->free_head = i; 2190a8a69ddSRusty Russell 2209fa29b9dSMark McLoughlin add_head: 2210a8a69ddSRusty Russell /* Set token. */ 2220a8a69ddSRusty Russell vq->data[head] = data; 2230a8a69ddSRusty Russell 2240a8a69ddSRusty Russell /* Put entry in available array (but don't update avail->idx until they 2250a8a69ddSRusty Russell * do sync). FIXME: avoid modulus here? */ 2260a8a69ddSRusty Russell avail = (vq->vring.avail->idx + vq->num_added++) % vq->vring.num; 2270a8a69ddSRusty Russell vq->vring.avail->ring[avail] = head; 2280a8a69ddSRusty Russell 2290a8a69ddSRusty Russell pr_debug("Added buffer head %i to %p\n", head, vq); 2300a8a69ddSRusty Russell END_USE(vq); 2313c1b27d5SRusty Russell 2323c1b27d5SRusty Russell /* If we're indirect, we can fit many (assuming not OOM). */ 2333c1b27d5SRusty Russell if (vq->indirect) 2343c1b27d5SRusty Russell return vq->num_free ? vq->vring.num : 0; 2353c1b27d5SRusty Russell return vq->num_free; 2360a8a69ddSRusty Russell } 237bbd603efSMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_add_buf_gfp); 2380a8a69ddSRusty Russell 2397c5e9ed0SMichael S. Tsirkin void virtqueue_kick(struct virtqueue *_vq) 2400a8a69ddSRusty Russell { 2410a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 2420a8a69ddSRusty Russell START_USE(vq); 2430a8a69ddSRusty Russell /* Descriptors and available array need to be set before we expose the 2440a8a69ddSRusty Russell * new available array entries. */ 245d57ed95dSMichael S. Tsirkin virtio_wmb(); 2460a8a69ddSRusty Russell 2470a8a69ddSRusty Russell vq->vring.avail->idx += vq->num_added; 2480a8a69ddSRusty Russell vq->num_added = 0; 2490a8a69ddSRusty Russell 2500a8a69ddSRusty Russell /* Need to update avail index before checking if we should notify */ 251d57ed95dSMichael S. Tsirkin virtio_mb(); 2520a8a69ddSRusty Russell 2530a8a69ddSRusty Russell if (!(vq->vring.used->flags & VRING_USED_F_NO_NOTIFY)) 2540a8a69ddSRusty Russell /* Prod other side to tell it about changes. */ 2550a8a69ddSRusty Russell vq->notify(&vq->vq); 2560a8a69ddSRusty Russell 2570a8a69ddSRusty Russell END_USE(vq); 2580a8a69ddSRusty Russell } 2597c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_kick); 2600a8a69ddSRusty Russell 2610a8a69ddSRusty Russell static void detach_buf(struct vring_virtqueue *vq, unsigned int head) 2620a8a69ddSRusty Russell { 2630a8a69ddSRusty Russell unsigned int i; 2640a8a69ddSRusty Russell 2650a8a69ddSRusty Russell /* Clear data ptr. */ 2660a8a69ddSRusty Russell vq->data[head] = NULL; 2670a8a69ddSRusty Russell 2680a8a69ddSRusty Russell /* Put back on free list: find end */ 2690a8a69ddSRusty Russell i = head; 2709fa29b9dSMark McLoughlin 2719fa29b9dSMark McLoughlin /* Free the indirect table */ 2729fa29b9dSMark McLoughlin if (vq->vring.desc[i].flags & VRING_DESC_F_INDIRECT) 2739fa29b9dSMark McLoughlin kfree(phys_to_virt(vq->vring.desc[i].addr)); 2749fa29b9dSMark McLoughlin 2750a8a69ddSRusty Russell while (vq->vring.desc[i].flags & VRING_DESC_F_NEXT) { 2760a8a69ddSRusty Russell i = vq->vring.desc[i].next; 2770a8a69ddSRusty Russell vq->num_free++; 2780a8a69ddSRusty Russell } 2790a8a69ddSRusty Russell 2800a8a69ddSRusty Russell vq->vring.desc[i].next = vq->free_head; 2810a8a69ddSRusty Russell vq->free_head = head; 2820a8a69ddSRusty Russell /* Plus final descriptor */ 2830a8a69ddSRusty Russell vq->num_free++; 2840a8a69ddSRusty Russell } 2850a8a69ddSRusty Russell 2860a8a69ddSRusty Russell static inline bool more_used(const struct vring_virtqueue *vq) 2870a8a69ddSRusty Russell { 2880a8a69ddSRusty Russell return vq->last_used_idx != vq->vring.used->idx; 2890a8a69ddSRusty Russell } 2900a8a69ddSRusty Russell 2917c5e9ed0SMichael S. Tsirkin void *virtqueue_get_buf(struct virtqueue *_vq, unsigned int *len) 2920a8a69ddSRusty Russell { 2930a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 2940a8a69ddSRusty Russell void *ret; 2950a8a69ddSRusty Russell unsigned int i; 2960a8a69ddSRusty Russell 2970a8a69ddSRusty Russell START_USE(vq); 2980a8a69ddSRusty Russell 2995ef82752SRusty Russell if (unlikely(vq->broken)) { 3005ef82752SRusty Russell END_USE(vq); 3015ef82752SRusty Russell return NULL; 3025ef82752SRusty Russell } 3035ef82752SRusty Russell 3040a8a69ddSRusty Russell if (!more_used(vq)) { 3050a8a69ddSRusty Russell pr_debug("No more buffers in queue\n"); 3060a8a69ddSRusty Russell END_USE(vq); 3070a8a69ddSRusty Russell return NULL; 3080a8a69ddSRusty Russell } 3090a8a69ddSRusty Russell 3102d61ba95SMichael S. Tsirkin /* Only get used array entries after they have been exposed by host. */ 311d57ed95dSMichael S. Tsirkin virtio_rmb(); 3122d61ba95SMichael S. Tsirkin 3130a8a69ddSRusty Russell i = vq->vring.used->ring[vq->last_used_idx%vq->vring.num].id; 3140a8a69ddSRusty Russell *len = vq->vring.used->ring[vq->last_used_idx%vq->vring.num].len; 3150a8a69ddSRusty Russell 3160a8a69ddSRusty Russell if (unlikely(i >= vq->vring.num)) { 3170a8a69ddSRusty Russell BAD_RING(vq, "id %u out of range\n", i); 3180a8a69ddSRusty Russell return NULL; 3190a8a69ddSRusty Russell } 3200a8a69ddSRusty Russell if (unlikely(!vq->data[i])) { 3210a8a69ddSRusty Russell BAD_RING(vq, "id %u is not a head!\n", i); 3220a8a69ddSRusty Russell return NULL; 3230a8a69ddSRusty Russell } 3240a8a69ddSRusty Russell 3250a8a69ddSRusty Russell /* detach_buf clears data, so grab it now. */ 3260a8a69ddSRusty Russell ret = vq->data[i]; 3270a8a69ddSRusty Russell detach_buf(vq, i); 3280a8a69ddSRusty Russell vq->last_used_idx++; 3290a8a69ddSRusty Russell END_USE(vq); 3300a8a69ddSRusty Russell return ret; 3310a8a69ddSRusty Russell } 3327c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_get_buf); 3330a8a69ddSRusty Russell 3347c5e9ed0SMichael S. Tsirkin void virtqueue_disable_cb(struct virtqueue *_vq) 33518445c4dSRusty Russell { 33618445c4dSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 33718445c4dSRusty Russell 33818445c4dSRusty Russell vq->vring.avail->flags |= VRING_AVAIL_F_NO_INTERRUPT; 33918445c4dSRusty Russell } 3407c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_disable_cb); 34118445c4dSRusty Russell 3427c5e9ed0SMichael S. Tsirkin bool virtqueue_enable_cb(struct virtqueue *_vq) 3430a8a69ddSRusty Russell { 3440a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 3450a8a69ddSRusty Russell 3460a8a69ddSRusty Russell START_USE(vq); 3470a8a69ddSRusty Russell 3480a8a69ddSRusty Russell /* We optimistically turn back on interrupts, then check if there was 3490a8a69ddSRusty Russell * more to do. */ 3500a8a69ddSRusty Russell vq->vring.avail->flags &= ~VRING_AVAIL_F_NO_INTERRUPT; 351d57ed95dSMichael S. Tsirkin virtio_mb(); 3520a8a69ddSRusty Russell if (unlikely(more_used(vq))) { 3530a8a69ddSRusty Russell END_USE(vq); 3540a8a69ddSRusty Russell return false; 3550a8a69ddSRusty Russell } 3560a8a69ddSRusty Russell 3570a8a69ddSRusty Russell END_USE(vq); 3580a8a69ddSRusty Russell return true; 3590a8a69ddSRusty Russell } 3607c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_enable_cb); 3610a8a69ddSRusty Russell 3627c5e9ed0SMichael S. Tsirkin void *virtqueue_detach_unused_buf(struct virtqueue *_vq) 363c021eac4SShirley Ma { 364c021eac4SShirley Ma struct vring_virtqueue *vq = to_vvq(_vq); 365c021eac4SShirley Ma unsigned int i; 366c021eac4SShirley Ma void *buf; 367c021eac4SShirley Ma 368c021eac4SShirley Ma START_USE(vq); 369c021eac4SShirley Ma 370c021eac4SShirley Ma for (i = 0; i < vq->vring.num; i++) { 371c021eac4SShirley Ma if (!vq->data[i]) 372c021eac4SShirley Ma continue; 373c021eac4SShirley Ma /* detach_buf clears data, so grab it now. */ 374c021eac4SShirley Ma buf = vq->data[i]; 375c021eac4SShirley Ma detach_buf(vq, i); 376c021eac4SShirley Ma END_USE(vq); 377c021eac4SShirley Ma return buf; 378c021eac4SShirley Ma } 379c021eac4SShirley Ma /* That should have freed everything. */ 380c021eac4SShirley Ma BUG_ON(vq->num_free != vq->vring.num); 381c021eac4SShirley Ma 382c021eac4SShirley Ma END_USE(vq); 383c021eac4SShirley Ma return NULL; 384c021eac4SShirley Ma } 3857c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_detach_unused_buf); 386c021eac4SShirley Ma 3870a8a69ddSRusty Russell irqreturn_t vring_interrupt(int irq, void *_vq) 3880a8a69ddSRusty Russell { 3890a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 3900a8a69ddSRusty Russell 3910a8a69ddSRusty Russell if (!more_used(vq)) { 3920a8a69ddSRusty Russell pr_debug("virtqueue interrupt with no work for %p\n", vq); 3930a8a69ddSRusty Russell return IRQ_NONE; 3940a8a69ddSRusty Russell } 3950a8a69ddSRusty Russell 3960a8a69ddSRusty Russell if (unlikely(vq->broken)) 3970a8a69ddSRusty Russell return IRQ_HANDLED; 3980a8a69ddSRusty Russell 3990a8a69ddSRusty Russell pr_debug("virtqueue callback for %p (%p)\n", vq, vq->vq.callback); 40018445c4dSRusty Russell if (vq->vq.callback) 40118445c4dSRusty Russell vq->vq.callback(&vq->vq); 4020a8a69ddSRusty Russell 4030a8a69ddSRusty Russell return IRQ_HANDLED; 4040a8a69ddSRusty Russell } 405c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_interrupt); 4060a8a69ddSRusty Russell 4070a8a69ddSRusty Russell struct virtqueue *vring_new_virtqueue(unsigned int num, 40887c7d57cSRusty Russell unsigned int vring_align, 4090a8a69ddSRusty Russell struct virtio_device *vdev, 4100a8a69ddSRusty Russell void *pages, 4110a8a69ddSRusty Russell void (*notify)(struct virtqueue *), 4129499f5e7SRusty Russell void (*callback)(struct virtqueue *), 4139499f5e7SRusty Russell const char *name) 4140a8a69ddSRusty Russell { 4150a8a69ddSRusty Russell struct vring_virtqueue *vq; 4160a8a69ddSRusty Russell unsigned int i; 4170a8a69ddSRusty Russell 41842b36cc0SRusty Russell /* We assume num is a power of 2. */ 41942b36cc0SRusty Russell if (num & (num - 1)) { 42042b36cc0SRusty Russell dev_warn(&vdev->dev, "Bad virtqueue length %u\n", num); 42142b36cc0SRusty Russell return NULL; 42242b36cc0SRusty Russell } 42342b36cc0SRusty Russell 4240a8a69ddSRusty Russell vq = kmalloc(sizeof(*vq) + sizeof(void *)*num, GFP_KERNEL); 4250a8a69ddSRusty Russell if (!vq) 4260a8a69ddSRusty Russell return NULL; 4270a8a69ddSRusty Russell 42887c7d57cSRusty Russell vring_init(&vq->vring, num, pages, vring_align); 4290a8a69ddSRusty Russell vq->vq.callback = callback; 4300a8a69ddSRusty Russell vq->vq.vdev = vdev; 4319499f5e7SRusty Russell vq->vq.name = name; 4320a8a69ddSRusty Russell vq->notify = notify; 4330a8a69ddSRusty Russell vq->broken = false; 4340a8a69ddSRusty Russell vq->last_used_idx = 0; 4350a8a69ddSRusty Russell vq->num_added = 0; 4369499f5e7SRusty Russell list_add_tail(&vq->vq.list, &vdev->vqs); 4370a8a69ddSRusty Russell #ifdef DEBUG 4380a8a69ddSRusty Russell vq->in_use = false; 4390a8a69ddSRusty Russell #endif 4400a8a69ddSRusty Russell 4419fa29b9dSMark McLoughlin vq->indirect = virtio_has_feature(vdev, VIRTIO_RING_F_INDIRECT_DESC); 4429fa29b9dSMark McLoughlin 4430a8a69ddSRusty Russell /* No callback? Tell other side not to bother us. */ 4440a8a69ddSRusty Russell if (!callback) 4450a8a69ddSRusty Russell vq->vring.avail->flags |= VRING_AVAIL_F_NO_INTERRUPT; 4460a8a69ddSRusty Russell 4470a8a69ddSRusty Russell /* Put everything in free lists. */ 4480a8a69ddSRusty Russell vq->num_free = num; 4490a8a69ddSRusty Russell vq->free_head = 0; 4503b870624SAmit Shah for (i = 0; i < num-1; i++) { 4510a8a69ddSRusty Russell vq->vring.desc[i].next = i+1; 4523b870624SAmit Shah vq->data[i] = NULL; 4533b870624SAmit Shah } 4543b870624SAmit Shah vq->data[i] = NULL; 4550a8a69ddSRusty Russell 4560a8a69ddSRusty Russell return &vq->vq; 4570a8a69ddSRusty Russell } 458c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_new_virtqueue); 4590a8a69ddSRusty Russell 4600a8a69ddSRusty Russell void vring_del_virtqueue(struct virtqueue *vq) 4610a8a69ddSRusty Russell { 4629499f5e7SRusty Russell list_del(&vq->list); 4630a8a69ddSRusty Russell kfree(to_vvq(vq)); 4640a8a69ddSRusty Russell } 465c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_del_virtqueue); 4660a8a69ddSRusty Russell 467e34f8725SRusty Russell /* Manipulates transport-specific feature bits. */ 468e34f8725SRusty Russell void vring_transport_features(struct virtio_device *vdev) 469e34f8725SRusty Russell { 470e34f8725SRusty Russell unsigned int i; 471e34f8725SRusty Russell 472e34f8725SRusty Russell for (i = VIRTIO_TRANSPORT_F_START; i < VIRTIO_TRANSPORT_F_END; i++) { 473e34f8725SRusty Russell switch (i) { 4749fa29b9dSMark McLoughlin case VIRTIO_RING_F_INDIRECT_DESC: 4759fa29b9dSMark McLoughlin break; 476e34f8725SRusty Russell default: 477e34f8725SRusty Russell /* We don't understand this bit. */ 478e34f8725SRusty Russell clear_bit(i, vdev->features); 479e34f8725SRusty Russell } 480e34f8725SRusty Russell } 481e34f8725SRusty Russell } 482e34f8725SRusty Russell EXPORT_SYMBOL_GPL(vring_transport_features); 483e34f8725SRusty Russell 484c6fd4701SRusty Russell MODULE_LICENSE("GPL"); 485