10a8a69ddSRusty Russell /* Virtio ring implementation. 20a8a69ddSRusty Russell * 30a8a69ddSRusty Russell * Copyright 2007 Rusty Russell IBM Corporation 40a8a69ddSRusty Russell * 50a8a69ddSRusty Russell * This program is free software; you can redistribute it and/or modify 60a8a69ddSRusty Russell * it under the terms of the GNU General Public License as published by 70a8a69ddSRusty Russell * the Free Software Foundation; either version 2 of the License, or 80a8a69ddSRusty Russell * (at your option) any later version. 90a8a69ddSRusty Russell * 100a8a69ddSRusty Russell * This program is distributed in the hope that it will be useful, 110a8a69ddSRusty Russell * but WITHOUT ANY WARRANTY; without even the implied warranty of 120a8a69ddSRusty Russell * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 130a8a69ddSRusty Russell * GNU General Public License for more details. 140a8a69ddSRusty Russell * 150a8a69ddSRusty Russell * You should have received a copy of the GNU General Public License 160a8a69ddSRusty Russell * along with this program; if not, write to the Free Software 170a8a69ddSRusty Russell * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA 180a8a69ddSRusty Russell */ 190a8a69ddSRusty Russell #include <linux/virtio.h> 200a8a69ddSRusty Russell #include <linux/virtio_ring.h> 21e34f8725SRusty Russell #include <linux/virtio_config.h> 220a8a69ddSRusty Russell #include <linux/device.h> 235a0e3ad6STejun Heo #include <linux/slab.h> 24b5a2c4f1SPaul Gortmaker #include <linux/module.h> 25e93300b1SRusty Russell #include <linux/hrtimer.h> 266abb2dd9SJoel Stanley #include <linux/kmemleak.h> 270a8a69ddSRusty Russell 280a8a69ddSRusty Russell #ifdef DEBUG 290a8a69ddSRusty Russell /* For development, we want to crash whenever the ring is screwed. */ 309499f5e7SRusty Russell #define BAD_RING(_vq, fmt, args...) \ 319499f5e7SRusty Russell do { \ 329499f5e7SRusty Russell dev_err(&(_vq)->vq.vdev->dev, \ 339499f5e7SRusty Russell "%s:"fmt, (_vq)->vq.name, ##args); \ 349499f5e7SRusty Russell BUG(); \ 359499f5e7SRusty Russell } while (0) 36c5f841f1SRusty Russell /* Caller is supposed to guarantee no reentry. */ 373a35ce7dSRoel Kluin #define START_USE(_vq) \ 38c5f841f1SRusty Russell do { \ 39c5f841f1SRusty Russell if ((_vq)->in_use) \ 409499f5e7SRusty Russell panic("%s:in_use = %i\n", \ 419499f5e7SRusty Russell (_vq)->vq.name, (_vq)->in_use); \ 42c5f841f1SRusty Russell (_vq)->in_use = __LINE__; \ 43c5f841f1SRusty Russell } while (0) 443a35ce7dSRoel Kluin #define END_USE(_vq) \ 4597a545abSRusty Russell do { BUG_ON(!(_vq)->in_use); (_vq)->in_use = 0; } while(0) 460a8a69ddSRusty Russell #else 479499f5e7SRusty Russell #define BAD_RING(_vq, fmt, args...) \ 489499f5e7SRusty Russell do { \ 499499f5e7SRusty Russell dev_err(&_vq->vq.vdev->dev, \ 509499f5e7SRusty Russell "%s:"fmt, (_vq)->vq.name, ##args); \ 519499f5e7SRusty Russell (_vq)->broken = true; \ 529499f5e7SRusty Russell } while (0) 530a8a69ddSRusty Russell #define START_USE(vq) 540a8a69ddSRusty Russell #define END_USE(vq) 550a8a69ddSRusty Russell #endif 560a8a69ddSRusty Russell 570a8a69ddSRusty Russell struct vring_virtqueue 580a8a69ddSRusty Russell { 590a8a69ddSRusty Russell struct virtqueue vq; 600a8a69ddSRusty Russell 610a8a69ddSRusty Russell /* Actual memory layout for this queue */ 620a8a69ddSRusty Russell struct vring vring; 630a8a69ddSRusty Russell 647b21e34fSRusty Russell /* Can we use weak barriers? */ 657b21e34fSRusty Russell bool weak_barriers; 667b21e34fSRusty Russell 670a8a69ddSRusty Russell /* Other side has made a mess, don't try any more. */ 680a8a69ddSRusty Russell bool broken; 690a8a69ddSRusty Russell 709fa29b9dSMark McLoughlin /* Host supports indirect buffers */ 719fa29b9dSMark McLoughlin bool indirect; 729fa29b9dSMark McLoughlin 73a5c262c5SMichael S. Tsirkin /* Host publishes avail event idx */ 74a5c262c5SMichael S. Tsirkin bool event; 75a5c262c5SMichael S. Tsirkin 760a8a69ddSRusty Russell /* Head of free buffer list. */ 770a8a69ddSRusty Russell unsigned int free_head; 780a8a69ddSRusty Russell /* Number we've added since last sync. */ 790a8a69ddSRusty Russell unsigned int num_added; 800a8a69ddSRusty Russell 810a8a69ddSRusty Russell /* Last used index we've seen. */ 821bc4953eSAnthony Liguori u16 last_used_idx; 830a8a69ddSRusty Russell 840a8a69ddSRusty Russell /* How to notify other side. FIXME: commonalize hcalls! */ 8546f9c2b9SHeinz Graalfs bool (*notify)(struct virtqueue *vq); 860a8a69ddSRusty Russell 870a8a69ddSRusty Russell #ifdef DEBUG 880a8a69ddSRusty Russell /* They're supposed to lock for us. */ 890a8a69ddSRusty Russell unsigned int in_use; 90e93300b1SRusty Russell 91e93300b1SRusty Russell /* Figure out if their kicks are too delayed. */ 92e93300b1SRusty Russell bool last_add_time_valid; 93e93300b1SRusty Russell ktime_t last_add_time; 940a8a69ddSRusty Russell #endif 950a8a69ddSRusty Russell 960a8a69ddSRusty Russell /* Tokens for callbacks. */ 970a8a69ddSRusty Russell void *data[]; 980a8a69ddSRusty Russell }; 990a8a69ddSRusty Russell 1000a8a69ddSRusty Russell #define to_vvq(_vq) container_of(_vq, struct vring_virtqueue, vq) 1010a8a69ddSRusty Russell 1029fa29b9dSMark McLoughlin /* Set up an indirect table of descriptors and add it to the queue. */ 10313816c76SRusty Russell static inline int vring_add_indirect(struct vring_virtqueue *vq, 10413816c76SRusty Russell struct scatterlist *sgs[], 10513816c76SRusty Russell unsigned int total_sg, 10613816c76SRusty Russell unsigned int out_sgs, 10713816c76SRusty Russell unsigned int in_sgs, 108bbd603efSMichael S. Tsirkin gfp_t gfp) 1099fa29b9dSMark McLoughlin { 1109fa29b9dSMark McLoughlin struct vring_desc *desc; 1119fa29b9dSMark McLoughlin unsigned head; 11213816c76SRusty Russell struct scatterlist *sg; 11313816c76SRusty Russell int i, n; 1149fa29b9dSMark McLoughlin 115b92b1b89SWill Deacon /* 116b92b1b89SWill Deacon * We require lowmem mappings for the descriptors because 117b92b1b89SWill Deacon * otherwise virt_to_phys will give us bogus addresses in the 118b92b1b89SWill Deacon * virtqueue. 119b92b1b89SWill Deacon */ 120b92b1b89SWill Deacon gfp &= ~(__GFP_HIGHMEM | __GFP_HIGH); 121b92b1b89SWill Deacon 12213816c76SRusty Russell desc = kmalloc(total_sg * sizeof(struct vring_desc), gfp); 1239fa29b9dSMark McLoughlin if (!desc) 124686d3637SMichael S. Tsirkin return -ENOMEM; 1259fa29b9dSMark McLoughlin 12613816c76SRusty Russell /* Transfer entries from the sg lists into the indirect page */ 12713816c76SRusty Russell i = 0; 12813816c76SRusty Russell for (n = 0; n < out_sgs; n++) { 129*eeebf9b1SRusty Russell for (sg = sgs[n]; sg; sg = sg_next(sg)) { 1309fa29b9dSMark McLoughlin desc[i].flags = VRING_DESC_F_NEXT; 1319fa29b9dSMark McLoughlin desc[i].addr = sg_phys(sg); 1329fa29b9dSMark McLoughlin desc[i].len = sg->length; 1339fa29b9dSMark McLoughlin desc[i].next = i+1; 13413816c76SRusty Russell i++; 1359fa29b9dSMark McLoughlin } 13613816c76SRusty Russell } 13713816c76SRusty Russell for (; n < (out_sgs + in_sgs); n++) { 138*eeebf9b1SRusty Russell for (sg = sgs[n]; sg; sg = sg_next(sg)) { 1399fa29b9dSMark McLoughlin desc[i].flags = VRING_DESC_F_NEXT|VRING_DESC_F_WRITE; 1409fa29b9dSMark McLoughlin desc[i].addr = sg_phys(sg); 1419fa29b9dSMark McLoughlin desc[i].len = sg->length; 1429fa29b9dSMark McLoughlin desc[i].next = i+1; 14313816c76SRusty Russell i++; 1449fa29b9dSMark McLoughlin } 14513816c76SRusty Russell } 14613816c76SRusty Russell BUG_ON(i != total_sg); 1479fa29b9dSMark McLoughlin 1489fa29b9dSMark McLoughlin /* Last one doesn't continue. */ 1499fa29b9dSMark McLoughlin desc[i-1].flags &= ~VRING_DESC_F_NEXT; 1509fa29b9dSMark McLoughlin desc[i-1].next = 0; 1519fa29b9dSMark McLoughlin 1529fa29b9dSMark McLoughlin /* We're about to use a buffer */ 15306ca287dSRusty Russell vq->vq.num_free--; 1549fa29b9dSMark McLoughlin 1559fa29b9dSMark McLoughlin /* Use a single buffer which doesn't continue */ 1569fa29b9dSMark McLoughlin head = vq->free_head; 1579fa29b9dSMark McLoughlin vq->vring.desc[head].flags = VRING_DESC_F_INDIRECT; 1589fa29b9dSMark McLoughlin vq->vring.desc[head].addr = virt_to_phys(desc); 159bb478d8bSRusty Russell /* kmemleak gives a false positive, as it's hidden by virt_to_phys */ 160bb478d8bSRusty Russell kmemleak_ignore(desc); 1619fa29b9dSMark McLoughlin vq->vring.desc[head].len = i * sizeof(struct vring_desc); 1629fa29b9dSMark McLoughlin 1639fa29b9dSMark McLoughlin /* Update free pointer */ 1649fa29b9dSMark McLoughlin vq->free_head = vq->vring.desc[head].next; 1659fa29b9dSMark McLoughlin 1669fa29b9dSMark McLoughlin return head; 1679fa29b9dSMark McLoughlin } 1689fa29b9dSMark McLoughlin 16913816c76SRusty Russell static inline int virtqueue_add(struct virtqueue *_vq, 17013816c76SRusty Russell struct scatterlist *sgs[], 171*eeebf9b1SRusty Russell unsigned int total_sg, 17213816c76SRusty Russell unsigned int out_sgs, 17313816c76SRusty Russell unsigned int in_sgs, 174bbd603efSMichael S. Tsirkin void *data, 175bbd603efSMichael S. Tsirkin gfp_t gfp) 1760a8a69ddSRusty Russell { 1770a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 17813816c76SRusty Russell struct scatterlist *sg; 179*eeebf9b1SRusty Russell unsigned int i, n, avail, uninitialized_var(prev); 1801fe9b6feSMichael S. Tsirkin int head; 1810a8a69ddSRusty Russell 1829fa29b9dSMark McLoughlin START_USE(vq); 1839fa29b9dSMark McLoughlin 1840a8a69ddSRusty Russell BUG_ON(data == NULL); 1859fa29b9dSMark McLoughlin 18670670444SRusty Russell if (unlikely(vq->broken)) { 18770670444SRusty Russell END_USE(vq); 18870670444SRusty Russell return -EIO; 18970670444SRusty Russell } 19070670444SRusty Russell 191e93300b1SRusty Russell #ifdef DEBUG 192e93300b1SRusty Russell { 193e93300b1SRusty Russell ktime_t now = ktime_get(); 194e93300b1SRusty Russell 195e93300b1SRusty Russell /* No kick or get, with .1 second between? Warn. */ 196e93300b1SRusty Russell if (vq->last_add_time_valid) 197e93300b1SRusty Russell WARN_ON(ktime_to_ms(ktime_sub(now, vq->last_add_time)) 198e93300b1SRusty Russell > 100); 199e93300b1SRusty Russell vq->last_add_time = now; 200e93300b1SRusty Russell vq->last_add_time_valid = true; 201e93300b1SRusty Russell } 202e93300b1SRusty Russell #endif 203e93300b1SRusty Russell 2049fa29b9dSMark McLoughlin /* If the host supports indirect descriptor tables, and we have multiple 2059fa29b9dSMark McLoughlin * buffers, then go indirect. FIXME: tune this threshold */ 20613816c76SRusty Russell if (vq->indirect && total_sg > 1 && vq->vq.num_free) { 207*eeebf9b1SRusty Russell head = vring_add_indirect(vq, sgs, total_sg, 20813816c76SRusty Russell out_sgs, in_sgs, gfp); 2091fe9b6feSMichael S. Tsirkin if (likely(head >= 0)) 2109fa29b9dSMark McLoughlin goto add_head; 2119fa29b9dSMark McLoughlin } 2129fa29b9dSMark McLoughlin 21313816c76SRusty Russell BUG_ON(total_sg > vq->vring.num); 21413816c76SRusty Russell BUG_ON(total_sg == 0); 2150a8a69ddSRusty Russell 21613816c76SRusty Russell if (vq->vq.num_free < total_sg) { 2170a8a69ddSRusty Russell pr_debug("Can't add buf len %i - avail = %i\n", 21813816c76SRusty Russell total_sg, vq->vq.num_free); 21944653eaeSRusty Russell /* FIXME: for historical reasons, we force a notify here if 22044653eaeSRusty Russell * there are outgoing parts to the buffer. Presumably the 22144653eaeSRusty Russell * host should service the ring ASAP. */ 22213816c76SRusty Russell if (out_sgs) 223426e3e0aSRusty Russell vq->notify(&vq->vq); 2240a8a69ddSRusty Russell END_USE(vq); 2250a8a69ddSRusty Russell return -ENOSPC; 2260a8a69ddSRusty Russell } 2270a8a69ddSRusty Russell 2280a8a69ddSRusty Russell /* We're about to use some buffers from the free list. */ 22913816c76SRusty Russell vq->vq.num_free -= total_sg; 2300a8a69ddSRusty Russell 23113816c76SRusty Russell head = i = vq->free_head; 23213816c76SRusty Russell for (n = 0; n < out_sgs; n++) { 233*eeebf9b1SRusty Russell for (sg = sgs[n]; sg; sg = sg_next(sg)) { 2340a8a69ddSRusty Russell vq->vring.desc[i].flags = VRING_DESC_F_NEXT; 23515f9c890SRusty Russell vq->vring.desc[i].addr = sg_phys(sg); 2360a8a69ddSRusty Russell vq->vring.desc[i].len = sg->length; 2370a8a69ddSRusty Russell prev = i; 23813816c76SRusty Russell i = vq->vring.desc[i].next; 2390a8a69ddSRusty Russell } 24013816c76SRusty Russell } 24113816c76SRusty Russell for (; n < (out_sgs + in_sgs); n++) { 242*eeebf9b1SRusty Russell for (sg = sgs[n]; sg; sg = sg_next(sg)) { 2430a8a69ddSRusty Russell vq->vring.desc[i].flags = VRING_DESC_F_NEXT|VRING_DESC_F_WRITE; 24415f9c890SRusty Russell vq->vring.desc[i].addr = sg_phys(sg); 2450a8a69ddSRusty Russell vq->vring.desc[i].len = sg->length; 2460a8a69ddSRusty Russell prev = i; 24713816c76SRusty Russell i = vq->vring.desc[i].next; 24813816c76SRusty Russell } 2490a8a69ddSRusty Russell } 2500a8a69ddSRusty Russell /* Last one doesn't continue. */ 2510a8a69ddSRusty Russell vq->vring.desc[prev].flags &= ~VRING_DESC_F_NEXT; 2520a8a69ddSRusty Russell 2530a8a69ddSRusty Russell /* Update free pointer */ 2540a8a69ddSRusty Russell vq->free_head = i; 2550a8a69ddSRusty Russell 2569fa29b9dSMark McLoughlin add_head: 2570a8a69ddSRusty Russell /* Set token. */ 2580a8a69ddSRusty Russell vq->data[head] = data; 2590a8a69ddSRusty Russell 2600a8a69ddSRusty Russell /* Put entry in available array (but don't update avail->idx until they 2613b720b8cSRusty Russell * do sync). */ 262ee7cd898SRusty Russell avail = (vq->vring.avail->idx & (vq->vring.num-1)); 2630a8a69ddSRusty Russell vq->vring.avail->ring[avail] = head; 2640a8a69ddSRusty Russell 265ee7cd898SRusty Russell /* Descriptors and available array need to be set before we expose the 266ee7cd898SRusty Russell * new available array entries. */ 267a9a0fef7SRusty Russell virtio_wmb(vq->weak_barriers); 268ee7cd898SRusty Russell vq->vring.avail->idx++; 269ee7cd898SRusty Russell vq->num_added++; 270ee7cd898SRusty Russell 271ee7cd898SRusty Russell /* This is very unlikely, but theoretically possible. Kick 272ee7cd898SRusty Russell * just in case. */ 273ee7cd898SRusty Russell if (unlikely(vq->num_added == (1 << 16) - 1)) 274ee7cd898SRusty Russell virtqueue_kick(_vq); 275ee7cd898SRusty Russell 2760a8a69ddSRusty Russell pr_debug("Added buffer head %i to %p\n", head, vq); 2770a8a69ddSRusty Russell END_USE(vq); 2783c1b27d5SRusty Russell 27998e8c6bcSRusty Russell return 0; 2800a8a69ddSRusty Russell } 28113816c76SRusty Russell 28213816c76SRusty Russell /** 28313816c76SRusty Russell * virtqueue_add_sgs - expose buffers to other end 28413816c76SRusty Russell * @vq: the struct virtqueue we're talking about. 28513816c76SRusty Russell * @sgs: array of terminated scatterlists. 28613816c76SRusty Russell * @out_num: the number of scatterlists readable by other side 28713816c76SRusty Russell * @in_num: the number of scatterlists which are writable (after readable ones) 28813816c76SRusty Russell * @data: the token identifying the buffer. 28913816c76SRusty Russell * @gfp: how to do memory allocations (if necessary). 29013816c76SRusty Russell * 29113816c76SRusty Russell * Caller must ensure we don't call this with other virtqueue operations 29213816c76SRusty Russell * at the same time (except where noted). 29313816c76SRusty Russell * 29470670444SRusty Russell * Returns zero or a negative error (ie. ENOSPC, ENOMEM, EIO). 29513816c76SRusty Russell */ 29613816c76SRusty Russell int virtqueue_add_sgs(struct virtqueue *_vq, 29713816c76SRusty Russell struct scatterlist *sgs[], 29813816c76SRusty Russell unsigned int out_sgs, 29913816c76SRusty Russell unsigned int in_sgs, 30013816c76SRusty Russell void *data, 30113816c76SRusty Russell gfp_t gfp) 30213816c76SRusty Russell { 303*eeebf9b1SRusty Russell unsigned int i, total_sg = 0; 30413816c76SRusty Russell 30513816c76SRusty Russell /* Count them first. */ 306*eeebf9b1SRusty Russell for (i = 0; i < out_sgs + in_sgs; i++) { 30713816c76SRusty Russell struct scatterlist *sg; 30813816c76SRusty Russell for (sg = sgs[i]; sg; sg = sg_next(sg)) 309*eeebf9b1SRusty Russell total_sg++; 31013816c76SRusty Russell } 311*eeebf9b1SRusty Russell return virtqueue_add(_vq, sgs, total_sg, out_sgs, in_sgs, data, gfp); 31213816c76SRusty Russell } 31313816c76SRusty Russell EXPORT_SYMBOL_GPL(virtqueue_add_sgs); 31413816c76SRusty Russell 31513816c76SRusty Russell /** 316282edb36SRusty Russell * virtqueue_add_outbuf - expose output buffers to other end 317282edb36SRusty Russell * @vq: the struct virtqueue we're talking about. 318*eeebf9b1SRusty Russell * @sg: scatterlist (must be well-formed and terminated!) 319*eeebf9b1SRusty Russell * @num: the number of entries in @sg readable by other side 320282edb36SRusty Russell * @data: the token identifying the buffer. 321282edb36SRusty Russell * @gfp: how to do memory allocations (if necessary). 322282edb36SRusty Russell * 323282edb36SRusty Russell * Caller must ensure we don't call this with other virtqueue operations 324282edb36SRusty Russell * at the same time (except where noted). 325282edb36SRusty Russell * 32670670444SRusty Russell * Returns zero or a negative error (ie. ENOSPC, ENOMEM, EIO). 327282edb36SRusty Russell */ 328282edb36SRusty Russell int virtqueue_add_outbuf(struct virtqueue *vq, 329*eeebf9b1SRusty Russell struct scatterlist *sg, unsigned int num, 330282edb36SRusty Russell void *data, 331282edb36SRusty Russell gfp_t gfp) 332282edb36SRusty Russell { 333*eeebf9b1SRusty Russell return virtqueue_add(vq, &sg, num, 1, 0, data, gfp); 334282edb36SRusty Russell } 335282edb36SRusty Russell EXPORT_SYMBOL_GPL(virtqueue_add_outbuf); 336282edb36SRusty Russell 337282edb36SRusty Russell /** 338282edb36SRusty Russell * virtqueue_add_inbuf - expose input buffers to other end 339282edb36SRusty Russell * @vq: the struct virtqueue we're talking about. 340*eeebf9b1SRusty Russell * @sg: scatterlist (must be well-formed and terminated!) 341*eeebf9b1SRusty Russell * @num: the number of entries in @sg writable by other side 342282edb36SRusty Russell * @data: the token identifying the buffer. 343282edb36SRusty Russell * @gfp: how to do memory allocations (if necessary). 344282edb36SRusty Russell * 345282edb36SRusty Russell * Caller must ensure we don't call this with other virtqueue operations 346282edb36SRusty Russell * at the same time (except where noted). 347282edb36SRusty Russell * 34870670444SRusty Russell * Returns zero or a negative error (ie. ENOSPC, ENOMEM, EIO). 349282edb36SRusty Russell */ 350282edb36SRusty Russell int virtqueue_add_inbuf(struct virtqueue *vq, 351*eeebf9b1SRusty Russell struct scatterlist *sg, unsigned int num, 352282edb36SRusty Russell void *data, 353282edb36SRusty Russell gfp_t gfp) 354282edb36SRusty Russell { 355*eeebf9b1SRusty Russell return virtqueue_add(vq, &sg, num, 0, 1, data, gfp); 356282edb36SRusty Russell } 357282edb36SRusty Russell EXPORT_SYMBOL_GPL(virtqueue_add_inbuf); 358282edb36SRusty Russell 359282edb36SRusty Russell /** 36041f0377fSRusty Russell * virtqueue_kick_prepare - first half of split virtqueue_kick call. 3615dfc1762SRusty Russell * @vq: the struct virtqueue 3625dfc1762SRusty Russell * 36341f0377fSRusty Russell * Instead of virtqueue_kick(), you can do: 36441f0377fSRusty Russell * if (virtqueue_kick_prepare(vq)) 36541f0377fSRusty Russell * virtqueue_notify(vq); 3665dfc1762SRusty Russell * 36741f0377fSRusty Russell * This is sometimes useful because the virtqueue_kick_prepare() needs 36841f0377fSRusty Russell * to be serialized, but the actual virtqueue_notify() call does not. 3695dfc1762SRusty Russell */ 37041f0377fSRusty Russell bool virtqueue_kick_prepare(struct virtqueue *_vq) 3710a8a69ddSRusty Russell { 3720a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 373a5c262c5SMichael S. Tsirkin u16 new, old; 37441f0377fSRusty Russell bool needs_kick; 37541f0377fSRusty Russell 3760a8a69ddSRusty Russell START_USE(vq); 377a72caae2SJason Wang /* We need to expose available array entries before checking avail 378a72caae2SJason Wang * event. */ 379a9a0fef7SRusty Russell virtio_mb(vq->weak_barriers); 3800a8a69ddSRusty Russell 381ee7cd898SRusty Russell old = vq->vring.avail->idx - vq->num_added; 382ee7cd898SRusty Russell new = vq->vring.avail->idx; 3830a8a69ddSRusty Russell vq->num_added = 0; 3840a8a69ddSRusty Russell 385e93300b1SRusty Russell #ifdef DEBUG 386e93300b1SRusty Russell if (vq->last_add_time_valid) { 387e93300b1SRusty Russell WARN_ON(ktime_to_ms(ktime_sub(ktime_get(), 388e93300b1SRusty Russell vq->last_add_time)) > 100); 389e93300b1SRusty Russell } 390e93300b1SRusty Russell vq->last_add_time_valid = false; 391e93300b1SRusty Russell #endif 392e93300b1SRusty Russell 39341f0377fSRusty Russell if (vq->event) { 39441f0377fSRusty Russell needs_kick = vring_need_event(vring_avail_event(&vq->vring), 39541f0377fSRusty Russell new, old); 39641f0377fSRusty Russell } else { 39741f0377fSRusty Russell needs_kick = !(vq->vring.used->flags & VRING_USED_F_NO_NOTIFY); 39841f0377fSRusty Russell } 3990a8a69ddSRusty Russell END_USE(vq); 40041f0377fSRusty Russell return needs_kick; 40141f0377fSRusty Russell } 40241f0377fSRusty Russell EXPORT_SYMBOL_GPL(virtqueue_kick_prepare); 40341f0377fSRusty Russell 40441f0377fSRusty Russell /** 40541f0377fSRusty Russell * virtqueue_notify - second half of split virtqueue_kick call. 40641f0377fSRusty Russell * @vq: the struct virtqueue 40741f0377fSRusty Russell * 40841f0377fSRusty Russell * This does not need to be serialized. 4095b1bf7cbSHeinz Graalfs * 4105b1bf7cbSHeinz Graalfs * Returns false if host notify failed or queue is broken, otherwise true. 41141f0377fSRusty Russell */ 4125b1bf7cbSHeinz Graalfs bool virtqueue_notify(struct virtqueue *_vq) 41341f0377fSRusty Russell { 41441f0377fSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 41541f0377fSRusty Russell 4165b1bf7cbSHeinz Graalfs if (unlikely(vq->broken)) 4175b1bf7cbSHeinz Graalfs return false; 4185b1bf7cbSHeinz Graalfs 41941f0377fSRusty Russell /* Prod other side to tell it about changes. */ 4202342d6a6SHeinz Graalfs if (!vq->notify(_vq)) { 4215b1bf7cbSHeinz Graalfs vq->broken = true; 4225b1bf7cbSHeinz Graalfs return false; 4235b1bf7cbSHeinz Graalfs } 4245b1bf7cbSHeinz Graalfs return true; 42541f0377fSRusty Russell } 42641f0377fSRusty Russell EXPORT_SYMBOL_GPL(virtqueue_notify); 42741f0377fSRusty Russell 42841f0377fSRusty Russell /** 42941f0377fSRusty Russell * virtqueue_kick - update after add_buf 43041f0377fSRusty Russell * @vq: the struct virtqueue 43141f0377fSRusty Russell * 432b3087e48SRusty Russell * After one or more virtqueue_add_* calls, invoke this to kick 43341f0377fSRusty Russell * the other side. 43441f0377fSRusty Russell * 43541f0377fSRusty Russell * Caller must ensure we don't call this with other virtqueue 43641f0377fSRusty Russell * operations at the same time (except where noted). 4375b1bf7cbSHeinz Graalfs * 4385b1bf7cbSHeinz Graalfs * Returns false if kick failed, otherwise true. 43941f0377fSRusty Russell */ 4405b1bf7cbSHeinz Graalfs bool virtqueue_kick(struct virtqueue *vq) 44141f0377fSRusty Russell { 44241f0377fSRusty Russell if (virtqueue_kick_prepare(vq)) 4435b1bf7cbSHeinz Graalfs return virtqueue_notify(vq); 4445b1bf7cbSHeinz Graalfs return true; 4450a8a69ddSRusty Russell } 4467c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_kick); 4470a8a69ddSRusty Russell 4480a8a69ddSRusty Russell static void detach_buf(struct vring_virtqueue *vq, unsigned int head) 4490a8a69ddSRusty Russell { 4500a8a69ddSRusty Russell unsigned int i; 4510a8a69ddSRusty Russell 4520a8a69ddSRusty Russell /* Clear data ptr. */ 4530a8a69ddSRusty Russell vq->data[head] = NULL; 4540a8a69ddSRusty Russell 4550a8a69ddSRusty Russell /* Put back on free list: find end */ 4560a8a69ddSRusty Russell i = head; 4579fa29b9dSMark McLoughlin 4589fa29b9dSMark McLoughlin /* Free the indirect table */ 4599fa29b9dSMark McLoughlin if (vq->vring.desc[i].flags & VRING_DESC_F_INDIRECT) 4609fa29b9dSMark McLoughlin kfree(phys_to_virt(vq->vring.desc[i].addr)); 4619fa29b9dSMark McLoughlin 4620a8a69ddSRusty Russell while (vq->vring.desc[i].flags & VRING_DESC_F_NEXT) { 4630a8a69ddSRusty Russell i = vq->vring.desc[i].next; 46406ca287dSRusty Russell vq->vq.num_free++; 4650a8a69ddSRusty Russell } 4660a8a69ddSRusty Russell 4670a8a69ddSRusty Russell vq->vring.desc[i].next = vq->free_head; 4680a8a69ddSRusty Russell vq->free_head = head; 4690a8a69ddSRusty Russell /* Plus final descriptor */ 47006ca287dSRusty Russell vq->vq.num_free++; 4710a8a69ddSRusty Russell } 4720a8a69ddSRusty Russell 4730a8a69ddSRusty Russell static inline bool more_used(const struct vring_virtqueue *vq) 4740a8a69ddSRusty Russell { 4750a8a69ddSRusty Russell return vq->last_used_idx != vq->vring.used->idx; 4760a8a69ddSRusty Russell } 4770a8a69ddSRusty Russell 4785dfc1762SRusty Russell /** 4795dfc1762SRusty Russell * virtqueue_get_buf - get the next used buffer 4805dfc1762SRusty Russell * @vq: the struct virtqueue we're talking about. 4815dfc1762SRusty Russell * @len: the length written into the buffer 4825dfc1762SRusty Russell * 4835dfc1762SRusty Russell * If the driver wrote data into the buffer, @len will be set to the 4845dfc1762SRusty Russell * amount written. This means you don't need to clear the buffer 4855dfc1762SRusty Russell * beforehand to ensure there's no data leakage in the case of short 4865dfc1762SRusty Russell * writes. 4875dfc1762SRusty Russell * 4885dfc1762SRusty Russell * Caller must ensure we don't call this with other virtqueue 4895dfc1762SRusty Russell * operations at the same time (except where noted). 4905dfc1762SRusty Russell * 4915dfc1762SRusty Russell * Returns NULL if there are no used buffers, or the "data" token 492b3087e48SRusty Russell * handed to virtqueue_add_*(). 4935dfc1762SRusty Russell */ 4947c5e9ed0SMichael S. Tsirkin void *virtqueue_get_buf(struct virtqueue *_vq, unsigned int *len) 4950a8a69ddSRusty Russell { 4960a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 4970a8a69ddSRusty Russell void *ret; 4980a8a69ddSRusty Russell unsigned int i; 4993b720b8cSRusty Russell u16 last_used; 5000a8a69ddSRusty Russell 5010a8a69ddSRusty Russell START_USE(vq); 5020a8a69ddSRusty Russell 5035ef82752SRusty Russell if (unlikely(vq->broken)) { 5045ef82752SRusty Russell END_USE(vq); 5055ef82752SRusty Russell return NULL; 5065ef82752SRusty Russell } 5075ef82752SRusty Russell 5080a8a69ddSRusty Russell if (!more_used(vq)) { 5090a8a69ddSRusty Russell pr_debug("No more buffers in queue\n"); 5100a8a69ddSRusty Russell END_USE(vq); 5110a8a69ddSRusty Russell return NULL; 5120a8a69ddSRusty Russell } 5130a8a69ddSRusty Russell 5142d61ba95SMichael S. Tsirkin /* Only get used array entries after they have been exposed by host. */ 515a9a0fef7SRusty Russell virtio_rmb(vq->weak_barriers); 5162d61ba95SMichael S. Tsirkin 5173b720b8cSRusty Russell last_used = (vq->last_used_idx & (vq->vring.num - 1)); 5183b720b8cSRusty Russell i = vq->vring.used->ring[last_used].id; 5193b720b8cSRusty Russell *len = vq->vring.used->ring[last_used].len; 5200a8a69ddSRusty Russell 5210a8a69ddSRusty Russell if (unlikely(i >= vq->vring.num)) { 5220a8a69ddSRusty Russell BAD_RING(vq, "id %u out of range\n", i); 5230a8a69ddSRusty Russell return NULL; 5240a8a69ddSRusty Russell } 5250a8a69ddSRusty Russell if (unlikely(!vq->data[i])) { 5260a8a69ddSRusty Russell BAD_RING(vq, "id %u is not a head!\n", i); 5270a8a69ddSRusty Russell return NULL; 5280a8a69ddSRusty Russell } 5290a8a69ddSRusty Russell 5300a8a69ddSRusty Russell /* detach_buf clears data, so grab it now. */ 5310a8a69ddSRusty Russell ret = vq->data[i]; 5320a8a69ddSRusty Russell detach_buf(vq, i); 5330a8a69ddSRusty Russell vq->last_used_idx++; 534a5c262c5SMichael S. Tsirkin /* If we expect an interrupt for the next entry, tell host 535a5c262c5SMichael S. Tsirkin * by writing event index and flush out the write before 536a5c262c5SMichael S. Tsirkin * the read in the next get_buf call. */ 537a5c262c5SMichael S. Tsirkin if (!(vq->vring.avail->flags & VRING_AVAIL_F_NO_INTERRUPT)) { 538a5c262c5SMichael S. Tsirkin vring_used_event(&vq->vring) = vq->last_used_idx; 539a9a0fef7SRusty Russell virtio_mb(vq->weak_barriers); 540a5c262c5SMichael S. Tsirkin } 541a5c262c5SMichael S. Tsirkin 542e93300b1SRusty Russell #ifdef DEBUG 543e93300b1SRusty Russell vq->last_add_time_valid = false; 544e93300b1SRusty Russell #endif 545e93300b1SRusty Russell 5460a8a69ddSRusty Russell END_USE(vq); 5470a8a69ddSRusty Russell return ret; 5480a8a69ddSRusty Russell } 5497c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_get_buf); 5500a8a69ddSRusty Russell 5515dfc1762SRusty Russell /** 5525dfc1762SRusty Russell * virtqueue_disable_cb - disable callbacks 5535dfc1762SRusty Russell * @vq: the struct virtqueue we're talking about. 5545dfc1762SRusty Russell * 5555dfc1762SRusty Russell * Note that this is not necessarily synchronous, hence unreliable and only 5565dfc1762SRusty Russell * useful as an optimization. 5575dfc1762SRusty Russell * 5585dfc1762SRusty Russell * Unlike other operations, this need not be serialized. 5595dfc1762SRusty Russell */ 5607c5e9ed0SMichael S. Tsirkin void virtqueue_disable_cb(struct virtqueue *_vq) 56118445c4dSRusty Russell { 56218445c4dSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 56318445c4dSRusty Russell 56418445c4dSRusty Russell vq->vring.avail->flags |= VRING_AVAIL_F_NO_INTERRUPT; 56518445c4dSRusty Russell } 5667c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_disable_cb); 56718445c4dSRusty Russell 5685dfc1762SRusty Russell /** 569cc229884SMichael S. Tsirkin * virtqueue_enable_cb_prepare - restart callbacks after disable_cb 570cc229884SMichael S. Tsirkin * @vq: the struct virtqueue we're talking about. 571cc229884SMichael S. Tsirkin * 572cc229884SMichael S. Tsirkin * This re-enables callbacks; it returns current queue state 573cc229884SMichael S. Tsirkin * in an opaque unsigned value. This value should be later tested by 574cc229884SMichael S. Tsirkin * virtqueue_poll, to detect a possible race between the driver checking for 575cc229884SMichael S. Tsirkin * more work, and enabling callbacks. 576cc229884SMichael S. Tsirkin * 577cc229884SMichael S. Tsirkin * Caller must ensure we don't call this with other virtqueue 578cc229884SMichael S. Tsirkin * operations at the same time (except where noted). 579cc229884SMichael S. Tsirkin */ 580cc229884SMichael S. Tsirkin unsigned virtqueue_enable_cb_prepare(struct virtqueue *_vq) 581cc229884SMichael S. Tsirkin { 582cc229884SMichael S. Tsirkin struct vring_virtqueue *vq = to_vvq(_vq); 583cc229884SMichael S. Tsirkin u16 last_used_idx; 584cc229884SMichael S. Tsirkin 585cc229884SMichael S. Tsirkin START_USE(vq); 586cc229884SMichael S. Tsirkin 587cc229884SMichael S. Tsirkin /* We optimistically turn back on interrupts, then check if there was 588cc229884SMichael S. Tsirkin * more to do. */ 589cc229884SMichael S. Tsirkin /* Depending on the VIRTIO_RING_F_EVENT_IDX feature, we need to 590cc229884SMichael S. Tsirkin * either clear the flags bit or point the event index at the next 591cc229884SMichael S. Tsirkin * entry. Always do both to keep code simple. */ 592cc229884SMichael S. Tsirkin vq->vring.avail->flags &= ~VRING_AVAIL_F_NO_INTERRUPT; 593cc229884SMichael S. Tsirkin vring_used_event(&vq->vring) = last_used_idx = vq->last_used_idx; 594cc229884SMichael S. Tsirkin END_USE(vq); 595cc229884SMichael S. Tsirkin return last_used_idx; 596cc229884SMichael S. Tsirkin } 597cc229884SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_enable_cb_prepare); 598cc229884SMichael S. Tsirkin 599cc229884SMichael S. Tsirkin /** 600cc229884SMichael S. Tsirkin * virtqueue_poll - query pending used buffers 601cc229884SMichael S. Tsirkin * @vq: the struct virtqueue we're talking about. 602cc229884SMichael S. Tsirkin * @last_used_idx: virtqueue state (from call to virtqueue_enable_cb_prepare). 603cc229884SMichael S. Tsirkin * 604cc229884SMichael S. Tsirkin * Returns "true" if there are pending used buffers in the queue. 605cc229884SMichael S. Tsirkin * 606cc229884SMichael S. Tsirkin * This does not need to be serialized. 607cc229884SMichael S. Tsirkin */ 608cc229884SMichael S. Tsirkin bool virtqueue_poll(struct virtqueue *_vq, unsigned last_used_idx) 609cc229884SMichael S. Tsirkin { 610cc229884SMichael S. Tsirkin struct vring_virtqueue *vq = to_vvq(_vq); 611cc229884SMichael S. Tsirkin 612cc229884SMichael S. Tsirkin virtio_mb(vq->weak_barriers); 613cc229884SMichael S. Tsirkin return (u16)last_used_idx != vq->vring.used->idx; 614cc229884SMichael S. Tsirkin } 615cc229884SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_poll); 616cc229884SMichael S. Tsirkin 617cc229884SMichael S. Tsirkin /** 6185dfc1762SRusty Russell * virtqueue_enable_cb - restart callbacks after disable_cb. 6195dfc1762SRusty Russell * @vq: the struct virtqueue we're talking about. 6205dfc1762SRusty Russell * 6215dfc1762SRusty Russell * This re-enables callbacks; it returns "false" if there are pending 6225dfc1762SRusty Russell * buffers in the queue, to detect a possible race between the driver 6235dfc1762SRusty Russell * checking for more work, and enabling callbacks. 6245dfc1762SRusty Russell * 6255dfc1762SRusty Russell * Caller must ensure we don't call this with other virtqueue 6265dfc1762SRusty Russell * operations at the same time (except where noted). 6275dfc1762SRusty Russell */ 6287c5e9ed0SMichael S. Tsirkin bool virtqueue_enable_cb(struct virtqueue *_vq) 6290a8a69ddSRusty Russell { 630cc229884SMichael S. Tsirkin unsigned last_used_idx = virtqueue_enable_cb_prepare(_vq); 631cc229884SMichael S. Tsirkin return !virtqueue_poll(_vq, last_used_idx); 6320a8a69ddSRusty Russell } 6337c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_enable_cb); 6340a8a69ddSRusty Russell 6355dfc1762SRusty Russell /** 6365dfc1762SRusty Russell * virtqueue_enable_cb_delayed - restart callbacks after disable_cb. 6375dfc1762SRusty Russell * @vq: the struct virtqueue we're talking about. 6385dfc1762SRusty Russell * 6395dfc1762SRusty Russell * This re-enables callbacks but hints to the other side to delay 6405dfc1762SRusty Russell * interrupts until most of the available buffers have been processed; 6415dfc1762SRusty Russell * it returns "false" if there are many pending buffers in the queue, 6425dfc1762SRusty Russell * to detect a possible race between the driver checking for more work, 6435dfc1762SRusty Russell * and enabling callbacks. 6445dfc1762SRusty Russell * 6455dfc1762SRusty Russell * Caller must ensure we don't call this with other virtqueue 6465dfc1762SRusty Russell * operations at the same time (except where noted). 6475dfc1762SRusty Russell */ 6487ab358c2SMichael S. Tsirkin bool virtqueue_enable_cb_delayed(struct virtqueue *_vq) 6497ab358c2SMichael S. Tsirkin { 6507ab358c2SMichael S. Tsirkin struct vring_virtqueue *vq = to_vvq(_vq); 6517ab358c2SMichael S. Tsirkin u16 bufs; 6527ab358c2SMichael S. Tsirkin 6537ab358c2SMichael S. Tsirkin START_USE(vq); 6547ab358c2SMichael S. Tsirkin 6557ab358c2SMichael S. Tsirkin /* We optimistically turn back on interrupts, then check if there was 6567ab358c2SMichael S. Tsirkin * more to do. */ 6577ab358c2SMichael S. Tsirkin /* Depending on the VIRTIO_RING_F_USED_EVENT_IDX feature, we need to 6587ab358c2SMichael S. Tsirkin * either clear the flags bit or point the event index at the next 6597ab358c2SMichael S. Tsirkin * entry. Always do both to keep code simple. */ 6607ab358c2SMichael S. Tsirkin vq->vring.avail->flags &= ~VRING_AVAIL_F_NO_INTERRUPT; 6617ab358c2SMichael S. Tsirkin /* TODO: tune this threshold */ 6627ab358c2SMichael S. Tsirkin bufs = (u16)(vq->vring.avail->idx - vq->last_used_idx) * 3 / 4; 6637ab358c2SMichael S. Tsirkin vring_used_event(&vq->vring) = vq->last_used_idx + bufs; 664a9a0fef7SRusty Russell virtio_mb(vq->weak_barriers); 6657ab358c2SMichael S. Tsirkin if (unlikely((u16)(vq->vring.used->idx - vq->last_used_idx) > bufs)) { 6667ab358c2SMichael S. Tsirkin END_USE(vq); 6677ab358c2SMichael S. Tsirkin return false; 6687ab358c2SMichael S. Tsirkin } 6697ab358c2SMichael S. Tsirkin 6707ab358c2SMichael S. Tsirkin END_USE(vq); 6717ab358c2SMichael S. Tsirkin return true; 6727ab358c2SMichael S. Tsirkin } 6737ab358c2SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_enable_cb_delayed); 6747ab358c2SMichael S. Tsirkin 6755dfc1762SRusty Russell /** 6765dfc1762SRusty Russell * virtqueue_detach_unused_buf - detach first unused buffer 6775dfc1762SRusty Russell * @vq: the struct virtqueue we're talking about. 6785dfc1762SRusty Russell * 679b3087e48SRusty Russell * Returns NULL or the "data" token handed to virtqueue_add_*(). 6805dfc1762SRusty Russell * This is not valid on an active queue; it is useful only for device 6815dfc1762SRusty Russell * shutdown. 6825dfc1762SRusty Russell */ 6837c5e9ed0SMichael S. Tsirkin void *virtqueue_detach_unused_buf(struct virtqueue *_vq) 684c021eac4SShirley Ma { 685c021eac4SShirley Ma struct vring_virtqueue *vq = to_vvq(_vq); 686c021eac4SShirley Ma unsigned int i; 687c021eac4SShirley Ma void *buf; 688c021eac4SShirley Ma 689c021eac4SShirley Ma START_USE(vq); 690c021eac4SShirley Ma 691c021eac4SShirley Ma for (i = 0; i < vq->vring.num; i++) { 692c021eac4SShirley Ma if (!vq->data[i]) 693c021eac4SShirley Ma continue; 694c021eac4SShirley Ma /* detach_buf clears data, so grab it now. */ 695c021eac4SShirley Ma buf = vq->data[i]; 696c021eac4SShirley Ma detach_buf(vq, i); 697b3258ff1SAmit Shah vq->vring.avail->idx--; 698c021eac4SShirley Ma END_USE(vq); 699c021eac4SShirley Ma return buf; 700c021eac4SShirley Ma } 701c021eac4SShirley Ma /* That should have freed everything. */ 70206ca287dSRusty Russell BUG_ON(vq->vq.num_free != vq->vring.num); 703c021eac4SShirley Ma 704c021eac4SShirley Ma END_USE(vq); 705c021eac4SShirley Ma return NULL; 706c021eac4SShirley Ma } 7077c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_detach_unused_buf); 708c021eac4SShirley Ma 7090a8a69ddSRusty Russell irqreturn_t vring_interrupt(int irq, void *_vq) 7100a8a69ddSRusty Russell { 7110a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 7120a8a69ddSRusty Russell 7130a8a69ddSRusty Russell if (!more_used(vq)) { 7140a8a69ddSRusty Russell pr_debug("virtqueue interrupt with no work for %p\n", vq); 7150a8a69ddSRusty Russell return IRQ_NONE; 7160a8a69ddSRusty Russell } 7170a8a69ddSRusty Russell 7180a8a69ddSRusty Russell if (unlikely(vq->broken)) 7190a8a69ddSRusty Russell return IRQ_HANDLED; 7200a8a69ddSRusty Russell 7210a8a69ddSRusty Russell pr_debug("virtqueue callback for %p (%p)\n", vq, vq->vq.callback); 72218445c4dSRusty Russell if (vq->vq.callback) 72318445c4dSRusty Russell vq->vq.callback(&vq->vq); 7240a8a69ddSRusty Russell 7250a8a69ddSRusty Russell return IRQ_HANDLED; 7260a8a69ddSRusty Russell } 727c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_interrupt); 7280a8a69ddSRusty Russell 72917bb6d40SJason Wang struct virtqueue *vring_new_virtqueue(unsigned int index, 73017bb6d40SJason Wang unsigned int num, 73187c7d57cSRusty Russell unsigned int vring_align, 7320a8a69ddSRusty Russell struct virtio_device *vdev, 7337b21e34fSRusty Russell bool weak_barriers, 7340a8a69ddSRusty Russell void *pages, 73546f9c2b9SHeinz Graalfs bool (*notify)(struct virtqueue *), 7369499f5e7SRusty Russell void (*callback)(struct virtqueue *), 7379499f5e7SRusty Russell const char *name) 7380a8a69ddSRusty Russell { 7390a8a69ddSRusty Russell struct vring_virtqueue *vq; 7400a8a69ddSRusty Russell unsigned int i; 7410a8a69ddSRusty Russell 74242b36cc0SRusty Russell /* We assume num is a power of 2. */ 74342b36cc0SRusty Russell if (num & (num - 1)) { 74442b36cc0SRusty Russell dev_warn(&vdev->dev, "Bad virtqueue length %u\n", num); 74542b36cc0SRusty Russell return NULL; 74642b36cc0SRusty Russell } 74742b36cc0SRusty Russell 7480a8a69ddSRusty Russell vq = kmalloc(sizeof(*vq) + sizeof(void *)*num, GFP_KERNEL); 7490a8a69ddSRusty Russell if (!vq) 7500a8a69ddSRusty Russell return NULL; 7510a8a69ddSRusty Russell 75287c7d57cSRusty Russell vring_init(&vq->vring, num, pages, vring_align); 7530a8a69ddSRusty Russell vq->vq.callback = callback; 7540a8a69ddSRusty Russell vq->vq.vdev = vdev; 7559499f5e7SRusty Russell vq->vq.name = name; 75606ca287dSRusty Russell vq->vq.num_free = num; 75706ca287dSRusty Russell vq->vq.index = index; 7580a8a69ddSRusty Russell vq->notify = notify; 7597b21e34fSRusty Russell vq->weak_barriers = weak_barriers; 7600a8a69ddSRusty Russell vq->broken = false; 7610a8a69ddSRusty Russell vq->last_used_idx = 0; 7620a8a69ddSRusty Russell vq->num_added = 0; 7639499f5e7SRusty Russell list_add_tail(&vq->vq.list, &vdev->vqs); 7640a8a69ddSRusty Russell #ifdef DEBUG 7650a8a69ddSRusty Russell vq->in_use = false; 766e93300b1SRusty Russell vq->last_add_time_valid = false; 7670a8a69ddSRusty Russell #endif 7680a8a69ddSRusty Russell 7699fa29b9dSMark McLoughlin vq->indirect = virtio_has_feature(vdev, VIRTIO_RING_F_INDIRECT_DESC); 770a5c262c5SMichael S. Tsirkin vq->event = virtio_has_feature(vdev, VIRTIO_RING_F_EVENT_IDX); 7719fa29b9dSMark McLoughlin 7720a8a69ddSRusty Russell /* No callback? Tell other side not to bother us. */ 7730a8a69ddSRusty Russell if (!callback) 7740a8a69ddSRusty Russell vq->vring.avail->flags |= VRING_AVAIL_F_NO_INTERRUPT; 7750a8a69ddSRusty Russell 7760a8a69ddSRusty Russell /* Put everything in free lists. */ 7770a8a69ddSRusty Russell vq->free_head = 0; 7783b870624SAmit Shah for (i = 0; i < num-1; i++) { 7790a8a69ddSRusty Russell vq->vring.desc[i].next = i+1; 7803b870624SAmit Shah vq->data[i] = NULL; 7813b870624SAmit Shah } 7823b870624SAmit Shah vq->data[i] = NULL; 7830a8a69ddSRusty Russell 7840a8a69ddSRusty Russell return &vq->vq; 7850a8a69ddSRusty Russell } 786c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_new_virtqueue); 7870a8a69ddSRusty Russell 7880a8a69ddSRusty Russell void vring_del_virtqueue(struct virtqueue *vq) 7890a8a69ddSRusty Russell { 7909499f5e7SRusty Russell list_del(&vq->list); 7910a8a69ddSRusty Russell kfree(to_vvq(vq)); 7920a8a69ddSRusty Russell } 793c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_del_virtqueue); 7940a8a69ddSRusty Russell 795e34f8725SRusty Russell /* Manipulates transport-specific feature bits. */ 796e34f8725SRusty Russell void vring_transport_features(struct virtio_device *vdev) 797e34f8725SRusty Russell { 798e34f8725SRusty Russell unsigned int i; 799e34f8725SRusty Russell 800e34f8725SRusty Russell for (i = VIRTIO_TRANSPORT_F_START; i < VIRTIO_TRANSPORT_F_END; i++) { 801e34f8725SRusty Russell switch (i) { 8029fa29b9dSMark McLoughlin case VIRTIO_RING_F_INDIRECT_DESC: 8039fa29b9dSMark McLoughlin break; 804a5c262c5SMichael S. Tsirkin case VIRTIO_RING_F_EVENT_IDX: 805a5c262c5SMichael S. Tsirkin break; 806e34f8725SRusty Russell default: 807e34f8725SRusty Russell /* We don't understand this bit. */ 808e34f8725SRusty Russell clear_bit(i, vdev->features); 809e34f8725SRusty Russell } 810e34f8725SRusty Russell } 811e34f8725SRusty Russell } 812e34f8725SRusty Russell EXPORT_SYMBOL_GPL(vring_transport_features); 813e34f8725SRusty Russell 8145dfc1762SRusty Russell /** 8155dfc1762SRusty Russell * virtqueue_get_vring_size - return the size of the virtqueue's vring 8165dfc1762SRusty Russell * @vq: the struct virtqueue containing the vring of interest. 8175dfc1762SRusty Russell * 8185dfc1762SRusty Russell * Returns the size of the vring. This is mainly used for boasting to 8195dfc1762SRusty Russell * userspace. Unlike other operations, this need not be serialized. 8205dfc1762SRusty Russell */ 8218f9f4668SRick Jones unsigned int virtqueue_get_vring_size(struct virtqueue *_vq) 8228f9f4668SRick Jones { 8238f9f4668SRick Jones 8248f9f4668SRick Jones struct vring_virtqueue *vq = to_vvq(_vq); 8258f9f4668SRick Jones 8268f9f4668SRick Jones return vq->vring.num; 8278f9f4668SRick Jones } 8288f9f4668SRick Jones EXPORT_SYMBOL_GPL(virtqueue_get_vring_size); 8298f9f4668SRick Jones 830b3b32c94SHeinz Graalfs bool virtqueue_is_broken(struct virtqueue *_vq) 831b3b32c94SHeinz Graalfs { 832b3b32c94SHeinz Graalfs struct vring_virtqueue *vq = to_vvq(_vq); 833b3b32c94SHeinz Graalfs 834b3b32c94SHeinz Graalfs return vq->broken; 835b3b32c94SHeinz Graalfs } 836b3b32c94SHeinz Graalfs EXPORT_SYMBOL_GPL(virtqueue_is_broken); 837b3b32c94SHeinz Graalfs 838e2dcdfe9SRusty Russell /* 839e2dcdfe9SRusty Russell * This should prevent the device from being used, allowing drivers to 840e2dcdfe9SRusty Russell * recover. You may need to grab appropriate locks to flush. 841e2dcdfe9SRusty Russell */ 842e2dcdfe9SRusty Russell void virtio_break_device(struct virtio_device *dev) 843e2dcdfe9SRusty Russell { 844e2dcdfe9SRusty Russell struct virtqueue *_vq; 845e2dcdfe9SRusty Russell 846e2dcdfe9SRusty Russell list_for_each_entry(_vq, &dev->vqs, list) { 847e2dcdfe9SRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 848e2dcdfe9SRusty Russell vq->broken = true; 849e2dcdfe9SRusty Russell } 850e2dcdfe9SRusty Russell } 851e2dcdfe9SRusty Russell EXPORT_SYMBOL_GPL(virtio_break_device); 852e2dcdfe9SRusty Russell 853c6fd4701SRusty Russell MODULE_LICENSE("GPL"); 854