/* Virtio ring implementation.
 *
 *  Copyright 2007 Rusty Russell IBM Corporation
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301 USA
 */
#include <linux/virtio.h>
#include <linux/virtio_ring.h>
#include <linux/virtio_config.h>
#include <linux/device.h>
#include <linux/slab.h>
#include <linux/module.h>
#include <linux/hrtimer.h>
#include <linux/dma-mapping.h>
#include <xen/xen.h>

#ifdef DEBUG
/* For development, we want to crash whenever the ring is screwed. */
#define BAD_RING(_vq, fmt, args...)				\
	do {							\
		dev_err(&(_vq)->vq.vdev->dev,			\
			"%s:"fmt, (_vq)->vq.name, ##args);	\
		BUG();						\
	} while (0)
/* Caller is supposed to guarantee no reentry. */
#define START_USE(_vq)						\
	do {							\
		if ((_vq)->in_use)				\
			panic("%s:in_use = %i\n",		\
			      (_vq)->vq.name, (_vq)->in_use);	\
		(_vq)->in_use = __LINE__;			\
	} while (0)
#define END_USE(_vq) \
	do { BUG_ON(!(_vq)->in_use); (_vq)->in_use = 0; } while(0)
#define LAST_ADD_TIME_UPDATE(_vq)				\
	do {							\
		ktime_t now = ktime_get();			\
								\
		/* No kick or get, with .1 second between?  Warn. */ \
		if ((_vq)->last_add_time_valid)			\
			WARN_ON(ktime_to_ms(ktime_sub(now,	\
				(_vq)->last_add_time)) > 100);	\
		(_vq)->last_add_time = now;			\
		(_vq)->last_add_time_valid = true;		\
	} while (0)
#define LAST_ADD_TIME_CHECK(_vq)				\
	do {							\
		if ((_vq)->last_add_time_valid) {		\
			WARN_ON(ktime_to_ms(ktime_sub(ktime_get(), \
				(_vq)->last_add_time)) > 100);	\
		}						\
	} while (0)
#define LAST_ADD_TIME_INVALID(_vq)				\
	((_vq)->last_add_time_valid = false)
#else
#define BAD_RING(_vq, fmt, args...)				\
	do {							\
		dev_err(&_vq->vq.vdev->dev,			\
			"%s:"fmt, (_vq)->vq.name, ##args);	\
		(_vq)->broken = true;				\
	} while (0)
#define START_USE(vq)
#define END_USE(vq)
#define LAST_ADD_TIME_UPDATE(vq)
#define LAST_ADD_TIME_CHECK(vq)
#define LAST_ADD_TIME_INVALID(vq)
#endif

struct vring_desc_state {
	void *data;			/* Data for callback. */
	struct vring_desc *indir_desc;	/* Indirect descriptor, if any. */
};

struct vring_virtqueue {
	struct virtqueue vq;

	/* Can we use weak barriers? */
	bool weak_barriers;

	/* Other side has made a mess, don't try any more. */
	bool broken;

	/* Host supports indirect buffers */
	bool indirect;

	/* Host publishes avail event idx */
	bool event;

	/* Head of free buffer list. */
	unsigned int free_head;
	/* Number we've added since last sync. */
	unsigned int num_added;

	/* Last used index we've seen. */
	u16 last_used_idx;

	struct {
		/* Actual memory layout for this queue */
		struct vring vring;

		/* Last written value to avail->flags */
		u16 avail_flags_shadow;

		/* Last written value to avail->idx in guest byte order */
		u16 avail_idx_shadow;
	} split;

	/* How to notify other side. FIXME: commonalize hcalls! */
	bool (*notify)(struct virtqueue *vq);

	/* DMA, allocation, and size information */
	bool we_own_ring;
	size_t queue_size_in_bytes;
	dma_addr_t queue_dma_addr;

#ifdef DEBUG
	/* They're supposed to lock for us. */
	unsigned int in_use;

	/* Figure out if their kicks are too delayed. */
	bool last_add_time_valid;
	ktime_t last_add_time;
#endif

	/* Per-descriptor state. */
	struct vring_desc_state desc_state[];
};


/*
 * Helpers.
 */

#define to_vvq(_vq) container_of(_vq, struct vring_virtqueue, vq)

/*
 * Modern virtio devices have feature bits to specify whether they need a
 * quirk and bypass the IOMMU. If not there, just use the DMA API.
 *
 * If there, the interaction between virtio and DMA API is messy.
 *
 * On most systems with virtio, physical addresses match bus addresses,
 * and it doesn't particularly matter whether we use the DMA API.
 *
 * On some systems, including Xen and any system with a physical device
 * that speaks virtio behind a physical IOMMU, we must use the DMA API
 * for virtio DMA to work at all.
 *
 * On other systems, including SPARC and PPC64, virtio-pci devices are
 * enumerated as though they are behind an IOMMU, but the virtio host
 * ignores the IOMMU, so we must either pretend that the IOMMU isn't
 * there or somehow map everything as the identity.
 *
 * For the time being, we preserve historic behavior and bypass the DMA
 * API.
 *
 * TODO: install a per-device DMA ops structure that does the right thing
 * taking into account all the above quirks, and use the DMA API
 * unconditionally on data path.
 */

static bool vring_use_dma_api(struct virtio_device *vdev)
{
	if (!virtio_has_iommu_quirk(vdev))
		return true;

	/* Otherwise, we are left to guess. */
	/*
	 * In theory, it's possible to have a buggy QEMU-supplied
	 * emulated Q35 IOMMU and Xen enabled at the same time.  On
	 * such a configuration, virtio has never worked and will
	 * not work without an even larger kludge.  Instead, enable
	 * the DMA API if we're a Xen guest, which at least allows
	 * all of the sensible Xen configurations to work correctly.
	 */
	if (xen_domain())
		return true;

	return false;
}

/*
 * The DMA ops on various arches are rather gnarly right now, and
 * making all of the arch DMA ops work on the vring device itself
 * is a mess.  For now, we use the parent device for DMA ops.
 */
static inline struct device *vring_dma_dev(const struct vring_virtqueue *vq)
{
	return vq->vq.vdev->dev.parent;
}

/* Map one sg entry. */
static dma_addr_t vring_map_one_sg(const struct vring_virtqueue *vq,
				   struct scatterlist *sg,
				   enum dma_data_direction direction)
{
	if (!vring_use_dma_api(vq->vq.vdev))
		return (dma_addr_t)sg_phys(sg);

	/*
	 * We can't use dma_map_sg, because we don't use scatterlists in
	 * the way it expects (we don't guarantee that the scatterlist
	 * will exist for the lifetime of the mapping).
	 */
	return dma_map_page(vring_dma_dev(vq),
			    sg_page(sg), sg->offset, sg->length,
			    direction);
}

static dma_addr_t vring_map_single(const struct vring_virtqueue *vq,
				   void *cpu_addr, size_t size,
				   enum dma_data_direction direction)
{
	if (!vring_use_dma_api(vq->vq.vdev))
		return (dma_addr_t)virt_to_phys(cpu_addr);

	return dma_map_single(vring_dma_dev(vq),
			      cpu_addr, size, direction);
}

static int vring_mapping_error(const struct vring_virtqueue *vq,
			       dma_addr_t addr)
{
	if (!vring_use_dma_api(vq->vq.vdev))
		return 0;

	return dma_mapping_error(vring_dma_dev(vq), addr);
}


/*
 * Split ring specific functions - *_split().
 */

static void vring_unmap_one_split(const struct vring_virtqueue *vq,
				  struct vring_desc *desc)
{
	u16 flags;

	if (!vring_use_dma_api(vq->vq.vdev))
		return;

	flags = virtio16_to_cpu(vq->vq.vdev, desc->flags);

	if (flags & VRING_DESC_F_INDIRECT) {
		dma_unmap_single(vring_dma_dev(vq),
				 virtio64_to_cpu(vq->vq.vdev, desc->addr),
				 virtio32_to_cpu(vq->vq.vdev, desc->len),
				 (flags & VRING_DESC_F_WRITE) ?
				 DMA_FROM_DEVICE : DMA_TO_DEVICE);
	} else {
		dma_unmap_page(vring_dma_dev(vq),
			       virtio64_to_cpu(vq->vq.vdev, desc->addr),
			       virtio32_to_cpu(vq->vq.vdev, desc->len),
			       (flags & VRING_DESC_F_WRITE) ?
			       DMA_FROM_DEVICE : DMA_TO_DEVICE);
	}
}

static struct vring_desc *alloc_indirect_split(struct virtqueue *_vq,
					       unsigned int total_sg,
					       gfp_t gfp)
{
	struct vring_desc *desc;
	unsigned int i;

	/*
	 * We require lowmem mappings for the descriptors because
	 * otherwise virt_to_phys will give us bogus addresses in the
	 * virtqueue.
	 */
	gfp &= ~__GFP_HIGHMEM;

	desc = kmalloc_array(total_sg, sizeof(struct vring_desc), gfp);
	if (!desc)
		return NULL;

	for (i = 0; i < total_sg; i++)
		desc[i].next = cpu_to_virtio16(_vq->vdev, i + 1);
	return desc;
}

static inline int virtqueue_add_split(struct virtqueue *_vq,
				      struct scatterlist *sgs[],
				      unsigned int total_sg,
				      unsigned int out_sgs,
				      unsigned int in_sgs,
				      void *data,
				      void *ctx,
				      gfp_t gfp)
{
	struct vring_virtqueue *vq = to_vvq(_vq);
	struct scatterlist *sg;
	struct vring_desc *desc;
	unsigned int i, n, avail, descs_used, uninitialized_var(prev), err_idx;
	int head;
	bool indirect;

	START_USE(vq);

	BUG_ON(data == NULL);
	BUG_ON(ctx && vq->indirect);

	if (unlikely(vq->broken)) {
		END_USE(vq);
		return -EIO;
	}

	LAST_ADD_TIME_UPDATE(vq);

	BUG_ON(total_sg == 0);

	head = vq->free_head;

	/* If the host supports indirect descriptor tables, and we have multiple
	 * buffers, then go indirect. FIXME: tune this threshold */
	if (vq->indirect && total_sg > 1 && vq->vq.num_free)
		desc = alloc_indirect_split(_vq, total_sg, gfp);
	else {
		desc = NULL;
		WARN_ON_ONCE(total_sg > vq->split.vring.num && !vq->indirect);
	}

	if (desc) {
		/* Use a single buffer which doesn't continue */
		indirect = true;
		/* Set up rest to use this indirect table. */
		i = 0;
		descs_used = 1;
	} else {
		indirect = false;
		desc = vq->split.vring.desc;
		i = head;
		descs_used = total_sg;
	}

	if (vq->vq.num_free < descs_used) {
		pr_debug("Can't add buf len %i - avail = %i\n",
			 descs_used, vq->vq.num_free);
		/* FIXME: for historical reasons, we force a notify here if
		 * there are outgoing parts to the buffer.  Presumably the
		 * host should service the ring ASAP. */
		if (out_sgs)
			vq->notify(&vq->vq);
		if (indirect)
			kfree(desc);
		END_USE(vq);
		return -ENOSPC;
	}

	for (n = 0; n < out_sgs; n++) {
		for (sg = sgs[n]; sg; sg = sg_next(sg)) {
			dma_addr_t addr = vring_map_one_sg(vq, sg, DMA_TO_DEVICE);
			if (vring_mapping_error(vq, addr))
				goto unmap_release;

			desc[i].flags = cpu_to_virtio16(_vq->vdev, VRING_DESC_F_NEXT);
			desc[i].addr = cpu_to_virtio64(_vq->vdev, addr);
			desc[i].len = cpu_to_virtio32(_vq->vdev, sg->length);
			prev = i;
			i = virtio16_to_cpu(_vq->vdev, desc[i].next);
		}
	}
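	/* Device-writable buffers follow the readable ones: chained the same
	 * way, but flagged VRING_DESC_F_WRITE so the device may write them. */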
	for (; n < (out_sgs + in_sgs); n++) {
		for (sg = sgs[n]; sg; sg = sg_next(sg)) {
			dma_addr_t addr = vring_map_one_sg(vq, sg, DMA_FROM_DEVICE);
			if (vring_mapping_error(vq, addr))
				goto unmap_release;

			desc[i].flags = cpu_to_virtio16(_vq->vdev, VRING_DESC_F_NEXT | VRING_DESC_F_WRITE);
			desc[i].addr = cpu_to_virtio64(_vq->vdev, addr);
			desc[i].len = cpu_to_virtio32(_vq->vdev, sg->length);
			prev = i;
			i = virtio16_to_cpu(_vq->vdev, desc[i].next);
		}
	}
	/* Last one doesn't continue. */
	desc[prev].flags &= cpu_to_virtio16(_vq->vdev, ~VRING_DESC_F_NEXT);

	if (indirect) {
		/* Now that the indirect table is filled in, map it. */
		dma_addr_t addr = vring_map_single(
			vq, desc, total_sg * sizeof(struct vring_desc),
			DMA_TO_DEVICE);
		if (vring_mapping_error(vq, addr))
			goto unmap_release;

		vq->split.vring.desc[head].flags = cpu_to_virtio16(_vq->vdev,
				VRING_DESC_F_INDIRECT);
		vq->split.vring.desc[head].addr = cpu_to_virtio64(_vq->vdev,
				addr);

		vq->split.vring.desc[head].len = cpu_to_virtio32(_vq->vdev,
				total_sg * sizeof(struct vring_desc));
	}

	/* We're using some buffers from the free list. */
	vq->vq.num_free -= descs_used;

	/* Update free pointer */
	if (indirect)
		vq->free_head = virtio16_to_cpu(_vq->vdev,
					vq->split.vring.desc[head].next);
	else
		vq->free_head = i;

	/* Store token and indirect buffer state. */
	vq->desc_state[head].data = data;
	if (indirect)
		vq->desc_state[head].indir_desc = desc;
	else
		vq->desc_state[head].indir_desc = ctx;

	/* Put entry in available array (but don't update avail->idx until they
	 * do sync). */
	avail = vq->split.avail_idx_shadow & (vq->split.vring.num - 1);
	vq->split.vring.avail->ring[avail] = cpu_to_virtio16(_vq->vdev, head);

	/* Descriptors and available array need to be set before we expose the
	 * new available array entries. */
	virtio_wmb(vq->weak_barriers);
	vq->split.avail_idx_shadow++;
	vq->split.vring.avail->idx = cpu_to_virtio16(_vq->vdev,
						vq->split.avail_idx_shadow);
	vq->num_added++;

	pr_debug("Added buffer head %i to %p\n", head, vq);
	END_USE(vq);

	/* This is very unlikely, but theoretically possible.  Kick
	 * just in case. */
	if (unlikely(vq->num_added == (1 << 16) - 1))
		virtqueue_kick(_vq);

	return 0;

unmap_release:
	err_idx = i;
	i = head;

	for (n = 0; n < total_sg; n++) {
		if (i == err_idx)
			break;
		vring_unmap_one_split(vq, &desc[i]);
		i = virtio16_to_cpu(_vq->vdev, vq->split.vring.desc[i].next);
	}

	if (indirect)
		kfree(desc);

	END_USE(vq);
	return -EIO;
}

static bool virtqueue_kick_prepare_split(struct virtqueue *_vq)
{
	struct vring_virtqueue *vq = to_vvq(_vq);
	u16 new, old;
	bool needs_kick;

	START_USE(vq);
	/* We need to expose available array entries before checking avail
	 * event. */
	virtio_mb(vq->weak_barriers);

	old = vq->split.avail_idx_shadow - vq->num_added;
	new = vq->split.avail_idx_shadow;
	vq->num_added = 0;

	LAST_ADD_TIME_CHECK(vq);
	LAST_ADD_TIME_INVALID(vq);

	if (vq->event) {
		needs_kick = vring_need_event(virtio16_to_cpu(_vq->vdev,
					vring_avail_event(&vq->split.vring)),
					      new, old);
	} else {
		needs_kick = !(vq->split.vring.used->flags &
					cpu_to_virtio16(_vq->vdev,
						VRING_USED_F_NO_NOTIFY));
	}
	END_USE(vq);
	return needs_kick;
}
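
/*
 * Worked example of the event-index branch above (illustrative numbers):
 * with old = 2, new = 5 and the device's avail event at 3,
 * vring_need_event() computes (u16)(5 - 3 - 1) < (u16)(5 - 2), i.e.
 * 1 < 3, so a kick is needed: the device asked to be notified once the
 * avail index moved past 3, which this batch of adds did.
 */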

static void detach_buf_split(struct vring_virtqueue *vq, unsigned int head,
			     void **ctx)
{
	unsigned int i, j;
	__virtio16 nextflag = cpu_to_virtio16(vq->vq.vdev, VRING_DESC_F_NEXT);

	/* Clear data ptr. */
	vq->desc_state[head].data = NULL;

	/* Put back on free list: unmap first-level descriptors and find end */
	i = head;

	while (vq->split.vring.desc[i].flags & nextflag) {
		vring_unmap_one_split(vq, &vq->split.vring.desc[i]);
		i = virtio16_to_cpu(vq->vq.vdev, vq->split.vring.desc[i].next);
		vq->vq.num_free++;
	}

	vring_unmap_one_split(vq, &vq->split.vring.desc[i]);
	vq->split.vring.desc[i].next = cpu_to_virtio16(vq->vq.vdev,
						vq->free_head);
	vq->free_head = head;

	/* Plus final descriptor */
	vq->vq.num_free++;

	if (vq->indirect) {
		struct vring_desc *indir_desc = vq->desc_state[head].indir_desc;
		u32 len;

		/* Free the indirect table, if any, now that it's unmapped. */
		if (!indir_desc)
			return;

		len = virtio32_to_cpu(vq->vq.vdev,
				      vq->split.vring.desc[head].len);

		BUG_ON(!(vq->split.vring.desc[head].flags &
			 cpu_to_virtio16(vq->vq.vdev, VRING_DESC_F_INDIRECT)));
		BUG_ON(len == 0 || len % sizeof(struct vring_desc));

		for (j = 0; j < len / sizeof(struct vring_desc); j++)
			vring_unmap_one_split(vq, &indir_desc[j]);

		kfree(indir_desc);
		vq->desc_state[head].indir_desc = NULL;
	} else if (ctx) {
		*ctx = vq->desc_state[head].indir_desc;
	}
}

static inline bool more_used_split(const struct vring_virtqueue *vq)
{
	return vq->last_used_idx != virtio16_to_cpu(vq->vq.vdev,
			vq->split.vring.used->idx);
}
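
/*
 * Note: last_used_idx and used->idx are free-running 16-bit counters;
 * they are compared directly and only masked with (vring.num - 1) when
 * indexing the ring arrays, so wraparound at 65536 is harmless.
 */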

static void *virtqueue_get_buf_ctx_split(struct virtqueue *_vq,
					 unsigned int *len,
					 void **ctx)
{
	struct vring_virtqueue *vq = to_vvq(_vq);
	void *ret;
	unsigned int i;
	u16 last_used;

	START_USE(vq);

	if (unlikely(vq->broken)) {
		END_USE(vq);
		return NULL;
	}

	if (!more_used_split(vq)) {
		pr_debug("No more buffers in queue\n");
		END_USE(vq);
		return NULL;
	}

	/* Only get used array entries after they have been exposed by host. */
	virtio_rmb(vq->weak_barriers);

	last_used = (vq->last_used_idx & (vq->split.vring.num - 1));
	i = virtio32_to_cpu(_vq->vdev,
			vq->split.vring.used->ring[last_used].id);
	*len = virtio32_to_cpu(_vq->vdev,
			vq->split.vring.used->ring[last_used].len);

	if (unlikely(i >= vq->split.vring.num)) {
		BAD_RING(vq, "id %u out of range\n", i);
		return NULL;
	}
	if (unlikely(!vq->desc_state[i].data)) {
		BAD_RING(vq, "id %u is not a head!\n", i);
		return NULL;
	}

	/* detach_buf_split clears data, so grab it now. */
	ret = vq->desc_state[i].data;
	detach_buf_split(vq, i, ctx);
	vq->last_used_idx++;
	/* If we expect an interrupt for the next entry, tell host
	 * by writing event index and flush out the write before
	 * the read in the next get_buf call. */
	if (!(vq->split.avail_flags_shadow & VRING_AVAIL_F_NO_INTERRUPT))
		virtio_store_mb(vq->weak_barriers,
				&vring_used_event(&vq->split.vring),
				cpu_to_virtio16(_vq->vdev, vq->last_used_idx));

	LAST_ADD_TIME_INVALID(vq);

	END_USE(vq);
	return ret;
}

static void virtqueue_disable_cb_split(struct virtqueue *_vq)
{
	struct vring_virtqueue *vq = to_vvq(_vq);

	if (!(vq->split.avail_flags_shadow & VRING_AVAIL_F_NO_INTERRUPT)) {
		vq->split.avail_flags_shadow |= VRING_AVAIL_F_NO_INTERRUPT;
		if (!vq->event)
			vq->split.vring.avail->flags =
				cpu_to_virtio16(_vq->vdev,
						vq->split.avail_flags_shadow);
	}
}
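
/*
 * The avail_flags_shadow checks above avoid re-reading the shared
 * avail->flags field on every toggle; with VIRTIO_RING_F_EVENT_IDX
 * negotiated (vq->event) the device uses the event index instead of
 * that field, so the write to the ring is skipped as well.
 */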

static unsigned virtqueue_enable_cb_prepare_split(struct virtqueue *_vq)
{
	struct vring_virtqueue *vq = to_vvq(_vq);
	u16 last_used_idx;

	START_USE(vq);

	/* We optimistically turn back on interrupts, then check if there was
	 * more to do. */
	/* Depending on the VIRTIO_RING_F_EVENT_IDX feature, we need to
	 * either clear the flags bit or point the event index at the next
	 * entry. Always do both to keep code simple. */
	if (vq->split.avail_flags_shadow & VRING_AVAIL_F_NO_INTERRUPT) {
		vq->split.avail_flags_shadow &= ~VRING_AVAIL_F_NO_INTERRUPT;
		if (!vq->event)
			vq->split.vring.avail->flags =
				cpu_to_virtio16(_vq->vdev,
						vq->split.avail_flags_shadow);
	}
	vring_used_event(&vq->split.vring) = cpu_to_virtio16(_vq->vdev,
			last_used_idx = vq->last_used_idx);
	END_USE(vq);
	return last_used_idx;
}

static bool virtqueue_poll_split(struct virtqueue *_vq, unsigned last_used_idx)
{
	struct vring_virtqueue *vq = to_vvq(_vq);

	return (u16)last_used_idx != virtio16_to_cpu(_vq->vdev,
			vq->split.vring.used->idx);
}

static bool virtqueue_enable_cb_delayed_split(struct virtqueue *_vq)
{
	struct vring_virtqueue *vq = to_vvq(_vq);
	u16 bufs;

	START_USE(vq);

	/* We optimistically turn back on interrupts, then check if there was
	 * more to do. */
	/* Depending on the VIRTIO_RING_F_USED_EVENT_IDX feature, we need to
	 * either clear the flags bit or point the event index at the next
	 * entry. Always update the event index to keep code simple. */
	if (vq->split.avail_flags_shadow & VRING_AVAIL_F_NO_INTERRUPT) {
		vq->split.avail_flags_shadow &= ~VRING_AVAIL_F_NO_INTERRUPT;
		if (!vq->event)
			vq->split.vring.avail->flags =
				cpu_to_virtio16(_vq->vdev,
						vq->split.avail_flags_shadow);
	}
	/* TODO: tune this threshold */
	bufs = (u16)(vq->split.avail_idx_shadow - vq->last_used_idx) * 3 / 4;

	virtio_store_mb(vq->weak_barriers,
			&vring_used_event(&vq->split.vring),
			cpu_to_virtio16(_vq->vdev, vq->last_used_idx + bufs));

	if (unlikely((u16)(virtio16_to_cpu(_vq->vdev, vq->split.vring.used->idx)
					- vq->last_used_idx) > bufs)) {
		END_USE(vq);
		return false;
	}

	END_USE(vq);
	return true;
}
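
/*
 * Worked example of the threshold above (illustrative numbers): with
 * avail_idx_shadow = 103 and last_used_idx = 3, bufs = 100 * 3 / 4 = 75,
 * so used_event is set to 78; if the device has already consumed past
 * that point (say used->idx = 80, making 77 > 75), we report "more work
 * pending" instead of waiting for an interrupt.
 */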

static void *virtqueue_detach_unused_buf_split(struct virtqueue *_vq)
{
	struct vring_virtqueue *vq = to_vvq(_vq);
	unsigned int i;
	void *buf;

	START_USE(vq);

	for (i = 0; i < vq->split.vring.num; i++) {
		if (!vq->desc_state[i].data)
			continue;
		/* detach_buf_split clears data, so grab it now. */
		buf = vq->desc_state[i].data;
		detach_buf_split(vq, i, NULL);
		vq->split.avail_idx_shadow--;
		vq->split.vring.avail->idx = cpu_to_virtio16(_vq->vdev,
				vq->split.avail_idx_shadow);
		END_USE(vq);
		return buf;
	}
	/* That should have freed everything. */
	BUG_ON(vq->vq.num_free != vq->split.vring.num);

	END_USE(vq);
	return NULL;
}


/*
 * Generic functions and exported symbols.
 */

static inline int virtqueue_add(struct virtqueue *_vq,
				struct scatterlist *sgs[],
				unsigned int total_sg,
				unsigned int out_sgs,
				unsigned int in_sgs,
				void *data,
				void *ctx,
				gfp_t gfp)
{
	return virtqueue_add_split(_vq, sgs, total_sg,
				   out_sgs, in_sgs, data, ctx, gfp);
}

/**
 * virtqueue_add_sgs - expose buffers to other end
 * @_vq: the struct virtqueue we're talking about.
 * @sgs: array of terminated scatterlists.
 * @out_sgs: the number of scatterlists readable by other side
 * @in_sgs: the number of scatterlists which are writable (after readable ones)
 * @data: the token identifying the buffer.
 * @gfp: how to do memory allocations (if necessary).
 *
 * Caller must ensure we don't call this with other virtqueue operations
 * at the same time (except where noted).
 *
 * Returns zero or a negative error (ie. ENOSPC, ENOMEM, EIO).
 */
int virtqueue_add_sgs(struct virtqueue *_vq,
		      struct scatterlist *sgs[],
		      unsigned int out_sgs,
		      unsigned int in_sgs,
		      void *data,
		      gfp_t gfp)
{
	unsigned int i, total_sg = 0;

	/* Count them first. */
	for (i = 0; i < out_sgs + in_sgs; i++) {
		struct scatterlist *sg;

		for (sg = sgs[i]; sg; sg = sg_next(sg))
			total_sg++;
	}
	return virtqueue_add(_vq, sgs, total_sg, out_sgs, in_sgs,
			     data, NULL, gfp);
}
EXPORT_SYMBOL_GPL(virtqueue_add_sgs);

/**
 * virtqueue_add_outbuf - expose output buffers to other end
 * @vq: the struct virtqueue we're talking about.
 * @sg: scatterlist (must be well-formed and terminated!)
 * @num: the number of entries in @sg readable by other side
 * @data: the token identifying the buffer.
 * @gfp: how to do memory allocations (if necessary).
 *
 * Caller must ensure we don't call this with other virtqueue operations
 * at the same time (except where noted).
 *
 * Returns zero or a negative error (ie. ENOSPC, ENOMEM, EIO).
 */
int virtqueue_add_outbuf(struct virtqueue *vq,
			 struct scatterlist *sg, unsigned int num,
			 void *data,
			 gfp_t gfp)
{
	return virtqueue_add(vq, &sg, num, 1, 0, data, NULL, gfp);
}
EXPORT_SYMBOL_GPL(virtqueue_add_outbuf);

/**
 * virtqueue_add_inbuf - expose input buffers to other end
 * @vq: the struct virtqueue we're talking about.
 * @sg: scatterlist (must be well-formed and terminated!)
 * @num: the number of entries in @sg writable by other side
 * @data: the token identifying the buffer.
 * @gfp: how to do memory allocations (if necessary).
 *
 * Caller must ensure we don't call this with other virtqueue operations
 * at the same time (except where noted).
 *
 * Returns zero or a negative error (ie. ENOSPC, ENOMEM, EIO).
 */
int virtqueue_add_inbuf(struct virtqueue *vq,
			struct scatterlist *sg, unsigned int num,
			void *data,
			gfp_t gfp)
{
	return virtqueue_add(vq, &sg, num, 0, 1, data, NULL, gfp);
}
EXPORT_SYMBOL_GPL(virtqueue_add_inbuf);
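
/*
 * Sketch of a typical caller (illustrative; "req", its fields and the
 * error handling are hypothetical): queue one device-readable header
 * and one device-writable status byte, using req itself as the token:
 *
 *	struct scatterlist hdr, status, *sgs[2];
 *
 *	sg_init_one(&hdr, &req->hdr, sizeof(req->hdr));
 *	sgs[0] = &hdr;
 *	sg_init_one(&status, &req->status, sizeof(req->status));
 *	sgs[1] = &status;
 *	err = virtqueue_add_sgs(vq, sgs, 1, 1, req, GFP_ATOMIC);
 */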

/**
 * virtqueue_add_inbuf_ctx - expose input buffers to other end
 * @vq: the struct virtqueue we're talking about.
 * @sg: scatterlist (must be well-formed and terminated!)
 * @num: the number of entries in @sg writable by other side
 * @data: the token identifying the buffer.
 * @ctx: extra context for the token
 * @gfp: how to do memory allocations (if necessary).
 *
 * Caller must ensure we don't call this with other virtqueue operations
 * at the same time (except where noted).
 *
 * Returns zero or a negative error (ie. ENOSPC, ENOMEM, EIO).
 */
int virtqueue_add_inbuf_ctx(struct virtqueue *vq,
			    struct scatterlist *sg, unsigned int num,
			    void *data,
			    void *ctx,
			    gfp_t gfp)
{
	return virtqueue_add(vq, &sg, num, 0, 1, data, ctx, gfp);
}
EXPORT_SYMBOL_GPL(virtqueue_add_inbuf_ctx);

/**
 * virtqueue_kick_prepare - first half of split virtqueue_kick call.
 * @_vq: the struct virtqueue
 *
 * Instead of virtqueue_kick(), you can do:
 *	if (virtqueue_kick_prepare(vq))
 *		virtqueue_notify(vq);
 *
 * This is sometimes useful because the virtqueue_kick_prepare() needs
 * to be serialized, but the actual virtqueue_notify() call does not.
 */
bool virtqueue_kick_prepare(struct virtqueue *_vq)
{
	return virtqueue_kick_prepare_split(_vq);
}
EXPORT_SYMBOL_GPL(virtqueue_kick_prepare);

/**
 * virtqueue_notify - second half of split virtqueue_kick call.
 * @_vq: the struct virtqueue
 *
 * This does not need to be serialized.
 *
 * Returns false if host notify failed or queue is broken, otherwise true.
 */
bool virtqueue_notify(struct virtqueue *_vq)
{
	struct vring_virtqueue *vq = to_vvq(_vq);

	if (unlikely(vq->broken))
		return false;

	/* Prod other side to tell it about changes. */
	if (!vq->notify(_vq)) {
		vq->broken = true;
		return false;
	}
	return true;
}
EXPORT_SYMBOL_GPL(virtqueue_notify);
895e6f633e5STiwei Bie */ 896e6f633e5STiwei Bie bool virtqueue_kick(struct virtqueue *vq) 897e6f633e5STiwei Bie { 898e6f633e5STiwei Bie if (virtqueue_kick_prepare(vq)) 899e6f633e5STiwei Bie return virtqueue_notify(vq); 900e6f633e5STiwei Bie return true; 901e6f633e5STiwei Bie } 902e6f633e5STiwei Bie EXPORT_SYMBOL_GPL(virtqueue_kick); 903e6f633e5STiwei Bie 904e6f633e5STiwei Bie /** 905e6f633e5STiwei Bie * virtqueue_get_buf - get the next used buffer 906e6f633e5STiwei Bie * @vq: the struct virtqueue we're talking about. 907e6f633e5STiwei Bie * @len: the length written into the buffer 908e6f633e5STiwei Bie * 909e6f633e5STiwei Bie * If the device wrote data into the buffer, @len will be set to the 910e6f633e5STiwei Bie * amount written. This means you don't need to clear the buffer 911e6f633e5STiwei Bie * beforehand to ensure there's no data leakage in the case of short 912e6f633e5STiwei Bie * writes. 913e6f633e5STiwei Bie * 914e6f633e5STiwei Bie * Caller must ensure we don't call this with other virtqueue 915e6f633e5STiwei Bie * operations at the same time (except where noted). 916e6f633e5STiwei Bie * 917e6f633e5STiwei Bie * Returns NULL if there are no used buffers, or the "data" token 918e6f633e5STiwei Bie * handed to virtqueue_add_*(). 919e6f633e5STiwei Bie */ 920e6f633e5STiwei Bie void *virtqueue_get_buf_ctx(struct virtqueue *_vq, unsigned int *len, 921e6f633e5STiwei Bie void **ctx) 922e6f633e5STiwei Bie { 923e6f633e5STiwei Bie return virtqueue_get_buf_ctx_split(_vq, len, ctx); 924e6f633e5STiwei Bie } 925e6f633e5STiwei Bie EXPORT_SYMBOL_GPL(virtqueue_get_buf_ctx); 926e6f633e5STiwei Bie 927e6f633e5STiwei Bie void *virtqueue_get_buf(struct virtqueue *_vq, unsigned int *len) 928e6f633e5STiwei Bie { 929e6f633e5STiwei Bie return virtqueue_get_buf_ctx(_vq, len, NULL); 930e6f633e5STiwei Bie } 931e6f633e5STiwei Bie EXPORT_SYMBOL_GPL(virtqueue_get_buf); 932e6f633e5STiwei Bie 933e6f633e5STiwei Bie /** 934e6f633e5STiwei Bie * virtqueue_disable_cb - disable callbacks 935e6f633e5STiwei Bie * @vq: the struct virtqueue we're talking about. 936e6f633e5STiwei Bie * 937e6f633e5STiwei Bie * Note that this is not necessarily synchronous, hence unreliable and only 938e6f633e5STiwei Bie * useful as an optimization. 939e6f633e5STiwei Bie * 940e6f633e5STiwei Bie * Unlike other operations, this need not be serialized. 941e6f633e5STiwei Bie */ 942e6f633e5STiwei Bie void virtqueue_disable_cb(struct virtqueue *_vq) 943e6f633e5STiwei Bie { 944e6f633e5STiwei Bie virtqueue_disable_cb_split(_vq); 945e6f633e5STiwei Bie } 946e6f633e5STiwei Bie EXPORT_SYMBOL_GPL(virtqueue_disable_cb); 947e6f633e5STiwei Bie 948e6f633e5STiwei Bie /** 949e6f633e5STiwei Bie * virtqueue_enable_cb_prepare - restart callbacks after disable_cb 950e6f633e5STiwei Bie * @vq: the struct virtqueue we're talking about. 951e6f633e5STiwei Bie * 952e6f633e5STiwei Bie * This re-enables callbacks; it returns current queue state 953e6f633e5STiwei Bie * in an opaque unsigned value. This value should be later tested by 954e6f633e5STiwei Bie * virtqueue_poll, to detect a possible race between the driver checking for 955e6f633e5STiwei Bie * more work, and enabling callbacks. 956e6f633e5STiwei Bie * 957e6f633e5STiwei Bie * Caller must ensure we don't call this with other virtqueue 958e6f633e5STiwei Bie * operations at the same time (except where noted). 
959e6f633e5STiwei Bie */ 960e6f633e5STiwei Bie unsigned virtqueue_enable_cb_prepare(struct virtqueue *_vq) 961e6f633e5STiwei Bie { 962e6f633e5STiwei Bie return virtqueue_enable_cb_prepare_split(_vq); 963e6f633e5STiwei Bie } 964e6f633e5STiwei Bie EXPORT_SYMBOL_GPL(virtqueue_enable_cb_prepare); 965e6f633e5STiwei Bie 966e6f633e5STiwei Bie /** 967e6f633e5STiwei Bie * virtqueue_poll - query pending used buffers 968e6f633e5STiwei Bie * @vq: the struct virtqueue we're talking about. 969e6f633e5STiwei Bie * @last_used_idx: virtqueue state (from call to virtqueue_enable_cb_prepare). 970e6f633e5STiwei Bie * 971e6f633e5STiwei Bie * Returns "true" if there are pending used buffers in the queue. 972e6f633e5STiwei Bie * 973e6f633e5STiwei Bie * This does not need to be serialized. 974e6f633e5STiwei Bie */ 975e6f633e5STiwei Bie bool virtqueue_poll(struct virtqueue *_vq, unsigned last_used_idx) 976e6f633e5STiwei Bie { 977e6f633e5STiwei Bie struct vring_virtqueue *vq = to_vvq(_vq); 978e6f633e5STiwei Bie 979e6f633e5STiwei Bie virtio_mb(vq->weak_barriers); 980e6f633e5STiwei Bie return virtqueue_poll_split(_vq, last_used_idx); 981e6f633e5STiwei Bie } 982e6f633e5STiwei Bie EXPORT_SYMBOL_GPL(virtqueue_poll); 983e6f633e5STiwei Bie 984e6f633e5STiwei Bie /** 985e6f633e5STiwei Bie * virtqueue_enable_cb - restart callbacks after disable_cb. 986e6f633e5STiwei Bie * @vq: the struct virtqueue we're talking about. 987e6f633e5STiwei Bie * 988e6f633e5STiwei Bie * This re-enables callbacks; it returns "false" if there are pending 989e6f633e5STiwei Bie * buffers in the queue, to detect a possible race between the driver 990e6f633e5STiwei Bie * checking for more work, and enabling callbacks. 991e6f633e5STiwei Bie * 992e6f633e5STiwei Bie * Caller must ensure we don't call this with other virtqueue 993e6f633e5STiwei Bie * operations at the same time (except where noted). 994e6f633e5STiwei Bie */ 995e6f633e5STiwei Bie bool virtqueue_enable_cb(struct virtqueue *_vq) 996e6f633e5STiwei Bie { 997e6f633e5STiwei Bie unsigned last_used_idx = virtqueue_enable_cb_prepare(_vq); 998e6f633e5STiwei Bie 999e6f633e5STiwei Bie return !virtqueue_poll(_vq, last_used_idx); 1000e6f633e5STiwei Bie } 1001e6f633e5STiwei Bie EXPORT_SYMBOL_GPL(virtqueue_enable_cb); 1002e6f633e5STiwei Bie 1003e6f633e5STiwei Bie /** 1004e6f633e5STiwei Bie * virtqueue_enable_cb_delayed - restart callbacks after disable_cb. 1005e6f633e5STiwei Bie * @vq: the struct virtqueue we're talking about. 1006e6f633e5STiwei Bie * 1007e6f633e5STiwei Bie * This re-enables callbacks but hints to the other side to delay 1008e6f633e5STiwei Bie * interrupts until most of the available buffers have been processed; 1009e6f633e5STiwei Bie * it returns "false" if there are many pending buffers in the queue, 1010e6f633e5STiwei Bie * to detect a possible race between the driver checking for more work, 1011e6f633e5STiwei Bie * and enabling callbacks. 1012e6f633e5STiwei Bie * 1013e6f633e5STiwei Bie * Caller must ensure we don't call this with other virtqueue 1014e6f633e5STiwei Bie * operations at the same time (except where noted). 
1015e6f633e5STiwei Bie */ 1016e6f633e5STiwei Bie bool virtqueue_enable_cb_delayed(struct virtqueue *_vq) 1017e6f633e5STiwei Bie { 1018e6f633e5STiwei Bie return virtqueue_enable_cb_delayed_split(_vq); 1019e6f633e5STiwei Bie } 1020e6f633e5STiwei Bie EXPORT_SYMBOL_GPL(virtqueue_enable_cb_delayed); 1021e6f633e5STiwei Bie 1022138fd251STiwei Bie /** 1023138fd251STiwei Bie * virtqueue_detach_unused_buf - detach first unused buffer 1024138fd251STiwei Bie * @vq: the struct virtqueue we're talking about. 1025138fd251STiwei Bie * 1026138fd251STiwei Bie * Returns NULL or the "data" token handed to virtqueue_add_*(). 1027138fd251STiwei Bie * This is not valid on an active queue; it is useful only for device 1028138fd251STiwei Bie * shutdown. 1029138fd251STiwei Bie */ 1030138fd251STiwei Bie void *virtqueue_detach_unused_buf(struct virtqueue *_vq) 1031138fd251STiwei Bie { 1032138fd251STiwei Bie return virtqueue_detach_unused_buf_split(_vq); 1033138fd251STiwei Bie } 10347c5e9ed0SMichael S. Tsirkin EXPORT_SYMBOL_GPL(virtqueue_detach_unused_buf); 1035c021eac4SShirley Ma 1036138fd251STiwei Bie static inline bool more_used(const struct vring_virtqueue *vq) 1037138fd251STiwei Bie { 1038138fd251STiwei Bie return more_used_split(vq); 1039138fd251STiwei Bie } 1040138fd251STiwei Bie 10410a8a69ddSRusty Russell irqreturn_t vring_interrupt(int irq, void *_vq) 10420a8a69ddSRusty Russell { 10430a8a69ddSRusty Russell struct vring_virtqueue *vq = to_vvq(_vq); 10440a8a69ddSRusty Russell 10450a8a69ddSRusty Russell if (!more_used(vq)) { 10460a8a69ddSRusty Russell pr_debug("virtqueue interrupt with no work for %p\n", vq); 10470a8a69ddSRusty Russell return IRQ_NONE; 10480a8a69ddSRusty Russell } 10490a8a69ddSRusty Russell 10500a8a69ddSRusty Russell if (unlikely(vq->broken)) 10510a8a69ddSRusty Russell return IRQ_HANDLED; 10520a8a69ddSRusty Russell 10530a8a69ddSRusty Russell pr_debug("virtqueue callback for %p (%p)\n", vq, vq->vq.callback); 105418445c4dSRusty Russell if (vq->vq.callback) 105518445c4dSRusty Russell vq->vq.callback(&vq->vq); 10560a8a69ddSRusty Russell 10570a8a69ddSRusty Russell return IRQ_HANDLED; 10580a8a69ddSRusty Russell } 1059c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_interrupt); 10600a8a69ddSRusty Russell 10612a2d1382SAndy Lutomirski struct virtqueue *__vring_new_virtqueue(unsigned int index, 10622a2d1382SAndy Lutomirski struct vring vring, 10630a8a69ddSRusty Russell struct virtio_device *vdev, 10647b21e34fSRusty Russell bool weak_barriers, 1065f94682ddSMichael S. 

struct virtqueue *__vring_new_virtqueue(unsigned int index,
					struct vring vring,
					struct virtio_device *vdev,
					bool weak_barriers,
					bool context,
					bool (*notify)(struct virtqueue *),
					void (*callback)(struct virtqueue *),
					const char *name)
{
	unsigned int i;
	struct vring_virtqueue *vq;

	vq = kmalloc(sizeof(*vq) + vring.num * sizeof(struct vring_desc_state),
		     GFP_KERNEL);
	if (!vq)
		return NULL;

	vq->vq.callback = callback;
	vq->vq.vdev = vdev;
	vq->vq.name = name;
	vq->vq.num_free = vring.num;
	vq->vq.index = index;
	vq->we_own_ring = false;
	vq->queue_dma_addr = 0;
	vq->queue_size_in_bytes = 0;
	vq->notify = notify;
	vq->weak_barriers = weak_barriers;
	vq->broken = false;
	vq->last_used_idx = 0;
	vq->num_added = 0;
	list_add_tail(&vq->vq.list, &vdev->vqs);
#ifdef DEBUG
	vq->in_use = false;
	vq->last_add_time_valid = false;
#endif

	vq->indirect = virtio_has_feature(vdev, VIRTIO_RING_F_INDIRECT_DESC) &&
		!context;
	vq->event = virtio_has_feature(vdev, VIRTIO_RING_F_EVENT_IDX);

	vq->split.vring = vring;
	vq->split.avail_flags_shadow = 0;
	vq->split.avail_idx_shadow = 0;

	/* No callback?  Tell other side not to bother us. */
	if (!callback) {
		vq->split.avail_flags_shadow |= VRING_AVAIL_F_NO_INTERRUPT;
		if (!vq->event)
			vq->split.vring.avail->flags = cpu_to_virtio16(vdev,
					vq->split.avail_flags_shadow);
	}

	/* Put everything in free lists. */
	vq->free_head = 0;
	for (i = 0; i < vring.num-1; i++)
		vq->split.vring.desc[i].next = cpu_to_virtio16(vdev, i + 1);
	memset(vq->desc_state, 0, vring.num * sizeof(struct vring_desc_state));

	return &vq->vq;
}
EXPORT_SYMBOL_GPL(__vring_new_virtqueue);
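
/*
 * Worked example of the free-list init above (illustrative, vring.num = 4):
 * desc[0].next = 1, desc[1].next = 2, desc[2].next = 3 and free_head = 0,
 * so the whole descriptor table forms a single free chain threaded
 * through the ->next fields.
 */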
11232a2d1382SAndy Lutomirski static void *vring_alloc_queue(struct virtio_device *vdev, size_t size,
11242a2d1382SAndy Lutomirski                                dma_addr_t *dma_handle, gfp_t flag)
11252a2d1382SAndy Lutomirski {
11262a2d1382SAndy Lutomirski         if (vring_use_dma_api(vdev)) {
11272a2d1382SAndy Lutomirski                 return dma_alloc_coherent(vdev->dev.parent, size,
11282a2d1382SAndy Lutomirski                                           dma_handle, flag);
11292a2d1382SAndy Lutomirski         } else {
11302a2d1382SAndy Lutomirski                 void *queue = alloc_pages_exact(PAGE_ALIGN(size), flag);
11312a2d1382SAndy Lutomirski                 if (queue) {
11322a2d1382SAndy Lutomirski                         phys_addr_t phys_addr = virt_to_phys(queue);
11332a2d1382SAndy Lutomirski                         *dma_handle = (dma_addr_t)phys_addr;
11342a2d1382SAndy Lutomirski 
11352a2d1382SAndy Lutomirski                         /*
11362a2d1382SAndy Lutomirski                          * Sanity check: make sure we didn't truncate
11372a2d1382SAndy Lutomirski                          * the address. The only arches I can find that
11382a2d1382SAndy Lutomirski                          * have 64-bit phys_addr_t but 32-bit dma_addr_t
11392a2d1382SAndy Lutomirski                          * are certain non-highmem MIPS and x86
11402a2d1382SAndy Lutomirski                          * configurations, but these configurations
11412a2d1382SAndy Lutomirski                          * should never allocate physical pages above 32
11422a2d1382SAndy Lutomirski                          * bits, so this is fine. Just in case, throw a
11432a2d1382SAndy Lutomirski                          * warning and abort if we end up with an
11442a2d1382SAndy Lutomirski                          * unrepresentable address.
11452a2d1382SAndy Lutomirski                          */
11462a2d1382SAndy Lutomirski                         if (WARN_ON_ONCE(*dma_handle != phys_addr)) {
11472a2d1382SAndy Lutomirski                                 free_pages_exact(queue, PAGE_ALIGN(size));
11482a2d1382SAndy Lutomirski                                 return NULL;
11492a2d1382SAndy Lutomirski                         }
11502a2d1382SAndy Lutomirski                 }
11512a2d1382SAndy Lutomirski                 return queue;
11522a2d1382SAndy Lutomirski         }
11532a2d1382SAndy Lutomirski }
11542a2d1382SAndy Lutomirski 
11552a2d1382SAndy Lutomirski static void vring_free_queue(struct virtio_device *vdev, size_t size,
11562a2d1382SAndy Lutomirski                              void *queue, dma_addr_t dma_handle)
11572a2d1382SAndy Lutomirski {
11582a2d1382SAndy Lutomirski         if (vring_use_dma_api(vdev)) {
11592a2d1382SAndy Lutomirski                 dma_free_coherent(vdev->dev.parent, size, queue, dma_handle);
11602a2d1382SAndy Lutomirski         } else {
11612a2d1382SAndy Lutomirski                 free_pages_exact(queue, PAGE_ALIGN(size));
11622a2d1382SAndy Lutomirski         }
11632a2d1382SAndy Lutomirski }
11642a2d1382SAndy Lutomirski 
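/*
 * Worked size example (an illustration, assuming the classic split-ring
 * layout that vring_size()/vring_init() use: descriptor table, then
 * avail ring, then the used ring aligned to vring_align).  With
 * VIRTIO_RING_F_EVENT_IDX negotiated, num = 256 and vring_align = 4096:
 *
 *         desc:  16 * 256              = 4096 bytes
 *         avail:  2 * (3 + 256)        =  518 bytes
 *         align(4096 + 518, 4096)      = 8192 bytes
 *         used:   2 * 3 + 8 * 256      = 2054 bytes
 *         vring_size(256, 4096)        = 10246 bytes total
 *
 * This growth is why vring_create_virtqueue() below keeps halving num
 * when a large contiguous allocation fails.
 */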
11652a2d1382SAndy Lutomirski struct virtqueue *vring_create_virtqueue(
11662a2d1382SAndy Lutomirski         unsigned int index,
11672a2d1382SAndy Lutomirski         unsigned int num,
11682a2d1382SAndy Lutomirski         unsigned int vring_align,
11692a2d1382SAndy Lutomirski         struct virtio_device *vdev,
11702a2d1382SAndy Lutomirski         bool weak_barriers,
11712a2d1382SAndy Lutomirski         bool may_reduce_num,
1172f94682ddSMichael S. Tsirkin         bool context,
11732a2d1382SAndy Lutomirski         bool (*notify)(struct virtqueue *),
11742a2d1382SAndy Lutomirski         void (*callback)(struct virtqueue *),
11752a2d1382SAndy Lutomirski         const char *name)
11762a2d1382SAndy Lutomirski {
11772a2d1382SAndy Lutomirski         struct virtqueue *vq;
1178e00f7bd2SDan Carpenter         void *queue = NULL;
11792a2d1382SAndy Lutomirski         dma_addr_t dma_addr;
11802a2d1382SAndy Lutomirski         size_t queue_size_in_bytes;
11812a2d1382SAndy Lutomirski         struct vring vring;
11822a2d1382SAndy Lutomirski 
11832a2d1382SAndy Lutomirski         /* We assume num is a power of 2. */
11842a2d1382SAndy Lutomirski         if (num & (num - 1)) {
11852a2d1382SAndy Lutomirski                 dev_warn(&vdev->dev, "Bad virtqueue length %u\n", num);
11862a2d1382SAndy Lutomirski                 return NULL;
11872a2d1382SAndy Lutomirski         }
11882a2d1382SAndy Lutomirski 
11892a2d1382SAndy Lutomirski         /* TODO: allocate each queue chunk individually */
11902a2d1382SAndy Lutomirski         for (; num && vring_size(num, vring_align) > PAGE_SIZE; num /= 2) {
11912a2d1382SAndy Lutomirski                 queue = vring_alloc_queue(vdev, vring_size(num, vring_align),
11922a2d1382SAndy Lutomirski                                           &dma_addr,
11932a2d1382SAndy Lutomirski                                           GFP_KERNEL|__GFP_NOWARN|__GFP_ZERO);
11942a2d1382SAndy Lutomirski                 if (queue)
11952a2d1382SAndy Lutomirski                         break;
11962a2d1382SAndy Lutomirski         }
11972a2d1382SAndy Lutomirski 
11982a2d1382SAndy Lutomirski         if (!num)
11992a2d1382SAndy Lutomirski                 return NULL;
12002a2d1382SAndy Lutomirski 
12012a2d1382SAndy Lutomirski         if (!queue) {
12022a2d1382SAndy Lutomirski                 /* Try to get a single page. You are my only hope! */
12032a2d1382SAndy Lutomirski                 queue = vring_alloc_queue(vdev, vring_size(num, vring_align),
12042a2d1382SAndy Lutomirski                                           &dma_addr, GFP_KERNEL|__GFP_ZERO);
12052a2d1382SAndy Lutomirski         }
12062a2d1382SAndy Lutomirski         if (!queue)
12072a2d1382SAndy Lutomirski                 return NULL;
12082a2d1382SAndy Lutomirski 
12092a2d1382SAndy Lutomirski         queue_size_in_bytes = vring_size(num, vring_align);
12102a2d1382SAndy Lutomirski         vring_init(&vring, num, queue, vring_align);
12112a2d1382SAndy Lutomirski 
1212f94682ddSMichael S. Tsirkin         vq = __vring_new_virtqueue(index, vring, vdev, weak_barriers, context,
12132a2d1382SAndy Lutomirski                                    notify, callback, name);
12142a2d1382SAndy Lutomirski         if (!vq) {
12152a2d1382SAndy Lutomirski                 vring_free_queue(vdev, queue_size_in_bytes, queue,
12162a2d1382SAndy Lutomirski                                  dma_addr);
12172a2d1382SAndy Lutomirski                 return NULL;
12182a2d1382SAndy Lutomirski         }
12192a2d1382SAndy Lutomirski 
12202a2d1382SAndy Lutomirski         to_vvq(vq)->queue_dma_addr = dma_addr;
12212a2d1382SAndy Lutomirski         to_vvq(vq)->queue_size_in_bytes = queue_size_in_bytes;
12222a2d1382SAndy Lutomirski         to_vvq(vq)->we_own_ring = true;
12232a2d1382SAndy Lutomirski 
12242a2d1382SAndy Lutomirski         return vq;
12252a2d1382SAndy Lutomirski }
12262a2d1382SAndy Lutomirski EXPORT_SYMBOL_GPL(vring_create_virtqueue);
12272a2d1382SAndy Lutomirski 
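/*
 * Illustrative example (a sketch under assumed names, not code from this
 * file): the common transport path lets this code own the ring memory;
 * the queue size, alignment and callbacks are placeholders:
 *
 *         vq = vring_create_virtqueue(index, 256, SMP_CACHE_BYTES, vdev,
 *                                     true, true, false,
 *                                     my_notify, my_callback, "requestq");
 *         if (!vq)
 *                 return ERR_PTR(-ENOMEM);
 *
 * The transport can then use virtqueue_get_desc_addr() and friends (see
 * the end of this file) to tell the device where the ring lives.
 */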
12282a2d1382SAndy Lutomirski struct virtqueue *vring_new_virtqueue(unsigned int index,
12292a2d1382SAndy Lutomirski                                       unsigned int num,
12302a2d1382SAndy Lutomirski                                       unsigned int vring_align,
12312a2d1382SAndy Lutomirski                                       struct virtio_device *vdev,
12322a2d1382SAndy Lutomirski                                       bool weak_barriers,
1233f94682ddSMichael S. Tsirkin                                       bool context,
12342a2d1382SAndy Lutomirski                                       void *pages,
12352a2d1382SAndy Lutomirski                                       bool (*notify)(struct virtqueue *vq),
12362a2d1382SAndy Lutomirski                                       void (*callback)(struct virtqueue *vq),
12372a2d1382SAndy Lutomirski                                       const char *name)
12382a2d1382SAndy Lutomirski {
12392a2d1382SAndy Lutomirski         struct vring vring;
12402a2d1382SAndy Lutomirski         vring_init(&vring, num, pages, vring_align);
1241f94682ddSMichael S. Tsirkin         return __vring_new_virtqueue(index, vring, vdev, weak_barriers, context,
12422a2d1382SAndy Lutomirski                                      notify, callback, name);
12432a2d1382SAndy Lutomirski }
1244c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_new_virtqueue);
12450a8a69ddSRusty Russell 
12462a2d1382SAndy Lutomirski void vring_del_virtqueue(struct virtqueue *_vq)
12470a8a69ddSRusty Russell {
12482a2d1382SAndy Lutomirski         struct vring_virtqueue *vq = to_vvq(_vq);
12492a2d1382SAndy Lutomirski 
12502a2d1382SAndy Lutomirski         if (vq->we_own_ring) {
12512a2d1382SAndy Lutomirski                 vring_free_queue(vq->vq.vdev, vq->queue_size_in_bytes,
1252e593bf97STiwei Bie                                  vq->split.vring.desc, vq->queue_dma_addr);
12532a2d1382SAndy Lutomirski         }
12542a2d1382SAndy Lutomirski         list_del(&_vq->list);
12552a2d1382SAndy Lutomirski         kfree(vq);
12560a8a69ddSRusty Russell }
1257c6fd4701SRusty Russell EXPORT_SYMBOL_GPL(vring_del_virtqueue);
12580a8a69ddSRusty Russell 
1259e34f8725SRusty Russell /* Manipulates transport-specific feature bits. */
1260e34f8725SRusty Russell void vring_transport_features(struct virtio_device *vdev)
1261e34f8725SRusty Russell {
1262e34f8725SRusty Russell         unsigned int i;
1263e34f8725SRusty Russell 
1264e34f8725SRusty Russell         for (i = VIRTIO_TRANSPORT_F_START; i < VIRTIO_TRANSPORT_F_END; i++) {
1265e34f8725SRusty Russell                 switch (i) {
12669fa29b9dSMark McLoughlin                 case VIRTIO_RING_F_INDIRECT_DESC:
12679fa29b9dSMark McLoughlin                         break;
1268a5c262c5SMichael S. Tsirkin                 case VIRTIO_RING_F_EVENT_IDX:
1269a5c262c5SMichael S. Tsirkin                         break;
1270747ae34aSMichael S. Tsirkin                 case VIRTIO_F_VERSION_1:
1271747ae34aSMichael S. Tsirkin                         break;
12721a937693SMichael S. Tsirkin                 case VIRTIO_F_IOMMU_PLATFORM:
12731a937693SMichael S. Tsirkin                         break;
1274e34f8725SRusty Russell                 default:
1275e34f8725SRusty Russell                         /* We don't understand this bit. */
1276e16e12beSMichael S. Tsirkin                         __virtio_clear_bit(vdev, i);
1277e34f8725SRusty Russell                 }
1278e34f8725SRusty Russell         }
1279e34f8725SRusty Russell }
1280e34f8725SRusty Russell EXPORT_SYMBOL_GPL(vring_transport_features);
1281e34f8725SRusty Russell 
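/*
 * Illustrative example (a sketch, not code from this file): a transport
 * typically calls vring_transport_features() from its .finalize_features
 * hook, so that only ring features this code understands survive
 * negotiation; "my_finalize_features" is a placeholder name:
 *
 *         static int my_finalize_features(struct virtio_device *vdev)
 *         {
 *                 vring_transport_features(vdev);
 *                 return 0;
 *         }
 */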
12885dfc1762SRusty Russell  */
12898f9f4668SRick Jones unsigned int virtqueue_get_vring_size(struct virtqueue *_vq)
12908f9f4668SRick Jones {
12918f9f4668SRick Jones 
12928f9f4668SRick Jones         struct vring_virtqueue *vq = to_vvq(_vq);
12938f9f4668SRick Jones 
1294e593bf97STiwei Bie         return vq->split.vring.num;
12958f9f4668SRick Jones }
12968f9f4668SRick Jones EXPORT_SYMBOL_GPL(virtqueue_get_vring_size);
12978f9f4668SRick Jones 
1298b3b32c94SHeinz Graalfs bool virtqueue_is_broken(struct virtqueue *_vq)
1299b3b32c94SHeinz Graalfs {
1300b3b32c94SHeinz Graalfs         struct vring_virtqueue *vq = to_vvq(_vq);
1301b3b32c94SHeinz Graalfs 
1302b3b32c94SHeinz Graalfs         return vq->broken;
1303b3b32c94SHeinz Graalfs }
1304b3b32c94SHeinz Graalfs EXPORT_SYMBOL_GPL(virtqueue_is_broken);
1305b3b32c94SHeinz Graalfs 
1306e2dcdfe9SRusty Russell /*
1307e2dcdfe9SRusty Russell  * This should prevent the device from being used, allowing drivers to
1308e2dcdfe9SRusty Russell  * recover. You may need to grab appropriate locks to flush.
1309e2dcdfe9SRusty Russell  */
1310e2dcdfe9SRusty Russell void virtio_break_device(struct virtio_device *dev)
1311e2dcdfe9SRusty Russell {
1312e2dcdfe9SRusty Russell         struct virtqueue *_vq;
1313e2dcdfe9SRusty Russell 
1314e2dcdfe9SRusty Russell         list_for_each_entry(_vq, &dev->vqs, list) {
1315e2dcdfe9SRusty Russell                 struct vring_virtqueue *vq = to_vvq(_vq);
1316e2dcdfe9SRusty Russell                 vq->broken = true;
1317e2dcdfe9SRusty Russell         }
1318e2dcdfe9SRusty Russell }
1319e2dcdfe9SRusty Russell EXPORT_SYMBOL_GPL(virtio_break_device);
1320e2dcdfe9SRusty Russell 
13212a2d1382SAndy Lutomirski dma_addr_t virtqueue_get_desc_addr(struct virtqueue *_vq)
132289062652SCornelia Huck {
132389062652SCornelia Huck         struct vring_virtqueue *vq = to_vvq(_vq);
132489062652SCornelia Huck 
13252a2d1382SAndy Lutomirski         BUG_ON(!vq->we_own_ring);
132689062652SCornelia Huck 
13272a2d1382SAndy Lutomirski         return vq->queue_dma_addr;
13282a2d1382SAndy Lutomirski }
13292a2d1382SAndy Lutomirski EXPORT_SYMBOL_GPL(virtqueue_get_desc_addr);
13302a2d1382SAndy Lutomirski 
13312a2d1382SAndy Lutomirski dma_addr_t virtqueue_get_avail_addr(struct virtqueue *_vq)
133289062652SCornelia Huck {
133389062652SCornelia Huck         struct vring_virtqueue *vq = to_vvq(_vq);
133489062652SCornelia Huck 
13352a2d1382SAndy Lutomirski         BUG_ON(!vq->we_own_ring);
13362a2d1382SAndy Lutomirski 
13372a2d1382SAndy Lutomirski         return vq->queue_dma_addr +
1338e593bf97STiwei Bie                 ((char *)vq->split.vring.avail - (char *)vq->split.vring.desc);
133989062652SCornelia Huck }
13402a2d1382SAndy Lutomirski EXPORT_SYMBOL_GPL(virtqueue_get_avail_addr);
13412a2d1382SAndy Lutomirski 
13422a2d1382SAndy Lutomirski dma_addr_t virtqueue_get_used_addr(struct virtqueue *_vq)
13432a2d1382SAndy Lutomirski {
13442a2d1382SAndy Lutomirski         struct vring_virtqueue *vq = to_vvq(_vq);
13452a2d1382SAndy Lutomirski 
13462a2d1382SAndy Lutomirski         BUG_ON(!vq->we_own_ring);
13472a2d1382SAndy Lutomirski 
13482a2d1382SAndy Lutomirski         return vq->queue_dma_addr +
1349e593bf97STiwei Bie                 ((char *)vq->split.vring.used - (char *)vq->split.vring.desc);
13502a2d1382SAndy Lutomirski }
13512a2d1382SAndy Lutomirski EXPORT_SYMBOL_GPL(virtqueue_get_used_addr);
13522a2d1382SAndy Lutomirski 
13532a2d1382SAndy Lutomirski const struct vring *virtqueue_get_vring(struct virtqueue *vq)
13542a2d1382SAndy Lutomirski {
1355e593bf97STiwei Bie         return &to_vvq(vq)->split.vring;
13562a2d1382SAndy Lutomirski }
13572a2d1382SAndy Lutomirski EXPORT_SYMBOL_GPL(virtqueue_get_vring);
135889062652SCornelia Huck 
1359c6fd4701SRusty Russell MODULE_LICENSE("GPL");
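/*
 * Illustrative example (a sketch under assumed names, not code from this
 * file): a transport publishes the addresses returned by the helpers
 * above when programming the device.  The register offsets are
 * placeholders, not a real device interface:
 *
 *         writeq(virtqueue_get_desc_addr(vq),  base + MY_QUEUE_DESC);
 *         writeq(virtqueue_get_avail_addr(vq), base + MY_QUEUE_AVAIL);
 *         writeq(virtqueue_get_used_addr(vq),  base + MY_QUEUE_USED);
 *
 * Note these helpers BUG() unless the ring was allocated by
 * vring_create_virtqueue() (we_own_ring), since only then are the DMA
 * addresses this code recorded meaningful.
 */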