19fbe302bSMichael S. Tsirkin #ifndef _LINUX_VIRTIO_RING_H 29fbe302bSMichael S. Tsirkin #define _LINUX_VIRTIO_RING_H 3d4083f50SAlexey Perevalov /* An interface for efficient virtio implementation, currently for use by KVM, 4d4083f50SAlexey Perevalov * but hopefully others soon. Do NOT change this since it will 59fbe302bSMichael S. Tsirkin * break existing servers and clients. 69fbe302bSMichael S. Tsirkin * 79fbe302bSMichael S. Tsirkin * This header is BSD licensed so anyone can use the definitions to implement 89fbe302bSMichael S. Tsirkin * compatible drivers/servers. 99fbe302bSMichael S. Tsirkin * 109fbe302bSMichael S. Tsirkin * Redistribution and use in source and binary forms, with or without 119fbe302bSMichael S. Tsirkin * modification, are permitted provided that the following conditions 129fbe302bSMichael S. Tsirkin * are met: 139fbe302bSMichael S. Tsirkin * 1. Redistributions of source code must retain the above copyright 149fbe302bSMichael S. Tsirkin * notice, this list of conditions and the following disclaimer. 159fbe302bSMichael S. Tsirkin * 2. Redistributions in binary form must reproduce the above copyright 169fbe302bSMichael S. Tsirkin * notice, this list of conditions and the following disclaimer in the 179fbe302bSMichael S. Tsirkin * documentation and/or other materials provided with the distribution. 189fbe302bSMichael S. Tsirkin * 3. Neither the name of IBM nor the names of its contributors 199fbe302bSMichael S. Tsirkin * may be used to endorse or promote products derived from this software 209fbe302bSMichael S. Tsirkin * without specific prior written permission. 219fbe302bSMichael S. Tsirkin * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS ``AS IS'' AND 229fbe302bSMichael S. Tsirkin * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 239fbe302bSMichael S. Tsirkin * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 249fbe302bSMichael S. Tsirkin * ARE DISCLAIMED. IN NO EVENT SHALL IBM OR CONTRIBUTORS BE LIABLE 259fbe302bSMichael S. Tsirkin * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 269fbe302bSMichael S. Tsirkin * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 279fbe302bSMichael S. Tsirkin * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 289fbe302bSMichael S. Tsirkin * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 299fbe302bSMichael S. Tsirkin * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 309fbe302bSMichael S. Tsirkin * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 319fbe302bSMichael S. Tsirkin * SUCH DAMAGE. 329fbe302bSMichael S. Tsirkin * 339fbe302bSMichael S. Tsirkin * Copyright Rusty Russell IBM Corporation 2007. */ 34120758fbSPaolo Bonzini #include <stdint.h> 359fbe302bSMichael S. Tsirkin #include "standard-headers/linux/types.h" 369fbe302bSMichael S. Tsirkin #include "standard-headers/linux/virtio_types.h" 379fbe302bSMichael S. Tsirkin 389fbe302bSMichael S. Tsirkin /* This marks a buffer as continuing via the next field. */ 399fbe302bSMichael S. Tsirkin #define VRING_DESC_F_NEXT 1 409fbe302bSMichael S. Tsirkin /* This marks a buffer as write-only (otherwise read-only). */ 419fbe302bSMichael S. Tsirkin #define VRING_DESC_F_WRITE 2 429fbe302bSMichael S. Tsirkin /* This means the buffer contains a list of buffer descriptors. */ 439fbe302bSMichael S. Tsirkin #define VRING_DESC_F_INDIRECT 4 449fbe302bSMichael S. Tsirkin 45da054c64SPaolo Bonzini /* 46da054c64SPaolo Bonzini * Mark a descriptor as available or used in packed ring. 47da054c64SPaolo Bonzini * Notice: they are defined as shifts instead of shifted values. 48da054c64SPaolo Bonzini */ 49da054c64SPaolo Bonzini #define VRING_PACKED_DESC_F_AVAIL 7 50da054c64SPaolo Bonzini #define VRING_PACKED_DESC_F_USED 15 51da054c64SPaolo Bonzini 529fbe302bSMichael S. Tsirkin /* The Host uses this in used->flags to advise the Guest: don't kick me when 539fbe302bSMichael S. Tsirkin * you add a buffer. It's unreliable, so it's simply an optimization. Guest 549fbe302bSMichael S. Tsirkin * will still kick if it's out of buffers. */ 559fbe302bSMichael S. Tsirkin #define VRING_USED_F_NO_NOTIFY 1 569fbe302bSMichael S. Tsirkin /* The Guest uses this in avail->flags to advise the Host: don't interrupt me 579fbe302bSMichael S. Tsirkin * when you consume a buffer. It's unreliable, so it's simply an 589fbe302bSMichael S. Tsirkin * optimization. */ 599fbe302bSMichael S. Tsirkin #define VRING_AVAIL_F_NO_INTERRUPT 1 609fbe302bSMichael S. Tsirkin 61da054c64SPaolo Bonzini /* Enable events in packed ring. */ 62da054c64SPaolo Bonzini #define VRING_PACKED_EVENT_FLAG_ENABLE 0x0 63da054c64SPaolo Bonzini /* Disable events in packed ring. */ 64da054c64SPaolo Bonzini #define VRING_PACKED_EVENT_FLAG_DISABLE 0x1 65da054c64SPaolo Bonzini /* 66da054c64SPaolo Bonzini * Enable events for a specific descriptor in packed ring. 67da054c64SPaolo Bonzini * (as specified by Descriptor Ring Change Event Offset/Wrap Counter). 68da054c64SPaolo Bonzini * Only valid if VIRTIO_RING_F_EVENT_IDX has been negotiated. 69da054c64SPaolo Bonzini */ 70da054c64SPaolo Bonzini #define VRING_PACKED_EVENT_FLAG_DESC 0x2 71da054c64SPaolo Bonzini 72da054c64SPaolo Bonzini /* 73da054c64SPaolo Bonzini * Wrap counter bit shift in event suppression structure 74da054c64SPaolo Bonzini * of packed ring. 75da054c64SPaolo Bonzini */ 76da054c64SPaolo Bonzini #define VRING_PACKED_EVENT_F_WRAP_CTR 15 77da054c64SPaolo Bonzini 789fbe302bSMichael S. Tsirkin /* We support indirect buffer descriptors */ 799fbe302bSMichael S. Tsirkin #define VIRTIO_RING_F_INDIRECT_DESC 28 809fbe302bSMichael S. Tsirkin 819fbe302bSMichael S. Tsirkin /* The Guest publishes the used index for which it expects an interrupt 829fbe302bSMichael S. Tsirkin * at the end of the avail ring. Host should ignore the avail->flags field. */ 839fbe302bSMichael S. Tsirkin /* The Host publishes the avail index for which it expects a kick 849fbe302bSMichael S. Tsirkin * at the end of the used ring. Guest should ignore the used->flags field. */ 859fbe302bSMichael S. Tsirkin #define VIRTIO_RING_F_EVENT_IDX 29 869fbe302bSMichael S. Tsirkin 87f76b348eSCornelia Huck /* Alignment requirements for vring elements. 88f76b348eSCornelia Huck * When using pre-virtio 1.0 layout, these fall out naturally. 89f76b348eSCornelia Huck */ 90f76b348eSCornelia Huck #define VRING_AVAIL_ALIGN_SIZE 2 91f76b348eSCornelia Huck #define VRING_USED_ALIGN_SIZE 4 92f76b348eSCornelia Huck #define VRING_DESC_ALIGN_SIZE 16 93f76b348eSCornelia Huck 94*d525f73fSChenyi Qiang /** 95*d525f73fSChenyi Qiang * struct vring_desc - Virtio ring descriptors, 96*d525f73fSChenyi Qiang * 16 bytes long. These can chain together via @next. 97*d525f73fSChenyi Qiang * 98*d525f73fSChenyi Qiang * @addr: buffer address (guest-physical) 99*d525f73fSChenyi Qiang * @len: buffer length 100*d525f73fSChenyi Qiang * @flags: descriptor flags 101*d525f73fSChenyi Qiang * @next: index of the next descriptor in the chain, 102*d525f73fSChenyi Qiang * if the VRING_DESC_F_NEXT flag is set. We chain unused 103*d525f73fSChenyi Qiang * descriptors via this, too. 104*d525f73fSChenyi Qiang */ 1059fbe302bSMichael S. Tsirkin struct vring_desc { 1069fbe302bSMichael S. Tsirkin __virtio64 addr; 1079fbe302bSMichael S. Tsirkin __virtio32 len; 1089fbe302bSMichael S. Tsirkin __virtio16 flags; 1099fbe302bSMichael S. Tsirkin __virtio16 next; 1109fbe302bSMichael S. Tsirkin }; 1119fbe302bSMichael S. Tsirkin 1129fbe302bSMichael S. Tsirkin struct vring_avail { 1139fbe302bSMichael S. Tsirkin __virtio16 flags; 1149fbe302bSMichael S. Tsirkin __virtio16 idx; 1159fbe302bSMichael S. Tsirkin __virtio16 ring[]; 1169fbe302bSMichael S. Tsirkin }; 1179fbe302bSMichael S. Tsirkin 1189f2d175dSPaolo Bonzini /* uint32_t is used here for ids for padding reasons. */ 1199fbe302bSMichael S. Tsirkin struct vring_used_elem { 1209fbe302bSMichael S. Tsirkin /* Index of start of used descriptor chain. */ 1219fbe302bSMichael S. Tsirkin __virtio32 id; 1229fbe302bSMichael S. Tsirkin /* Total length of the descriptor chain which was used (written to) */ 1239fbe302bSMichael S. Tsirkin __virtio32 len; 1249fbe302bSMichael S. Tsirkin }; 1259fbe302bSMichael S. Tsirkin 126f76b348eSCornelia Huck typedef struct vring_used_elem __attribute__((aligned(VRING_USED_ALIGN_SIZE))) 127f76b348eSCornelia Huck vring_used_elem_t; 128f76b348eSCornelia Huck 1299fbe302bSMichael S. Tsirkin struct vring_used { 1309fbe302bSMichael S. Tsirkin __virtio16 flags; 1319fbe302bSMichael S. Tsirkin __virtio16 idx; 132f76b348eSCornelia Huck vring_used_elem_t ring[]; 1339fbe302bSMichael S. Tsirkin }; 1349fbe302bSMichael S. Tsirkin 135f76b348eSCornelia Huck /* 136f76b348eSCornelia Huck * The ring element addresses are passed between components with different 137f76b348eSCornelia Huck * alignments assumptions. Thus, we might need to decrease the compiler-selected 138f76b348eSCornelia Huck * alignment, and so must use a typedef to make sure the aligned attribute 139f76b348eSCornelia Huck * actually takes hold: 140f76b348eSCornelia Huck * 141f76b348eSCornelia Huck * https://gcc.gnu.org/onlinedocs//gcc/Common-Type-Attributes.html#Common-Type-Attributes 142f76b348eSCornelia Huck * 143f76b348eSCornelia Huck * When used on a struct, or struct member, the aligned attribute can only 144f76b348eSCornelia Huck * increase the alignment; in order to decrease it, the packed attribute must 145f76b348eSCornelia Huck * be specified as well. When used as part of a typedef, the aligned attribute 146f76b348eSCornelia Huck * can both increase and decrease alignment, and specifying the packed 147f76b348eSCornelia Huck * attribute generates a warning. 148f76b348eSCornelia Huck */ 149f76b348eSCornelia Huck typedef struct vring_desc __attribute__((aligned(VRING_DESC_ALIGN_SIZE))) 150f76b348eSCornelia Huck vring_desc_t; 151f76b348eSCornelia Huck typedef struct vring_avail __attribute__((aligned(VRING_AVAIL_ALIGN_SIZE))) 152f76b348eSCornelia Huck vring_avail_t; 153f76b348eSCornelia Huck typedef struct vring_used __attribute__((aligned(VRING_USED_ALIGN_SIZE))) 154f76b348eSCornelia Huck vring_used_t; 155f76b348eSCornelia Huck 1569fbe302bSMichael S. Tsirkin struct vring { 1579fbe302bSMichael S. Tsirkin unsigned int num; 1589fbe302bSMichael S. Tsirkin 159f76b348eSCornelia Huck vring_desc_t *desc; 1609fbe302bSMichael S. Tsirkin 161f76b348eSCornelia Huck vring_avail_t *avail; 1629fbe302bSMichael S. Tsirkin 163f76b348eSCornelia Huck vring_used_t *used; 1649fbe302bSMichael S. Tsirkin }; 1659fbe302bSMichael S. Tsirkin 166f76b348eSCornelia Huck #ifndef VIRTIO_RING_NO_LEGACY 1679fbe302bSMichael S. Tsirkin 1689fbe302bSMichael S. Tsirkin /* The standard layout for the ring is a continuous chunk of memory which looks 1699fbe302bSMichael S. Tsirkin * like this. We assume num is a power of 2. 1709fbe302bSMichael S. Tsirkin * 1719fbe302bSMichael S. Tsirkin * struct vring 1729fbe302bSMichael S. Tsirkin * { 1739fbe302bSMichael S. Tsirkin * // The actual descriptors (16 bytes each) 1749fbe302bSMichael S. Tsirkin * struct vring_desc desc[num]; 1759fbe302bSMichael S. Tsirkin * 1769fbe302bSMichael S. Tsirkin * // A ring of available descriptor heads with free-running index. 1779fbe302bSMichael S. Tsirkin * __virtio16 avail_flags; 1789fbe302bSMichael S. Tsirkin * __virtio16 avail_idx; 1799fbe302bSMichael S. Tsirkin * __virtio16 available[num]; 1809fbe302bSMichael S. Tsirkin * __virtio16 used_event_idx; 1819fbe302bSMichael S. Tsirkin * 1829fbe302bSMichael S. Tsirkin * // Padding to the next align boundary. 1839fbe302bSMichael S. Tsirkin * char pad[]; 1849fbe302bSMichael S. Tsirkin * 1859fbe302bSMichael S. Tsirkin * // A ring of used descriptor heads with free-running index. 1869fbe302bSMichael S. Tsirkin * __virtio16 used_flags; 1879fbe302bSMichael S. Tsirkin * __virtio16 used_idx; 1889fbe302bSMichael S. Tsirkin * struct vring_used_elem used[num]; 1899fbe302bSMichael S. Tsirkin * __virtio16 avail_event_idx; 1909fbe302bSMichael S. Tsirkin * }; 1919fbe302bSMichael S. Tsirkin */ 1929fbe302bSMichael S. Tsirkin /* We publish the used event index at the end of the available ring, and vice 1939fbe302bSMichael S. Tsirkin * versa. They are at the end for backwards compatibility. */ 1949fbe302bSMichael S. Tsirkin #define vring_used_event(vr) ((vr)->avail->ring[(vr)->num]) 1959fbe302bSMichael S. Tsirkin #define vring_avail_event(vr) (*(__virtio16 *)&(vr)->used->ring[(vr)->num]) 1969fbe302bSMichael S. Tsirkin 197e0d2be2aSMichael S. Tsirkin static inline void vring_init(struct vring *vr, unsigned int num, void *p, 1989fbe302bSMichael S. Tsirkin unsigned long align) 1999fbe302bSMichael S. Tsirkin { 2009fbe302bSMichael S. Tsirkin vr->num = num; 2019fbe302bSMichael S. Tsirkin vr->desc = p; 2022a886794SGreg Kurz vr->avail = (struct vring_avail *)((char *)p + num * sizeof(struct vring_desc)); 203120758fbSPaolo Bonzini vr->used = (void *)(((uintptr_t)&vr->avail->ring[num] + sizeof(__virtio16) 2049fbe302bSMichael S. Tsirkin + align-1) & ~(align - 1)); 2059fbe302bSMichael S. Tsirkin } 2069fbe302bSMichael S. Tsirkin 207e0d2be2aSMichael S. Tsirkin static inline unsigned vring_size(unsigned int num, unsigned long align) 2089fbe302bSMichael S. Tsirkin { 2099fbe302bSMichael S. Tsirkin return ((sizeof(struct vring_desc) * num + sizeof(__virtio16) * (3 + num) 2109fbe302bSMichael S. Tsirkin + align - 1) & ~(align - 1)) 2119fbe302bSMichael S. Tsirkin + sizeof(__virtio16) * 3 + sizeof(struct vring_used_elem) * num; 2129fbe302bSMichael S. Tsirkin } 2139fbe302bSMichael S. Tsirkin 214f76b348eSCornelia Huck #endif /* VIRTIO_RING_NO_LEGACY */ 215f76b348eSCornelia Huck 2169fbe302bSMichael S. Tsirkin /* The following is used with USED_EVENT_IDX and AVAIL_EVENT_IDX */ 21724a31426SPaolo Bonzini /* Assuming a given event_idx value from the other side, if 2189fbe302bSMichael S. Tsirkin * we have just incremented index from old to new_idx, 2199fbe302bSMichael S. Tsirkin * should we trigger an event? */ 220e0d2be2aSMichael S. Tsirkin static inline int vring_need_event(uint16_t event_idx, uint16_t new_idx, uint16_t old) 2219fbe302bSMichael S. Tsirkin { 2229fbe302bSMichael S. Tsirkin /* Note: Xen has similar logic for notification hold-off 2239fbe302bSMichael S. Tsirkin * in include/xen/interface/io/ring.h with req_event and req_prod 2249fbe302bSMichael S. Tsirkin * corresponding to event_idx + 1 and new_idx respectively. 2259fbe302bSMichael S. Tsirkin * Note also that req_event and req_prod in Xen start at 1, 2269fbe302bSMichael S. Tsirkin * event indexes in virtio start at 0. */ 2279fbe302bSMichael S. Tsirkin return (uint16_t)(new_idx - event_idx - 1) < (uint16_t)(new_idx - old); 2289fbe302bSMichael S. Tsirkin } 2299fbe302bSMichael S. Tsirkin 230da054c64SPaolo Bonzini struct vring_packed_desc_event { 231da054c64SPaolo Bonzini /* Descriptor Ring Change Event Offset/Wrap Counter. */ 232da054c64SPaolo Bonzini uint16_t off_wrap; 233da054c64SPaolo Bonzini /* Descriptor Ring Change Event Flags. */ 234da054c64SPaolo Bonzini uint16_t flags; 235da054c64SPaolo Bonzini }; 236da054c64SPaolo Bonzini 237da054c64SPaolo Bonzini struct vring_packed_desc { 238da054c64SPaolo Bonzini /* Buffer Address. */ 239da054c64SPaolo Bonzini uint64_t addr; 240da054c64SPaolo Bonzini /* Buffer Length. */ 241da054c64SPaolo Bonzini uint32_t len; 242da054c64SPaolo Bonzini /* Buffer ID. */ 243da054c64SPaolo Bonzini uint16_t id; 244da054c64SPaolo Bonzini /* The flags depending on descriptor type. */ 245da054c64SPaolo Bonzini uint16_t flags; 246da054c64SPaolo Bonzini }; 247da054c64SPaolo Bonzini 2489fbe302bSMichael S. Tsirkin #endif /* _LINUX_VIRTIO_RING_H */ 249