xref: /openbmc/qemu/hw/virtio/virtio.c (revision 9884abee)
1 /*
2  * Virtio Support
3  *
4  * Copyright IBM, Corp. 2007
5  *
6  * Authors:
7  *  Anthony Liguori   <aliguori@us.ibm.com>
8  *
9  * This work is licensed under the terms of the GNU GPL, version 2.  See
10  * the COPYING file in the top-level directory.
11  *
12  */
13 
14 #include "qemu/osdep.h"
15 
16 #include "trace.h"
17 #include "exec/address-spaces.h"
18 #include "qemu/error-report.h"
19 #include "hw/virtio/virtio.h"
20 #include "qemu/atomic.h"
21 #include "hw/virtio/virtio-bus.h"
22 #include "migration/migration.h"
23 #include "hw/virtio/virtio-access.h"
24 
/*
 * The alignment to use between the consumer and producer parts of the vring.
 * This matches the x86 page size.  It is the default, used by transports
 * like PCI which don't provide a means for the guest to tell the host the
 * alignment.
 */
30 #define VIRTIO_PCI_VRING_ALIGN         4096
31 
/* One entry of a vring descriptor table, as it is laid out in memory. */
typedef struct VRingDesc {
    uint64_t addr;      /* address of the buffer (or of an indirect table) */
    uint32_t len;       /* length in bytes */
    uint16_t flags;     /* VRING_DESC_F_* bits */
    uint16_t next;      /* next descriptor in the chain, if F_NEXT is set */
} VRingDesc;
39 
/*
 * Header of the available ring.  The ring entries follow the header
 * directly; they are only ever addressed through offsetof(), so the
 * trailing array is declared as a C99 flexible array member instead of
 * the GNU zero-length array extension.  Size and layout are unchanged.
 */
typedef struct VRingAvail {
    uint16_t flags;     /* VRING_AVAIL_F_* bits */
    uint16_t idx;       /* running index of the next entry to be filled */
    uint16_t ring[];    /* descriptor head indices */
} VRingAvail;
46 
/* One entry of the used ring. */
typedef struct VRingUsedElem {
    uint32_t id;        /* head index of the completed descriptor chain */
    uint32_t len;       /* length value reported for that chain */
} VRingUsedElem;
52 
53 typedef struct VRingUsed
54 {
55     uint16_t flags;
56     uint16_t idx;
57     VRingUsedElem ring[0];
58 } VRingUsed;
59 
60 typedef struct VRing
61 {
62     unsigned int num;
63     unsigned int num_default;
64     unsigned int align;
65     hwaddr desc;
66     hwaddr avail;
67     hwaddr used;
68 } VRing;
69 
70 struct VirtQueue
71 {
72     VRing vring;
73     uint16_t last_avail_idx;
74     /* Last used index value we have signalled on */
75     uint16_t signalled_used;
76 
77     /* Last used index value we have signalled on */
78     bool signalled_used_valid;
79 
80     /* Notification enabled? */
81     bool notification;
82 
83     uint16_t queue_index;
84 
85     int inuse;
86 
87     uint16_t vector;
88     void (*handle_output)(VirtIODevice *vdev, VirtQueue *vq);
89     VirtIODevice *vdev;
90     EventNotifier guest_notifier;
91     EventNotifier host_notifier;
92     QLIST_ENTRY(VirtQueue) node;
93 };
94 
95 /* virt queue functions */
96 void virtio_queue_update_rings(VirtIODevice *vdev, int n)
97 {
98     VRing *vring = &vdev->vq[n].vring;
99 
100     if (!vring->desc) {
101         /* not yet setup -> nothing to do */
102         return;
103     }
104     vring->avail = vring->desc + vring->num * sizeof(VRingDesc);
105     vring->used = vring_align(vring->avail +
106                               offsetof(VRingAvail, ring[vring->num]),
107                               vring->align);
108 }
109 
110 static inline uint64_t vring_desc_addr(VirtIODevice *vdev, hwaddr desc_pa,
111                                        int i)
112 {
113     hwaddr pa;
114     pa = desc_pa + sizeof(VRingDesc) * i + offsetof(VRingDesc, addr);
115     return virtio_ldq_phys(vdev, pa);
116 }
117 
118 static inline uint32_t vring_desc_len(VirtIODevice *vdev, hwaddr desc_pa, int i)
119 {
120     hwaddr pa;
121     pa = desc_pa + sizeof(VRingDesc) * i + offsetof(VRingDesc, len);
122     return virtio_ldl_phys(vdev, pa);
123 }
124 
125 static inline uint16_t vring_desc_flags(VirtIODevice *vdev, hwaddr desc_pa,
126                                         int i)
127 {
128     hwaddr pa;
129     pa = desc_pa + sizeof(VRingDesc) * i + offsetof(VRingDesc, flags);
130     return virtio_lduw_phys(vdev, pa);
131 }
132 
133 static inline uint16_t vring_desc_next(VirtIODevice *vdev, hwaddr desc_pa,
134                                        int i)
135 {
136     hwaddr pa;
137     pa = desc_pa + sizeof(VRingDesc) * i + offsetof(VRingDesc, next);
138     return virtio_lduw_phys(vdev, pa);
139 }
140 
141 static inline uint16_t vring_avail_flags(VirtQueue *vq)
142 {
143     hwaddr pa;
144     pa = vq->vring.avail + offsetof(VRingAvail, flags);
145     return virtio_lduw_phys(vq->vdev, pa);
146 }
147 
148 static inline uint16_t vring_avail_idx(VirtQueue *vq)
149 {
150     hwaddr pa;
151     pa = vq->vring.avail + offsetof(VRingAvail, idx);
152     return virtio_lduw_phys(vq->vdev, pa);
153 }
154 
155 static inline uint16_t vring_avail_ring(VirtQueue *vq, int i)
156 {
157     hwaddr pa;
158     pa = vq->vring.avail + offsetof(VRingAvail, ring[i]);
159     return virtio_lduw_phys(vq->vdev, pa);
160 }
161 
162 static inline uint16_t vring_get_used_event(VirtQueue *vq)
163 {
164     return vring_avail_ring(vq, vq->vring.num);
165 }
166 
167 static inline void vring_used_ring_id(VirtQueue *vq, int i, uint32_t val)
168 {
169     hwaddr pa;
170     pa = vq->vring.used + offsetof(VRingUsed, ring[i].id);
171     virtio_stl_phys(vq->vdev, pa, val);
172 }
173 
174 static inline void vring_used_ring_len(VirtQueue *vq, int i, uint32_t val)
175 {
176     hwaddr pa;
177     pa = vq->vring.used + offsetof(VRingUsed, ring[i].len);
178     virtio_stl_phys(vq->vdev, pa, val);
179 }
180 
181 static uint16_t vring_used_idx(VirtQueue *vq)
182 {
183     hwaddr pa;
184     pa = vq->vring.used + offsetof(VRingUsed, idx);
185     return virtio_lduw_phys(vq->vdev, pa);
186 }
187 
188 static inline void vring_used_idx_set(VirtQueue *vq, uint16_t val)
189 {
190     hwaddr pa;
191     pa = vq->vring.used + offsetof(VRingUsed, idx);
192     virtio_stw_phys(vq->vdev, pa, val);
193 }
194 
195 static inline void vring_used_flags_set_bit(VirtQueue *vq, int mask)
196 {
197     VirtIODevice *vdev = vq->vdev;
198     hwaddr pa;
199     pa = vq->vring.used + offsetof(VRingUsed, flags);
200     virtio_stw_phys(vdev, pa, virtio_lduw_phys(vdev, pa) | mask);
201 }
202 
203 static inline void vring_used_flags_unset_bit(VirtQueue *vq, int mask)
204 {
205     VirtIODevice *vdev = vq->vdev;
206     hwaddr pa;
207     pa = vq->vring.used + offsetof(VRingUsed, flags);
208     virtio_stw_phys(vdev, pa, virtio_lduw_phys(vdev, pa) & ~mask);
209 }
210 
211 static inline void vring_set_avail_event(VirtQueue *vq, uint16_t val)
212 {
213     hwaddr pa;
214     if (!vq->notification) {
215         return;
216     }
217     pa = vq->vring.used + offsetof(VRingUsed, ring[vq->vring.num]);
218     virtio_stw_phys(vq->vdev, pa, val);
219 }
220 
221 void virtio_queue_set_notification(VirtQueue *vq, int enable)
222 {
223     vq->notification = enable;
224     if (virtio_vdev_has_feature(vq->vdev, VIRTIO_RING_F_EVENT_IDX)) {
225         vring_set_avail_event(vq, vring_avail_idx(vq));
226     } else if (enable) {
227         vring_used_flags_unset_bit(vq, VRING_USED_F_NO_NOTIFY);
228     } else {
229         vring_used_flags_set_bit(vq, VRING_USED_F_NO_NOTIFY);
230     }
231     if (enable) {
232         /* Expose avail event/used flags before caller checks the avail idx. */
233         smp_mb();
234     }
235 }
236 
237 int virtio_queue_ready(VirtQueue *vq)
238 {
239     return vq->vring.avail != 0;
240 }
241 
242 int virtio_queue_empty(VirtQueue *vq)
243 {
244     return vring_avail_idx(vq) == vq->last_avail_idx;
245 }
246 
247 static void virtqueue_unmap_sg(VirtQueue *vq, const VirtQueueElement *elem,
248                                unsigned int len)
249 {
250     unsigned int offset;
251     int i;
252 
253     offset = 0;
254     for (i = 0; i < elem->in_num; i++) {
255         size_t size = MIN(len - offset, elem->in_sg[i].iov_len);
256 
257         cpu_physical_memory_unmap(elem->in_sg[i].iov_base,
258                                   elem->in_sg[i].iov_len,
259                                   1, size);
260 
261         offset += size;
262     }
263 
264     for (i = 0; i < elem->out_num; i++)
265         cpu_physical_memory_unmap(elem->out_sg[i].iov_base,
266                                   elem->out_sg[i].iov_len,
267                                   0, elem->out_sg[i].iov_len);
268 }
269 
270 void virtqueue_discard(VirtQueue *vq, const VirtQueueElement *elem,
271                        unsigned int len)
272 {
273     vq->last_avail_idx--;
274     virtqueue_unmap_sg(vq, elem, len);
275 }
276 
277 void virtqueue_fill(VirtQueue *vq, const VirtQueueElement *elem,
278                     unsigned int len, unsigned int idx)
279 {
280     trace_virtqueue_fill(vq, elem, len, idx);
281 
282     virtqueue_unmap_sg(vq, elem, len);
283 
284     idx = (idx + vring_used_idx(vq)) % vq->vring.num;
285 
286     /* Get a pointer to the next entry in the used ring. */
287     vring_used_ring_id(vq, idx, elem->index);
288     vring_used_ring_len(vq, idx, len);
289 }
290 
291 void virtqueue_flush(VirtQueue *vq, unsigned int count)
292 {
293     uint16_t old, new;
294     /* Make sure buffer is written before we update index. */
295     smp_wmb();
296     trace_virtqueue_flush(vq, count);
297     old = vring_used_idx(vq);
298     new = old + count;
299     vring_used_idx_set(vq, new);
300     vq->inuse -= count;
301     if (unlikely((int16_t)(new - vq->signalled_used) < (uint16_t)(new - old)))
302         vq->signalled_used_valid = false;
303 }
304 
305 void virtqueue_push(VirtQueue *vq, const VirtQueueElement *elem,
306                     unsigned int len)
307 {
308     virtqueue_fill(vq, elem, len, 0);
309     virtqueue_flush(vq, 1);
310 }
311 
312 static int virtqueue_num_heads(VirtQueue *vq, unsigned int idx)
313 {
314     uint16_t num_heads = vring_avail_idx(vq) - idx;
315 
316     /* Check it isn't doing very strange things with descriptor numbers. */
317     if (num_heads > vq->vring.num) {
318         error_report("Guest moved used index from %u to %u",
319                      idx, vring_avail_idx(vq));
320         exit(1);
321     }
322     /* On success, callers read a descriptor at vq->last_avail_idx.
323      * Make sure descriptor read does not bypass avail index read. */
324     if (num_heads) {
325         smp_rmb();
326     }
327 
328     return num_heads;
329 }
330 
331 static unsigned int virtqueue_get_head(VirtQueue *vq, unsigned int idx)
332 {
333     unsigned int head;
334 
335     /* Grab the next descriptor number they're advertising, and increment
336      * the index we've seen. */
337     head = vring_avail_ring(vq, idx % vq->vring.num);
338 
339     /* If their number is silly, that's a fatal mistake. */
340     if (head >= vq->vring.num) {
341         error_report("Guest says index %u is available", head);
342         exit(1);
343     }
344 
345     return head;
346 }
347 
348 static unsigned virtqueue_next_desc(VirtIODevice *vdev, hwaddr desc_pa,
349                                     unsigned int i, unsigned int max)
350 {
351     unsigned int next;
352 
353     /* If this descriptor says it doesn't chain, we're done. */
354     if (!(vring_desc_flags(vdev, desc_pa, i) & VRING_DESC_F_NEXT)) {
355         return max;
356     }
357 
358     /* Check they're not leading us off end of descriptors. */
359     next = vring_desc_next(vdev, desc_pa, i);
360     /* Make sure compiler knows to grab that: we don't want it changing! */
361     smp_wmb();
362 
363     if (next >= max) {
364         error_report("Desc next is %u", next);
365         exit(1);
366     }
367 
368     return next;
369 }
370 
/*
 * Sum up the buffer space currently offered in @vq without consuming it.
 *
 * Starting at vq->last_avail_idx (which is not modified), every available
 * descriptor chain is walked.  The lengths of descriptors flagged
 * VRING_DESC_F_WRITE are added to the "in" total, all others to the "out"
 * total.  The walk stops early as soon as the in total has reached
 * @max_in_bytes and the out total has reached @max_out_bytes.
 *
 * @in_bytes:  if not NULL, receives the in total
 * @out_bytes: if not NULL, receives the out total
 *
 * Malformed rings (bad indirect table size, descriptor loops, bad indices)
 * terminate the process via exit(1).
 */
void virtqueue_get_avail_bytes(VirtQueue *vq, unsigned int *in_bytes,
                               unsigned int *out_bytes,
                               unsigned max_in_bytes, unsigned max_out_bytes)
{
    unsigned int idx;
    unsigned int total_bufs, in_total, out_total;

    /* Work on a private copy of the index so nothing is consumed. */
    idx = vq->last_avail_idx;

    total_bufs = in_total = out_total = 0;
    while (virtqueue_num_heads(vq, idx)) {
        VirtIODevice *vdev = vq->vdev;
        unsigned int max, num_bufs, indirect = 0;
        hwaddr desc_pa;
        int i;

        max = vq->vring.num;
        /* Descriptors seen so far count against the loop check below. */
        num_bufs = total_bufs;
        i = virtqueue_get_head(vq, idx++);
        desc_pa = vq->vring.desc;

        if (vring_desc_flags(vdev, desc_pa, i) & VRING_DESC_F_INDIRECT) {
            if (vring_desc_len(vdev, desc_pa, i) % sizeof(VRingDesc)) {
                error_report("Invalid size for indirect buffer table");
                exit(1);
            }

            /* If we've got too many, that implies a descriptor loop. */
            if (num_bufs >= max) {
                error_report("Looped descriptor");
                exit(1);
            }

            /* loop over the indirect descriptor table */
            indirect = 1;
            max = vring_desc_len(vdev, desc_pa, i) / sizeof(VRingDesc);
            desc_pa = vring_desc_addr(vdev, desc_pa, i);
            /* The indirect table is walked from its first entry. */
            num_bufs = i = 0;
        }

        do {
            /* If we've got too many, that implies a descriptor loop. */
            if (++num_bufs > max) {
                error_report("Looped descriptor");
                exit(1);
            }

            if (vring_desc_flags(vdev, desc_pa, i) & VRING_DESC_F_WRITE) {
                in_total += vring_desc_len(vdev, desc_pa, i);
            } else {
                out_total += vring_desc_len(vdev, desc_pa, i);
            }
            /* Both limits reached: no need to look any further. */
            if (in_total >= max_in_bytes && out_total >= max_out_bytes) {
                goto done;
            }
        } while ((i = virtqueue_next_desc(vdev, desc_pa, i, max)) != max);

        /*
         * A direct chain contributes all of its descriptors to the running
         * count; an indirect one counts as a single ring descriptor.
         */
        if (!indirect)
            total_bufs = num_bufs;
        else
            total_bufs++;
    }
done:
    if (in_bytes) {
        *in_bytes = in_total;
    }
    if (out_bytes) {
        *out_bytes = out_total;
    }
}
441 
442 int virtqueue_avail_bytes(VirtQueue *vq, unsigned int in_bytes,
443                           unsigned int out_bytes)
444 {
445     unsigned int in_total, out_total;
446 
447     virtqueue_get_avail_bytes(vq, &in_total, &out_total, in_bytes, out_bytes);
448     return in_bytes <= in_total && out_bytes <= out_total;
449 }
450 
/*
 * Map the buffers described by @addr[] / @sg[].iov_len and store the
 * resulting pointers in @sg[].iov_base.
 *
 * @sg:       iovec array; iov_len is input, iov_base is filled in
 * @addr:     addresses to map, parallel to @sg
 * @num_sg:   in/out number of valid entries; grows when an entry is split
 * @max_size: capacity of both arrays
 * @is_write: passed through to cpu_physical_memory_map()
 *
 * When cpu_physical_memory_map() maps fewer bytes than requested, the
 * entry is split in two: the remainder becomes a new entry right after
 * it and is mapped on the next loop iteration.  A failed mapping, or a
 * split that would exceed @max_size, terminates the process via exit(1).
 */
static void virtqueue_map_iovec(struct iovec *sg, hwaddr *addr,
                                unsigned int *num_sg, unsigned int max_size,
                                int is_write)
{
    unsigned int i;
    hwaddr len;

    /* Note: this function MUST validate input, some callers
     * are passing in num_sg values received over the network.
     */
    /* TODO: teach all callers that this can fail, and return failure instead
     * of asserting here.
     * When we do, we might be able to re-enable NDEBUG below.
     */
#ifdef NDEBUG
#error building with NDEBUG is not supported
#endif
    assert(*num_sg <= max_size);

    for (i = 0; i < *num_sg; i++) {
        len = sg[i].iov_len;
        /* len is updated to the number of bytes actually mapped. */
        sg[i].iov_base = cpu_physical_memory_map(addr[i], &len, is_write);
        if (!sg[i].iov_base) {
            error_report("virtio: error trying to map MMIO memory");
            exit(1);
        }
        if (len == sg[i].iov_len) {
            /* Fully mapped in one piece. */
            continue;
        }
        if (*num_sg >= max_size) {
            error_report("virtio: memory split makes iovec too large");
            exit(1);
        }
        /* Duplicate entry i into i + 1, shifting the tail up by one. */
        memmove(sg + i + 1, sg + i, sizeof(*sg) * (*num_sg - i));
        memmove(addr + i + 1, addr + i, sizeof(*addr) * (*num_sg - i));
        assert(len < sg[i + 1].iov_len);
        /* Entry i keeps the mapped part, entry i + 1 the remainder. */
        sg[i].iov_len = len;
        addr[i + 1] += len;
        sg[i + 1].iov_len -= len;
        ++*num_sg;
    }
}
493 
494 void virtqueue_map(VirtQueueElement *elem)
495 {
496     virtqueue_map_iovec(elem->in_sg, elem->in_addr, &elem->in_num,
497                         MIN(ARRAY_SIZE(elem->in_sg), ARRAY_SIZE(elem->in_addr)),
498                         1);
499     virtqueue_map_iovec(elem->out_sg, elem->out_addr, &elem->out_num,
500                         MIN(ARRAY_SIZE(elem->out_sg), ARRAY_SIZE(elem->out_addr)),
501                         0);
502 }
503 
/*
 * Take the next available descriptor chain off @vq and describe it in
 * @elem.
 *
 * Descriptors flagged VRING_DESC_F_WRITE are collected into elem->in_sg /
 * in_addr, all others into elem->out_sg / out_addr, and the buffers are
 * then mapped with virtqueue_map().  On success last_avail_idx has been
 * advanced and vq->inuse incremented.
 *
 * Returns 0 when no new chain is available, otherwise the total number
 * of in and out buffers in @elem.  Malformed chains terminate the process
 * via exit(1).
 */
int virtqueue_pop(VirtQueue *vq, VirtQueueElement *elem)
{
    unsigned int i, head, max;
    hwaddr desc_pa = vq->vring.desc;
    VirtIODevice *vdev = vq->vdev;

    if (!virtqueue_num_heads(vq, vq->last_avail_idx))
        return 0;

    /* When we start there are none of either input nor output. */
    elem->out_num = elem->in_num = 0;

    max = vq->vring.num;

    /* Fetch the chain head and consume the available ring entry. */
    i = head = virtqueue_get_head(vq, vq->last_avail_idx++);
    if (virtio_vdev_has_feature(vdev, VIRTIO_RING_F_EVENT_IDX)) {
        vring_set_avail_event(vq, vq->last_avail_idx);
    }

    if (vring_desc_flags(vdev, desc_pa, i) & VRING_DESC_F_INDIRECT) {
        if (vring_desc_len(vdev, desc_pa, i) % sizeof(VRingDesc)) {
            error_report("Invalid size for indirect buffer table");
            exit(1);
        }

        /* loop over the indirect descriptor table */
        max = vring_desc_len(vdev, desc_pa, i) / sizeof(VRingDesc);
        desc_pa = vring_desc_addr(vdev, desc_pa, i);
        i = 0;
    }

    /* Collect all the descriptors */
    do {
        struct iovec *sg;

        if (vring_desc_flags(vdev, desc_pa, i) & VRING_DESC_F_WRITE) {
            if (elem->in_num >= ARRAY_SIZE(elem->in_sg)) {
                error_report("Too many write descriptors in indirect table");
                exit(1);
            }
            elem->in_addr[elem->in_num] = vring_desc_addr(vdev, desc_pa, i);
            sg = &elem->in_sg[elem->in_num++];
        } else {
            if (elem->out_num >= ARRAY_SIZE(elem->out_sg)) {
                error_report("Too many read descriptors in indirect table");
                exit(1);
            }
            elem->out_addr[elem->out_num] = vring_desc_addr(vdev, desc_pa, i);
            sg = &elem->out_sg[elem->out_num++];
        }

        /* Only the length is known here; iov_base is set when mapping. */
        sg->iov_len = vring_desc_len(vdev, desc_pa, i);

        /* If we've got too many, that implies a descriptor loop. */
        if ((elem->in_num + elem->out_num) > max) {
            error_report("Looped descriptor");
            exit(1);
        }
    } while ((i = virtqueue_next_desc(vdev, desc_pa, i, max)) != max);

    /* Now map what we have collected */
    virtqueue_map(elem);

    /* Remember the chain head; virtqueue_fill() reports it as the used id. */
    elem->index = head;

    vq->inuse++;

    trace_virtqueue_pop(vq, elem, elem->in_num, elem->out_num);
    return elem->in_num + elem->out_num;
}
574 
575 /* virtio device */
576 static void virtio_notify_vector(VirtIODevice *vdev, uint16_t vector)
577 {
578     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
579     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
580 
581     if (k->notify) {
582         k->notify(qbus->parent, vector);
583     }
584 }
585 
586 void virtio_update_irq(VirtIODevice *vdev)
587 {
588     virtio_notify_vector(vdev, VIRTIO_NO_VECTOR);
589 }
590 
591 static int virtio_validate_features(VirtIODevice *vdev)
592 {
593     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
594 
595     if (k->validate_features) {
596         return k->validate_features(vdev);
597     } else {
598         return 0;
599     }
600 }
601 
602 int virtio_set_status(VirtIODevice *vdev, uint8_t val)
603 {
604     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
605     trace_virtio_set_status(vdev, val);
606 
607     if (virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1)) {
608         if (!(vdev->status & VIRTIO_CONFIG_S_FEATURES_OK) &&
609             val & VIRTIO_CONFIG_S_FEATURES_OK) {
610             int ret = virtio_validate_features(vdev);
611 
612             if (ret) {
613                 return ret;
614             }
615         }
616     }
617     if (k->set_status) {
618         k->set_status(vdev, val);
619     }
620     vdev->status = val;
621     return 0;
622 }
623 
624 bool target_words_bigendian(void);
625 static enum virtio_device_endian virtio_default_endian(void)
626 {
627     if (target_words_bigendian()) {
628         return VIRTIO_DEVICE_ENDIAN_BIG;
629     } else {
630         return VIRTIO_DEVICE_ENDIAN_LITTLE;
631     }
632 }
633 
634 static enum virtio_device_endian virtio_current_cpu_endian(void)
635 {
636     CPUClass *cc = CPU_GET_CLASS(current_cpu);
637 
638     if (cc->virtio_is_big_endian(current_cpu)) {
639         return VIRTIO_DEVICE_ENDIAN_BIG;
640     } else {
641         return VIRTIO_DEVICE_ENDIAN_LITTLE;
642     }
643 }
644 
645 void virtio_reset(void *opaque)
646 {
647     VirtIODevice *vdev = opaque;
648     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
649     int i;
650 
651     virtio_set_status(vdev, 0);
652     if (current_cpu) {
653         /* Guest initiated reset */
654         vdev->device_endian = virtio_current_cpu_endian();
655     } else {
656         /* System reset */
657         vdev->device_endian = virtio_default_endian();
658     }
659 
660     if (k->reset) {
661         k->reset(vdev);
662     }
663 
664     vdev->guest_features = 0;
665     vdev->queue_sel = 0;
666     vdev->status = 0;
667     vdev->isr = 0;
668     vdev->config_vector = VIRTIO_NO_VECTOR;
669     virtio_notify_vector(vdev, vdev->config_vector);
670 
671     for(i = 0; i < VIRTIO_QUEUE_MAX; i++) {
672         vdev->vq[i].vring.desc = 0;
673         vdev->vq[i].vring.avail = 0;
674         vdev->vq[i].vring.used = 0;
675         vdev->vq[i].last_avail_idx = 0;
676         virtio_queue_set_vector(vdev, i, VIRTIO_NO_VECTOR);
677         vdev->vq[i].signalled_used = 0;
678         vdev->vq[i].signalled_used_valid = false;
679         vdev->vq[i].notification = true;
680         vdev->vq[i].vring.num = vdev->vq[i].vring.num_default;
681     }
682 }
683 
684 uint32_t virtio_config_readb(VirtIODevice *vdev, uint32_t addr)
685 {
686     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
687     uint8_t val;
688 
689     if (addr + sizeof(val) > vdev->config_len) {
690         return (uint32_t)-1;
691     }
692 
693     k->get_config(vdev, vdev->config);
694 
695     val = ldub_p(vdev->config + addr);
696     return val;
697 }
698 
699 uint32_t virtio_config_readw(VirtIODevice *vdev, uint32_t addr)
700 {
701     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
702     uint16_t val;
703 
704     if (addr + sizeof(val) > vdev->config_len) {
705         return (uint32_t)-1;
706     }
707 
708     k->get_config(vdev, vdev->config);
709 
710     val = lduw_p(vdev->config + addr);
711     return val;
712 }
713 
714 uint32_t virtio_config_readl(VirtIODevice *vdev, uint32_t addr)
715 {
716     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
717     uint32_t val;
718 
719     if (addr + sizeof(val) > vdev->config_len) {
720         return (uint32_t)-1;
721     }
722 
723     k->get_config(vdev, vdev->config);
724 
725     val = ldl_p(vdev->config + addr);
726     return val;
727 }
728 
729 void virtio_config_writeb(VirtIODevice *vdev, uint32_t addr, uint32_t data)
730 {
731     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
732     uint8_t val = data;
733 
734     if (addr + sizeof(val) > vdev->config_len) {
735         return;
736     }
737 
738     stb_p(vdev->config + addr, val);
739 
740     if (k->set_config) {
741         k->set_config(vdev, vdev->config);
742     }
743 }
744 
745 void virtio_config_writew(VirtIODevice *vdev, uint32_t addr, uint32_t data)
746 {
747     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
748     uint16_t val = data;
749 
750     if (addr + sizeof(val) > vdev->config_len) {
751         return;
752     }
753 
754     stw_p(vdev->config + addr, val);
755 
756     if (k->set_config) {
757         k->set_config(vdev, vdev->config);
758     }
759 }
760 
761 void virtio_config_writel(VirtIODevice *vdev, uint32_t addr, uint32_t data)
762 {
763     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
764     uint32_t val = data;
765 
766     if (addr + sizeof(val) > vdev->config_len) {
767         return;
768     }
769 
770     stl_p(vdev->config + addr, val);
771 
772     if (k->set_config) {
773         k->set_config(vdev, vdev->config);
774     }
775 }
776 
777 uint32_t virtio_config_modern_readb(VirtIODevice *vdev, uint32_t addr)
778 {
779     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
780     uint8_t val;
781 
782     if (addr + sizeof(val) > vdev->config_len) {
783         return (uint32_t)-1;
784     }
785 
786     k->get_config(vdev, vdev->config);
787 
788     val = ldub_p(vdev->config + addr);
789     return val;
790 }
791 
792 uint32_t virtio_config_modern_readw(VirtIODevice *vdev, uint32_t addr)
793 {
794     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
795     uint16_t val;
796 
797     if (addr + sizeof(val) > vdev->config_len) {
798         return (uint32_t)-1;
799     }
800 
801     k->get_config(vdev, vdev->config);
802 
803     val = lduw_le_p(vdev->config + addr);
804     return val;
805 }
806 
807 uint32_t virtio_config_modern_readl(VirtIODevice *vdev, uint32_t addr)
808 {
809     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
810     uint32_t val;
811 
812     if (addr + sizeof(val) > vdev->config_len) {
813         return (uint32_t)-1;
814     }
815 
816     k->get_config(vdev, vdev->config);
817 
818     val = ldl_le_p(vdev->config + addr);
819     return val;
820 }
821 
822 void virtio_config_modern_writeb(VirtIODevice *vdev,
823                                  uint32_t addr, uint32_t data)
824 {
825     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
826     uint8_t val = data;
827 
828     if (addr + sizeof(val) > vdev->config_len) {
829         return;
830     }
831 
832     stb_p(vdev->config + addr, val);
833 
834     if (k->set_config) {
835         k->set_config(vdev, vdev->config);
836     }
837 }
838 
839 void virtio_config_modern_writew(VirtIODevice *vdev,
840                                  uint32_t addr, uint32_t data)
841 {
842     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
843     uint16_t val = data;
844 
845     if (addr + sizeof(val) > vdev->config_len) {
846         return;
847     }
848 
849     stw_le_p(vdev->config + addr, val);
850 
851     if (k->set_config) {
852         k->set_config(vdev, vdev->config);
853     }
854 }
855 
856 void virtio_config_modern_writel(VirtIODevice *vdev,
857                                  uint32_t addr, uint32_t data)
858 {
859     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
860     uint32_t val = data;
861 
862     if (addr + sizeof(val) > vdev->config_len) {
863         return;
864     }
865 
866     stl_le_p(vdev->config + addr, val);
867 
868     if (k->set_config) {
869         k->set_config(vdev, vdev->config);
870     }
871 }
872 
873 void virtio_queue_set_addr(VirtIODevice *vdev, int n, hwaddr addr)
874 {
875     vdev->vq[n].vring.desc = addr;
876     virtio_queue_update_rings(vdev, n);
877 }
878 
879 hwaddr virtio_queue_get_addr(VirtIODevice *vdev, int n)
880 {
881     return vdev->vq[n].vring.desc;
882 }
883 
884 void virtio_queue_set_rings(VirtIODevice *vdev, int n, hwaddr desc,
885                             hwaddr avail, hwaddr used)
886 {
887     vdev->vq[n].vring.desc = desc;
888     vdev->vq[n].vring.avail = avail;
889     vdev->vq[n].vring.used = used;
890 }
891 
892 void virtio_queue_set_num(VirtIODevice *vdev, int n, int num)
893 {
894     /* Don't allow guest to flip queue between existent and
895      * nonexistent states, or to set it to an invalid size.
896      */
897     if (!!num != !!vdev->vq[n].vring.num ||
898         num > VIRTQUEUE_MAX_SIZE ||
899         num < 0) {
900         return;
901     }
902     vdev->vq[n].vring.num = num;
903 }
904 
905 VirtQueue *virtio_vector_first_queue(VirtIODevice *vdev, uint16_t vector)
906 {
907     return QLIST_FIRST(&vdev->vector_queues[vector]);
908 }
909 
910 VirtQueue *virtio_vector_next_queue(VirtQueue *vq)
911 {
912     return QLIST_NEXT(vq, node);
913 }
914 
915 int virtio_queue_get_num(VirtIODevice *vdev, int n)
916 {
917     return vdev->vq[n].vring.num;
918 }
919 
920 int virtio_get_num_queues(VirtIODevice *vdev)
921 {
922     int i;
923 
924     for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
925         if (!virtio_queue_get_num(vdev, i)) {
926             break;
927         }
928     }
929 
930     return i;
931 }
932 
933 int virtio_queue_get_id(VirtQueue *vq)
934 {
935     VirtIODevice *vdev = vq->vdev;
936     assert(vq >= &vdev->vq[0] && vq < &vdev->vq[VIRTIO_QUEUE_MAX]);
937     return vq - &vdev->vq[0];
938 }
939 
940 void virtio_queue_set_align(VirtIODevice *vdev, int n, int align)
941 {
942     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
943     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
944 
945     /* virtio-1 compliant devices cannot change the alignment */
946     if (virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1)) {
947         error_report("tried to modify queue alignment for virtio-1 device");
948         return;
949     }
950     /* Check that the transport told us it was going to do this
951      * (so a buggy transport will immediately assert rather than
952      * silently failing to migrate this state)
953      */
954     assert(k->has_variable_vring_alignment);
955 
956     vdev->vq[n].vring.align = align;
957     virtio_queue_update_rings(vdev, n);
958 }
959 
960 void virtio_queue_notify_vq(VirtQueue *vq)
961 {
962     if (vq->vring.desc && vq->handle_output) {
963         VirtIODevice *vdev = vq->vdev;
964 
965         trace_virtio_queue_notify(vdev, vq - vdev->vq, vq);
966         vq->handle_output(vdev, vq);
967     }
968 }
969 
970 void virtio_queue_notify(VirtIODevice *vdev, int n)
971 {
972     virtio_queue_notify_vq(&vdev->vq[n]);
973 }
974 
975 uint16_t virtio_queue_vector(VirtIODevice *vdev, int n)
976 {
977     return n < VIRTIO_QUEUE_MAX ? vdev->vq[n].vector :
978         VIRTIO_NO_VECTOR;
979 }
980 
981 void virtio_queue_set_vector(VirtIODevice *vdev, int n, uint16_t vector)
982 {
983     VirtQueue *vq = &vdev->vq[n];
984 
985     if (n < VIRTIO_QUEUE_MAX) {
986         if (vdev->vector_queues &&
987             vdev->vq[n].vector != VIRTIO_NO_VECTOR) {
988             QLIST_REMOVE(vq, node);
989         }
990         vdev->vq[n].vector = vector;
991         if (vdev->vector_queues &&
992             vector != VIRTIO_NO_VECTOR) {
993             QLIST_INSERT_HEAD(&vdev->vector_queues[vector], vq, node);
994         }
995     }
996 }
997 
998 VirtQueue *virtio_add_queue(VirtIODevice *vdev, int queue_size,
999                             void (*handle_output)(VirtIODevice *, VirtQueue *))
1000 {
1001     int i;
1002 
1003     for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
1004         if (vdev->vq[i].vring.num == 0)
1005             break;
1006     }
1007 
1008     if (i == VIRTIO_QUEUE_MAX || queue_size > VIRTQUEUE_MAX_SIZE)
1009         abort();
1010 
1011     vdev->vq[i].vring.num = queue_size;
1012     vdev->vq[i].vring.num_default = queue_size;
1013     vdev->vq[i].vring.align = VIRTIO_PCI_VRING_ALIGN;
1014     vdev->vq[i].handle_output = handle_output;
1015 
1016     return &vdev->vq[i];
1017 }
1018 
1019 void virtio_del_queue(VirtIODevice *vdev, int n)
1020 {
1021     if (n < 0 || n >= VIRTIO_QUEUE_MAX) {
1022         abort();
1023     }
1024 
1025     vdev->vq[n].vring.num = 0;
1026     vdev->vq[n].vring.num_default = 0;
1027 }
1028 
1029 void virtio_irq(VirtQueue *vq)
1030 {
1031     trace_virtio_irq(vq);
1032     vq->vdev->isr |= 0x01;
1033     virtio_notify_vector(vq->vdev, vq->vector);
1034 }
1035 
1036 static bool vring_notify(VirtIODevice *vdev, VirtQueue *vq)
1037 {
1038     uint16_t old, new;
1039     bool v;
1040     /* We need to expose used array entries before checking used event. */
1041     smp_mb();
1042     /* Always notify when queue is empty (when feature acknowledge) */
1043     if (virtio_vdev_has_feature(vdev, VIRTIO_F_NOTIFY_ON_EMPTY) &&
1044         !vq->inuse && vring_avail_idx(vq) == vq->last_avail_idx) {
1045         return true;
1046     }
1047 
1048     if (!virtio_vdev_has_feature(vdev, VIRTIO_RING_F_EVENT_IDX)) {
1049         return !(vring_avail_flags(vq) & VRING_AVAIL_F_NO_INTERRUPT);
1050     }
1051 
1052     v = vq->signalled_used_valid;
1053     vq->signalled_used_valid = true;
1054     old = vq->signalled_used;
1055     new = vq->signalled_used = vring_used_idx(vq);
1056     return !v || vring_need_event(vring_get_used_event(vq), new, old);
1057 }
1058 
1059 void virtio_notify(VirtIODevice *vdev, VirtQueue *vq)
1060 {
1061     if (!vring_notify(vdev, vq)) {
1062         return;
1063     }
1064 
1065     trace_virtio_notify(vdev, vq);
1066     vdev->isr |= 0x01;
1067     virtio_notify_vector(vdev, vq->vector);
1068 }
1069 
1070 void virtio_notify_config(VirtIODevice *vdev)
1071 {
1072     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))
1073         return;
1074 
1075     vdev->isr |= 0x03;
1076     vdev->generation++;
1077     virtio_notify_vector(vdev, vdev->config_vector);
1078 }
1079 
1080 static bool virtio_device_endian_needed(void *opaque)
1081 {
1082     VirtIODevice *vdev = opaque;
1083 
1084     assert(vdev->device_endian != VIRTIO_DEVICE_ENDIAN_UNKNOWN);
1085     if (!virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1)) {
1086         return vdev->device_endian != virtio_default_endian();
1087     }
1088     /* Devices conforming to VIRTIO 1.0 or later are always LE. */
1089     return vdev->device_endian != VIRTIO_DEVICE_ENDIAN_LITTLE;
1090 }
1091 
1092 static bool virtio_64bit_features_needed(void *opaque)
1093 {
1094     VirtIODevice *vdev = opaque;
1095 
1096     return (vdev->host_features >> 32) != 0;
1097 }
1098 
1099 static bool virtio_virtqueue_needed(void *opaque)
1100 {
1101     VirtIODevice *vdev = opaque;
1102 
1103     return virtio_host_has_feature(vdev, VIRTIO_F_VERSION_1);
1104 }
1105 
1106 static bool virtio_ringsize_needed(void *opaque)
1107 {
1108     VirtIODevice *vdev = opaque;
1109     int i;
1110 
1111     for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
1112         if (vdev->vq[i].vring.num != vdev->vq[i].vring.num_default) {
1113             return true;
1114         }
1115     }
1116     return false;
1117 }
1118 
1119 static bool virtio_extra_state_needed(void *opaque)
1120 {
1121     VirtIODevice *vdev = opaque;
1122     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
1123     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1124 
1125     return k->has_extra_state &&
1126         k->has_extra_state(qbus->parent);
1127 }
1128 
1129 static const VMStateDescription vmstate_virtqueue = {
1130     .name = "virtqueue_state",
1131     .version_id = 1,
1132     .minimum_version_id = 1,
1133     .fields = (VMStateField[]) {
1134         VMSTATE_UINT64(vring.avail, struct VirtQueue),
1135         VMSTATE_UINT64(vring.used, struct VirtQueue),
1136         VMSTATE_END_OF_LIST()
1137     }
1138 };
1139 
1140 static const VMStateDescription vmstate_virtio_virtqueues = {
1141     .name = "virtio/virtqueues",
1142     .version_id = 1,
1143     .minimum_version_id = 1,
1144     .needed = &virtio_virtqueue_needed,
1145     .fields = (VMStateField[]) {
1146         VMSTATE_STRUCT_VARRAY_KNOWN(vq, struct VirtIODevice, VIRTIO_QUEUE_MAX,
1147                       0, vmstate_virtqueue, VirtQueue),
1148         VMSTATE_END_OF_LIST()
1149     }
1150 };
1151 
1152 static const VMStateDescription vmstate_ringsize = {
1153     .name = "ringsize_state",
1154     .version_id = 1,
1155     .minimum_version_id = 1,
1156     .fields = (VMStateField[]) {
1157         VMSTATE_UINT32(vring.num_default, struct VirtQueue),
1158         VMSTATE_END_OF_LIST()
1159     }
1160 };
1161 
1162 static const VMStateDescription vmstate_virtio_ringsize = {
1163     .name = "virtio/ringsize",
1164     .version_id = 1,
1165     .minimum_version_id = 1,
1166     .needed = &virtio_ringsize_needed,
1167     .fields = (VMStateField[]) {
1168         VMSTATE_STRUCT_VARRAY_KNOWN(vq, struct VirtIODevice, VIRTIO_QUEUE_MAX,
1169                       0, vmstate_ringsize, VirtQueue),
1170         VMSTATE_END_OF_LIST()
1171     }
1172 };
1173 
1174 static int get_extra_state(QEMUFile *f, void *pv, size_t size)
1175 {
1176     VirtIODevice *vdev = pv;
1177     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
1178     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1179 
1180     if (!k->load_extra_state) {
1181         return -1;
1182     } else {
1183         return k->load_extra_state(qbus->parent, f);
1184     }
1185 }
1186 
1187 static void put_extra_state(QEMUFile *f, void *pv, size_t size)
1188 {
1189     VirtIODevice *vdev = pv;
1190     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
1191     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1192 
1193     k->save_extra_state(qbus->parent, f);
1194 }
1195 
1196 static const VMStateInfo vmstate_info_extra_state = {
1197     .name = "virtqueue_extra_state",
1198     .get = get_extra_state,
1199     .put = put_extra_state,
1200 };
1201 
1202 static const VMStateDescription vmstate_virtio_extra_state = {
1203     .name = "virtio/extra_state",
1204     .version_id = 1,
1205     .minimum_version_id = 1,
1206     .needed = &virtio_extra_state_needed,
1207     .fields = (VMStateField[]) {
1208         {
1209             .name         = "extra_state",
1210             .version_id   = 0,
1211             .field_exists = NULL,
1212             .size         = 0,
1213             .info         = &vmstate_info_extra_state,
1214             .flags        = VMS_SINGLE,
1215             .offset       = 0,
1216         },
1217         VMSTATE_END_OF_LIST()
1218     }
1219 };
1220 
1221 static const VMStateDescription vmstate_virtio_device_endian = {
1222     .name = "virtio/device_endian",
1223     .version_id = 1,
1224     .minimum_version_id = 1,
1225     .needed = &virtio_device_endian_needed,
1226     .fields = (VMStateField[]) {
1227         VMSTATE_UINT8(device_endian, VirtIODevice),
1228         VMSTATE_END_OF_LIST()
1229     }
1230 };
1231 
1232 static const VMStateDescription vmstate_virtio_64bit_features = {
1233     .name = "virtio/64bit_features",
1234     .version_id = 1,
1235     .minimum_version_id = 1,
1236     .needed = &virtio_64bit_features_needed,
1237     .fields = (VMStateField[]) {
1238         VMSTATE_UINT64(guest_features, VirtIODevice),
1239         VMSTATE_END_OF_LIST()
1240     }
1241 };
1242 
1243 static const VMStateDescription vmstate_virtio = {
1244     .name = "virtio",
1245     .version_id = 1,
1246     .minimum_version_id = 1,
1247     .minimum_version_id_old = 1,
1248     .fields = (VMStateField[]) {
1249         VMSTATE_END_OF_LIST()
1250     },
1251     .subsections = (const VMStateDescription*[]) {
1252         &vmstate_virtio_device_endian,
1253         &vmstate_virtio_64bit_features,
1254         &vmstate_virtio_virtqueues,
1255         &vmstate_virtio_ringsize,
1256         &vmstate_virtio_extra_state,
1257         NULL
1258     }
1259 };
1260 
1261 void virtio_save(VirtIODevice *vdev, QEMUFile *f)
1262 {
1263     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
1264     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1265     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(vdev);
1266     uint32_t guest_features_lo = (vdev->guest_features & 0xffffffff);
1267     int i;
1268 
1269     if (k->save_config) {
1270         k->save_config(qbus->parent, f);
1271     }
1272 
1273     qemu_put_8s(f, &vdev->status);
1274     qemu_put_8s(f, &vdev->isr);
1275     qemu_put_be16s(f, &vdev->queue_sel);
1276     qemu_put_be32s(f, &guest_features_lo);
1277     qemu_put_be32(f, vdev->config_len);
1278     qemu_put_buffer(f, vdev->config, vdev->config_len);
1279 
1280     for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
1281         if (vdev->vq[i].vring.num == 0)
1282             break;
1283     }
1284 
1285     qemu_put_be32(f, i);
1286 
1287     for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
1288         if (vdev->vq[i].vring.num == 0)
1289             break;
1290 
1291         qemu_put_be32(f, vdev->vq[i].vring.num);
1292         if (k->has_variable_vring_alignment) {
1293             qemu_put_be32(f, vdev->vq[i].vring.align);
1294         }
1295         /* XXX virtio-1 devices */
1296         qemu_put_be64(f, vdev->vq[i].vring.desc);
1297         qemu_put_be16s(f, &vdev->vq[i].last_avail_idx);
1298         if (k->save_queue) {
1299             k->save_queue(qbus->parent, i, f);
1300         }
1301     }
1302 
1303     if (vdc->save != NULL) {
1304         vdc->save(vdev, f);
1305     }
1306 
1307     /* Subsections */
1308     vmstate_save_state(f, &vmstate_virtio, vdev, NULL);
1309 }
1310 
1311 static int virtio_set_features_nocheck(VirtIODevice *vdev, uint64_t val)
1312 {
1313     VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
1314     bool bad = (val & ~(vdev->host_features)) != 0;
1315 
1316     val &= vdev->host_features;
1317     if (k->set_features) {
1318         k->set_features(vdev, val);
1319     }
1320     vdev->guest_features = val;
1321     return bad ? -1 : 0;
1322 }
1323 
1324 int virtio_set_features(VirtIODevice *vdev, uint64_t val)
1325 {
1326    /*
1327      * The driver must not attempt to set features after feature negotiation
1328      * has finished.
1329      */
1330     if (vdev->status & VIRTIO_CONFIG_S_FEATURES_OK) {
1331         return -EINVAL;
1332     }
1333     return virtio_set_features_nocheck(vdev, val);
1334 }
1335 
1336 int virtio_load(VirtIODevice *vdev, QEMUFile *f, int version_id)
1337 {
1338     int i, ret;
1339     int32_t config_len;
1340     uint32_t num;
1341     uint32_t features;
1342     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
1343     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1344     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(vdev);
1345 
1346     /*
1347      * We poison the endianness to ensure it does not get used before
1348      * subsections have been loaded.
1349      */
1350     vdev->device_endian = VIRTIO_DEVICE_ENDIAN_UNKNOWN;
1351 
1352     if (k->load_config) {
1353         ret = k->load_config(qbus->parent, f);
1354         if (ret)
1355             return ret;
1356     }
1357 
1358     qemu_get_8s(f, &vdev->status);
1359     qemu_get_8s(f, &vdev->isr);
1360     qemu_get_be16s(f, &vdev->queue_sel);
1361     if (vdev->queue_sel >= VIRTIO_QUEUE_MAX) {
1362         return -1;
1363     }
1364     qemu_get_be32s(f, &features);
1365 
1366     config_len = qemu_get_be32(f);
1367 
1368     /*
1369      * There are cases where the incoming config can be bigger or smaller
1370      * than what we have; so load what we have space for, and skip
1371      * any excess that's in the stream.
1372      */
1373     qemu_get_buffer(f, vdev->config, MIN(config_len, vdev->config_len));
1374 
1375     while (config_len > vdev->config_len) {
1376         qemu_get_byte(f);
1377         config_len--;
1378     }
1379 
1380     num = qemu_get_be32(f);
1381 
1382     if (num > VIRTIO_QUEUE_MAX) {
1383         error_report("Invalid number of virtqueues: 0x%x", num);
1384         return -1;
1385     }
1386 
1387     for (i = 0; i < num; i++) {
1388         vdev->vq[i].vring.num = qemu_get_be32(f);
1389         if (k->has_variable_vring_alignment) {
1390             vdev->vq[i].vring.align = qemu_get_be32(f);
1391         }
1392         vdev->vq[i].vring.desc = qemu_get_be64(f);
1393         qemu_get_be16s(f, &vdev->vq[i].last_avail_idx);
1394         vdev->vq[i].signalled_used_valid = false;
1395         vdev->vq[i].notification = true;
1396 
1397         if (vdev->vq[i].vring.desc) {
1398             /* XXX virtio-1 devices */
1399             virtio_queue_update_rings(vdev, i);
1400         } else if (vdev->vq[i].last_avail_idx) {
1401             error_report("VQ %d address 0x0 "
1402                          "inconsistent with Host index 0x%x",
1403                          i, vdev->vq[i].last_avail_idx);
1404                 return -1;
1405 	}
1406         if (k->load_queue) {
1407             ret = k->load_queue(qbus->parent, i, f);
1408             if (ret)
1409                 return ret;
1410         }
1411     }
1412 
1413     virtio_notify_vector(vdev, VIRTIO_NO_VECTOR);
1414 
1415     if (vdc->load != NULL) {
1416         ret = vdc->load(vdev, f, version_id);
1417         if (ret) {
1418             return ret;
1419         }
1420     }
1421 
1422     /* Subsections */
1423     ret = vmstate_load_state(f, &vmstate_virtio, vdev, 1);
1424     if (ret) {
1425         return ret;
1426     }
1427 
1428     if (vdev->device_endian == VIRTIO_DEVICE_ENDIAN_UNKNOWN) {
1429         vdev->device_endian = virtio_default_endian();
1430     }
1431 
1432     if (virtio_64bit_features_needed(vdev)) {
1433         /*
1434          * Subsection load filled vdev->guest_features.  Run them
1435          * through virtio_set_features to sanity-check them against
1436          * host_features.
1437          */
1438         uint64_t features64 = vdev->guest_features;
1439         if (virtio_set_features_nocheck(vdev, features64) < 0) {
1440             error_report("Features 0x%" PRIx64 " unsupported. "
1441                          "Allowed features: 0x%" PRIx64,
1442                          features64, vdev->host_features);
1443             return -1;
1444         }
1445     } else {
1446         if (virtio_set_features_nocheck(vdev, features) < 0) {
1447             error_report("Features 0x%x unsupported. "
1448                          "Allowed features: 0x%" PRIx64,
1449                          features, vdev->host_features);
1450             return -1;
1451         }
1452     }
1453 
1454     for (i = 0; i < num; i++) {
1455         if (vdev->vq[i].vring.desc) {
1456             uint16_t nheads;
1457             nheads = vring_avail_idx(&vdev->vq[i]) - vdev->vq[i].last_avail_idx;
1458             /* Check it isn't doing strange things with descriptor numbers. */
1459             if (nheads > vdev->vq[i].vring.num) {
1460                 error_report("VQ %d size 0x%x Guest index 0x%x "
1461                              "inconsistent with Host index 0x%x: delta 0x%x",
1462                              i, vdev->vq[i].vring.num,
1463                              vring_avail_idx(&vdev->vq[i]),
1464                              vdev->vq[i].last_avail_idx, nheads);
1465                 return -1;
1466             }
1467         }
1468     }
1469 
1470     return 0;
1471 }
1472 
1473 void virtio_cleanup(VirtIODevice *vdev)
1474 {
1475     qemu_del_vm_change_state_handler(vdev->vmstate);
1476     g_free(vdev->config);
1477     g_free(vdev->vq);
1478     g_free(vdev->vector_queues);
1479 }
1480 
1481 static void virtio_vmstate_change(void *opaque, int running, RunState state)
1482 {
1483     VirtIODevice *vdev = opaque;
1484     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
1485     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1486     bool backend_run = running && (vdev->status & VIRTIO_CONFIG_S_DRIVER_OK);
1487     vdev->vm_running = running;
1488 
1489     if (backend_run) {
1490         virtio_set_status(vdev, vdev->status);
1491     }
1492 
1493     if (k->vmstate_change) {
1494         k->vmstate_change(qbus->parent, backend_run);
1495     }
1496 
1497     if (!backend_run) {
1498         virtio_set_status(vdev, vdev->status);
1499     }
1500 }
1501 
1502 void virtio_instance_init_common(Object *proxy_obj, void *data,
1503                                  size_t vdev_size, const char *vdev_name)
1504 {
1505     DeviceState *vdev = data;
1506 
1507     object_initialize(vdev, vdev_size, vdev_name);
1508     object_property_add_child(proxy_obj, "virtio-backend", OBJECT(vdev), NULL);
1509     object_unref(OBJECT(vdev));
1510     qdev_alias_all_properties(vdev, proxy_obj);
1511 }
1512 
1513 void virtio_init(VirtIODevice *vdev, const char *name,
1514                  uint16_t device_id, size_t config_size)
1515 {
1516     BusState *qbus = qdev_get_parent_bus(DEVICE(vdev));
1517     VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(qbus);
1518     int i;
1519     int nvectors = k->query_nvectors ? k->query_nvectors(qbus->parent) : 0;
1520 
1521     if (nvectors) {
1522         vdev->vector_queues =
1523             g_malloc0(sizeof(*vdev->vector_queues) * nvectors);
1524     }
1525 
1526     vdev->device_id = device_id;
1527     vdev->status = 0;
1528     vdev->isr = 0;
1529     vdev->queue_sel = 0;
1530     vdev->config_vector = VIRTIO_NO_VECTOR;
1531     vdev->vq = g_malloc0(sizeof(VirtQueue) * VIRTIO_QUEUE_MAX);
1532     vdev->vm_running = runstate_is_running();
1533     for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
1534         vdev->vq[i].vector = VIRTIO_NO_VECTOR;
1535         vdev->vq[i].vdev = vdev;
1536         vdev->vq[i].queue_index = i;
1537     }
1538 
1539     vdev->name = name;
1540     vdev->config_len = config_size;
1541     if (vdev->config_len) {
1542         vdev->config = g_malloc0(config_size);
1543     } else {
1544         vdev->config = NULL;
1545     }
1546     vdev->vmstate = qemu_add_vm_change_state_handler(virtio_vmstate_change,
1547                                                      vdev);
1548     vdev->device_endian = virtio_default_endian();
1549 }
1550 
1551 hwaddr virtio_queue_get_desc_addr(VirtIODevice *vdev, int n)
1552 {
1553     return vdev->vq[n].vring.desc;
1554 }
1555 
1556 hwaddr virtio_queue_get_avail_addr(VirtIODevice *vdev, int n)
1557 {
1558     return vdev->vq[n].vring.avail;
1559 }
1560 
1561 hwaddr virtio_queue_get_used_addr(VirtIODevice *vdev, int n)
1562 {
1563     return vdev->vq[n].vring.used;
1564 }
1565 
1566 hwaddr virtio_queue_get_ring_addr(VirtIODevice *vdev, int n)
1567 {
1568     return vdev->vq[n].vring.desc;
1569 }
1570 
1571 hwaddr virtio_queue_get_desc_size(VirtIODevice *vdev, int n)
1572 {
1573     return sizeof(VRingDesc) * vdev->vq[n].vring.num;
1574 }
1575 
1576 hwaddr virtio_queue_get_avail_size(VirtIODevice *vdev, int n)
1577 {
1578     return offsetof(VRingAvail, ring) +
1579         sizeof(uint16_t) * vdev->vq[n].vring.num;
1580 }
1581 
1582 hwaddr virtio_queue_get_used_size(VirtIODevice *vdev, int n)
1583 {
1584     return offsetof(VRingUsed, ring) +
1585         sizeof(VRingUsedElem) * vdev->vq[n].vring.num;
1586 }
1587 
1588 hwaddr virtio_queue_get_ring_size(VirtIODevice *vdev, int n)
1589 {
1590     return vdev->vq[n].vring.used - vdev->vq[n].vring.desc +
1591 	    virtio_queue_get_used_size(vdev, n);
1592 }
1593 
1594 uint16_t virtio_queue_get_last_avail_idx(VirtIODevice *vdev, int n)
1595 {
1596     return vdev->vq[n].last_avail_idx;
1597 }
1598 
1599 void virtio_queue_set_last_avail_idx(VirtIODevice *vdev, int n, uint16_t idx)
1600 {
1601     vdev->vq[n].last_avail_idx = idx;
1602 }
1603 
1604 void virtio_queue_invalidate_signalled_used(VirtIODevice *vdev, int n)
1605 {
1606     vdev->vq[n].signalled_used_valid = false;
1607 }
1608 
1609 VirtQueue *virtio_get_queue(VirtIODevice *vdev, int n)
1610 {
1611     return vdev->vq + n;
1612 }
1613 
1614 uint16_t virtio_get_queue_index(VirtQueue *vq)
1615 {
1616     return vq->queue_index;
1617 }
1618 
1619 static void virtio_queue_guest_notifier_read(EventNotifier *n)
1620 {
1621     VirtQueue *vq = container_of(n, VirtQueue, guest_notifier);
1622     if (event_notifier_test_and_clear(n)) {
1623         virtio_irq(vq);
1624     }
1625 }
1626 
1627 void virtio_queue_set_guest_notifier_fd_handler(VirtQueue *vq, bool assign,
1628                                                 bool with_irqfd)
1629 {
1630     if (assign && !with_irqfd) {
1631         event_notifier_set_handler(&vq->guest_notifier,
1632                                    virtio_queue_guest_notifier_read);
1633     } else {
1634         event_notifier_set_handler(&vq->guest_notifier, NULL);
1635     }
1636     if (!assign) {
1637         /* Test and clear notifier before closing it,
1638          * in case poll callback didn't have time to run. */
1639         virtio_queue_guest_notifier_read(&vq->guest_notifier);
1640     }
1641 }
1642 
1643 EventNotifier *virtio_queue_get_guest_notifier(VirtQueue *vq)
1644 {
1645     return &vq->guest_notifier;
1646 }
1647 
1648 static void virtio_queue_host_notifier_read(EventNotifier *n)
1649 {
1650     VirtQueue *vq = container_of(n, VirtQueue, host_notifier);
1651     if (event_notifier_test_and_clear(n)) {
1652         virtio_queue_notify_vq(vq);
1653     }
1654 }
1655 
1656 void virtio_queue_set_host_notifier_fd_handler(VirtQueue *vq, bool assign,
1657                                                bool set_handler)
1658 {
1659     if (assign && set_handler) {
1660         event_notifier_set_handler(&vq->host_notifier,
1661                                    virtio_queue_host_notifier_read);
1662     } else {
1663         event_notifier_set_handler(&vq->host_notifier, NULL);
1664     }
1665     if (!assign) {
1666         /* Test and clear notifier before after disabling event,
1667          * in case poll callback didn't have time to run. */
1668         virtio_queue_host_notifier_read(&vq->host_notifier);
1669     }
1670 }
1671 
1672 EventNotifier *virtio_queue_get_host_notifier(VirtQueue *vq)
1673 {
1674     return &vq->host_notifier;
1675 }
1676 
1677 void virtio_device_set_child_bus_name(VirtIODevice *vdev, char *bus_name)
1678 {
1679     g_free(vdev->bus_name);
1680     vdev->bus_name = g_strdup(bus_name);
1681 }
1682 
1683 static void virtio_device_realize(DeviceState *dev, Error **errp)
1684 {
1685     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
1686     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
1687     Error *err = NULL;
1688 
1689     if (vdc->realize != NULL) {
1690         vdc->realize(dev, &err);
1691         if (err != NULL) {
1692             error_propagate(errp, err);
1693             return;
1694         }
1695     }
1696 
1697     virtio_bus_device_plugged(vdev, &err);
1698     if (err != NULL) {
1699         error_propagate(errp, err);
1700         return;
1701     }
1702 }
1703 
1704 static void virtio_device_unrealize(DeviceState *dev, Error **errp)
1705 {
1706     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
1707     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
1708     Error *err = NULL;
1709 
1710     virtio_bus_device_unplugged(vdev);
1711 
1712     if (vdc->unrealize != NULL) {
1713         vdc->unrealize(dev, &err);
1714         if (err != NULL) {
1715             error_propagate(errp, err);
1716             return;
1717         }
1718     }
1719 
1720     g_free(vdev->bus_name);
1721     vdev->bus_name = NULL;
1722 }
1723 
/*
 * qdev properties shared by every virtio device: the common feature
 * properties, backed by the host_features field of VirtIODevice.
 */
static Property virtio_properties[] = {
    DEFINE_VIRTIO_COMMON_FEATURES(VirtIODevice, host_features),
    DEFINE_PROP_END_OF_LIST(),
};
1728 
1729 static void virtio_device_class_init(ObjectClass *klass, void *data)
1730 {
1731     /* Set the default value here. */
1732     DeviceClass *dc = DEVICE_CLASS(klass);
1733 
1734     dc->realize = virtio_device_realize;
1735     dc->unrealize = virtio_device_unrealize;
1736     dc->bus_type = TYPE_VIRTIO_BUS;
1737     dc->props = virtio_properties;
1738 }
1739 
1740 static const TypeInfo virtio_device_info = {
1741     .name = TYPE_VIRTIO_DEVICE,
1742     .parent = TYPE_DEVICE,
1743     .instance_size = sizeof(VirtIODevice),
1744     .class_init = virtio_device_class_init,
1745     .abstract = true,
1746     .class_size = sizeof(VirtioDeviceClass),
1747 };
1748 
/* Register the abstract virtio device type described by virtio_device_info. */
static void virtio_register_types(void)
{
    type_register_static(&virtio_device_info);
}

/* Hand virtio_register_types() to the type_init() registration macro. */
type_init(virtio_register_types)
1755