xref: /openbmc/qemu/hw/net/virtio-net.c (revision edc243851279e3393000b28b6b69454cae1190ef)
/*
 * Virtio Network Device
 *
 * Copyright IBM, Corp. 2007
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */
136e790746SPaolo Bonzini 
146e790746SPaolo Bonzini #include "qemu/iov.h"
156e790746SPaolo Bonzini #include "hw/virtio/virtio.h"
166e790746SPaolo Bonzini #include "net/net.h"
176e790746SPaolo Bonzini #include "net/checksum.h"
186e790746SPaolo Bonzini #include "net/tap.h"
196e790746SPaolo Bonzini #include "qemu/error-report.h"
206e790746SPaolo Bonzini #include "qemu/timer.h"
216e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h"
226e790746SPaolo Bonzini #include "net/vhost_net.h"
2317ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h"
24b1be4280SAmos Kong #include "qapi/qmp/qjson.h"
25b1be4280SAmos Kong #include "monitor/monitor.h"
266e790746SPaolo Bonzini 
/* Version number of this device (its consumer is outside this excerpt). */
#define VIRTIO_NET_VM_VERSION    11

/* Capacity of the MAC filter table, counted in addresses. */
#define MAC_TABLE_ENTRIES    64
/* Number of VLAN ids tracked by the VLAN bitmap (per the 802.1Q definition). */
#define MAX_VLAN    (1 << 12)
316e790746SPaolo Bonzini 
/*
 * endof(type, member): offset of 'member' within 'type' plus the size of
 * 'member', i.e. the number of bytes of 'type' up to and including it.
 */
#define endof(type, member) \
    (offsetof(type, member) + sizeof(((type *)0)->member))
386e790746SPaolo Bonzini 
/*
 * Pairs a feature bit mask with a byte count.  In the table that follows,
 * 'end' is filled with endof() of a struct virtio_net_config field.
 */
typedef struct VirtIOFeature {
    uint32_t flags;     /* feature bit mask */
    size_t end;         /* number of config bytes up to and including a field */
} VirtIOFeature;
436e790746SPaolo Bonzini 
446e790746SPaolo Bonzini static VirtIOFeature feature_sizes[] = {
456e790746SPaolo Bonzini     {.flags = 1 << VIRTIO_NET_F_MAC,
466e790746SPaolo Bonzini      .end = endof(struct virtio_net_config, mac)},
476e790746SPaolo Bonzini     {.flags = 1 << VIRTIO_NET_F_STATUS,
486e790746SPaolo Bonzini      .end = endof(struct virtio_net_config, status)},
496e790746SPaolo Bonzini     {.flags = 1 << VIRTIO_NET_F_MQ,
506e790746SPaolo Bonzini      .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
516e790746SPaolo Bonzini     {}
526e790746SPaolo Bonzini };
536e790746SPaolo Bonzini 
546e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
556e790746SPaolo Bonzini {
566e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
576e790746SPaolo Bonzini 
586e790746SPaolo Bonzini     return &n->vqs[nc->queue_index];
596e790746SPaolo Bonzini }
606e790746SPaolo Bonzini 
/*
 * Halve a virtqueue index (integer division, truncating toward zero) to
 * obtain the index of the queue it belongs to.
 */
static int vq2q(int queue_index)
{
    const int divisor = 2;

    return queue_index / divisor;
}
656e790746SPaolo Bonzini 
/* TODO
 * - we could suppress RX interrupt if we were so inclined.
 */
696e790746SPaolo Bonzini 
706e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
716e790746SPaolo Bonzini {
7217a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
736e790746SPaolo Bonzini     struct virtio_net_config netcfg;
746e790746SPaolo Bonzini 
756e790746SPaolo Bonzini     stw_p(&netcfg.status, n->status);
766e790746SPaolo Bonzini     stw_p(&netcfg.max_virtqueue_pairs, n->max_queues);
776e790746SPaolo Bonzini     memcpy(netcfg.mac, n->mac, ETH_ALEN);
786e790746SPaolo Bonzini     memcpy(config, &netcfg, n->config_size);
796e790746SPaolo Bonzini }
806e790746SPaolo Bonzini 
816e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
826e790746SPaolo Bonzini {
8317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
846e790746SPaolo Bonzini     struct virtio_net_config netcfg = {};
856e790746SPaolo Bonzini 
866e790746SPaolo Bonzini     memcpy(&netcfg, config, n->config_size);
876e790746SPaolo Bonzini 
8817a0ca55SKONRAD Frederic     if (!(vdev->guest_features >> VIRTIO_NET_F_CTRL_MAC_ADDR & 1) &&
896e790746SPaolo Bonzini         memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
906e790746SPaolo Bonzini         memcpy(n->mac, netcfg.mac, ETH_ALEN);
916e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
926e790746SPaolo Bonzini     }
936e790746SPaolo Bonzini }
946e790746SPaolo Bonzini 
956e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status)
966e790746SPaolo Bonzini {
9717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
986e790746SPaolo Bonzini     return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
9917a0ca55SKONRAD Frederic         (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
1006e790746SPaolo Bonzini }
1016e790746SPaolo Bonzini 
1026e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
1036e790746SPaolo Bonzini {
10417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1056e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
1066e790746SPaolo Bonzini     int queues = n->multiqueue ? n->max_queues : 1;
1076e790746SPaolo Bonzini 
1086e790746SPaolo Bonzini     if (!nc->peer) {
1096e790746SPaolo Bonzini         return;
1106e790746SPaolo Bonzini     }
1116e790746SPaolo Bonzini     if (nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
1126e790746SPaolo Bonzini         return;
1136e790746SPaolo Bonzini     }
1146e790746SPaolo Bonzini 
1156e790746SPaolo Bonzini     if (!tap_get_vhost_net(nc->peer)) {
1166e790746SPaolo Bonzini         return;
1176e790746SPaolo Bonzini     }
1186e790746SPaolo Bonzini 
119d7108d90SJason Wang     if (!!n->vhost_started ==
120d7108d90SJason Wang         (virtio_net_started(n, status) && !nc->peer->link_down)) {
1216e790746SPaolo Bonzini         return;
1226e790746SPaolo Bonzini     }
1236e790746SPaolo Bonzini     if (!n->vhost_started) {
1246e790746SPaolo Bonzini         int r;
12517a0ca55SKONRAD Frederic         if (!vhost_net_query(tap_get_vhost_net(nc->peer), vdev)) {
1266e790746SPaolo Bonzini             return;
1276e790746SPaolo Bonzini         }
1286e790746SPaolo Bonzini         n->vhost_started = 1;
12917a0ca55SKONRAD Frederic         r = vhost_net_start(vdev, n->nic->ncs, queues);
1306e790746SPaolo Bonzini         if (r < 0) {
1316e790746SPaolo Bonzini             error_report("unable to start vhost net: %d: "
1326e790746SPaolo Bonzini                          "falling back on userspace virtio", -r);
1336e790746SPaolo Bonzini             n->vhost_started = 0;
1346e790746SPaolo Bonzini         }
1356e790746SPaolo Bonzini     } else {
13617a0ca55SKONRAD Frederic         vhost_net_stop(vdev, n->nic->ncs, queues);
1376e790746SPaolo Bonzini         n->vhost_started = 0;
1386e790746SPaolo Bonzini     }
1396e790746SPaolo Bonzini }
1406e790746SPaolo Bonzini 
1416e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
1426e790746SPaolo Bonzini {
14317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1446e790746SPaolo Bonzini     VirtIONetQueue *q;
1456e790746SPaolo Bonzini     int i;
1466e790746SPaolo Bonzini     uint8_t queue_status;
1476e790746SPaolo Bonzini 
1486e790746SPaolo Bonzini     virtio_net_vhost_status(n, status);
1496e790746SPaolo Bonzini 
1506e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
1516e790746SPaolo Bonzini         q = &n->vqs[i];
1526e790746SPaolo Bonzini 
1536e790746SPaolo Bonzini         if ((!n->multiqueue && i != 0) || i >= n->curr_queues) {
1546e790746SPaolo Bonzini             queue_status = 0;
1556e790746SPaolo Bonzini         } else {
1566e790746SPaolo Bonzini             queue_status = status;
1576e790746SPaolo Bonzini         }
1586e790746SPaolo Bonzini 
1596e790746SPaolo Bonzini         if (!q->tx_waiting) {
1606e790746SPaolo Bonzini             continue;
1616e790746SPaolo Bonzini         }
1626e790746SPaolo Bonzini 
1636e790746SPaolo Bonzini         if (virtio_net_started(n, queue_status) && !n->vhost_started) {
1646e790746SPaolo Bonzini             if (q->tx_timer) {
165bc72ad67SAlex Bligh                 timer_mod(q->tx_timer,
166bc72ad67SAlex Bligh                                qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
1676e790746SPaolo Bonzini             } else {
1686e790746SPaolo Bonzini                 qemu_bh_schedule(q->tx_bh);
1696e790746SPaolo Bonzini             }
1706e790746SPaolo Bonzini         } else {
1716e790746SPaolo Bonzini             if (q->tx_timer) {
172bc72ad67SAlex Bligh                 timer_del(q->tx_timer);
1736e790746SPaolo Bonzini             } else {
1746e790746SPaolo Bonzini                 qemu_bh_cancel(q->tx_bh);
1756e790746SPaolo Bonzini             }
1766e790746SPaolo Bonzini         }
1776e790746SPaolo Bonzini     }
1786e790746SPaolo Bonzini }
1796e790746SPaolo Bonzini 
1806e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc)
1816e790746SPaolo Bonzini {
1826e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
18317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1846e790746SPaolo Bonzini     uint16_t old_status = n->status;
1856e790746SPaolo Bonzini 
1866e790746SPaolo Bonzini     if (nc->link_down)
1876e790746SPaolo Bonzini         n->status &= ~VIRTIO_NET_S_LINK_UP;
1886e790746SPaolo Bonzini     else
1896e790746SPaolo Bonzini         n->status |= VIRTIO_NET_S_LINK_UP;
1906e790746SPaolo Bonzini 
1916e790746SPaolo Bonzini     if (n->status != old_status)
19217a0ca55SKONRAD Frederic         virtio_notify_config(vdev);
1936e790746SPaolo Bonzini 
19417a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
1956e790746SPaolo Bonzini }
1966e790746SPaolo Bonzini 
197b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc)
198b1be4280SAmos Kong {
199b1be4280SAmos Kong     QObject *event_data;
200b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
201b1be4280SAmos Kong 
202b1be4280SAmos Kong     if (nc->rxfilter_notify_enabled) {
20396e35046SAmos Kong         gchar *path = object_get_canonical_path(OBJECT(n->qdev));
204b1be4280SAmos Kong         if (n->netclient_name) {
205b1be4280SAmos Kong             event_data = qobject_from_jsonf("{ 'name': %s, 'path': %s }",
20696e35046SAmos Kong                                     n->netclient_name, path);
207b1be4280SAmos Kong         } else {
20896e35046SAmos Kong             event_data = qobject_from_jsonf("{ 'path': %s }", path);
209b1be4280SAmos Kong         }
210b1be4280SAmos Kong         monitor_protocol_event(QEVENT_NIC_RX_FILTER_CHANGED, event_data);
211b1be4280SAmos Kong         qobject_decref(event_data);
21296e35046SAmos Kong         g_free(path);
213b1be4280SAmos Kong 
214b1be4280SAmos Kong         /* disable event notification to avoid events flooding */
215b1be4280SAmos Kong         nc->rxfilter_notify_enabled = 0;
216b1be4280SAmos Kong     }
217b1be4280SAmos Kong }
218b1be4280SAmos Kong 
/*
 * Format the six bytes at 'mac' as a lower-case, colon-separated hex
 * string in a buffer newly allocated by g_strdup_printf().
 */
static char *mac_strdup_printf(const uint8_t *mac)
{
    return g_strdup_printf("%.2x:%.2x:%.2x:%.2x:%.2x:%.2x",
                           mac[0],
                           mac[1],
                           mac[2],
                           mac[3],
                           mac[4],
                           mac[5]);
}
224b1be4280SAmos Kong 
225f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n)
226f7bc8ef8SAmos Kong {
227f7bc8ef8SAmos Kong     intList *list, *entry;
228f7bc8ef8SAmos Kong     int i, j;
229f7bc8ef8SAmos Kong 
230f7bc8ef8SAmos Kong     list = NULL;
231f7bc8ef8SAmos Kong     for (i = 0; i < MAX_VLAN >> 5; i++) {
232f7bc8ef8SAmos Kong         for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
233f7bc8ef8SAmos Kong             if (n->vlans[i] & (1U << j)) {
234f7bc8ef8SAmos Kong                 entry = g_malloc0(sizeof(*entry));
235f7bc8ef8SAmos Kong                 entry->value = (i << 5) + j;
236f7bc8ef8SAmos Kong                 entry->next = list;
237f7bc8ef8SAmos Kong                 list = entry;
238f7bc8ef8SAmos Kong             }
239f7bc8ef8SAmos Kong         }
240f7bc8ef8SAmos Kong     }
241f7bc8ef8SAmos Kong 
242f7bc8ef8SAmos Kong     return list;
243f7bc8ef8SAmos Kong }
244f7bc8ef8SAmos Kong 
245b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
246b1be4280SAmos Kong {
247b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
248f7bc8ef8SAmos Kong     VirtIODevice *vdev = VIRTIO_DEVICE(n);
249b1be4280SAmos Kong     RxFilterInfo *info;
250b1be4280SAmos Kong     strList *str_list, *entry;
251f7bc8ef8SAmos Kong     int i;
252b1be4280SAmos Kong 
253b1be4280SAmos Kong     info = g_malloc0(sizeof(*info));
254b1be4280SAmos Kong     info->name = g_strdup(nc->name);
255b1be4280SAmos Kong     info->promiscuous = n->promisc;
256b1be4280SAmos Kong 
257b1be4280SAmos Kong     if (n->nouni) {
258b1be4280SAmos Kong         info->unicast = RX_STATE_NONE;
259b1be4280SAmos Kong     } else if (n->alluni) {
260b1be4280SAmos Kong         info->unicast = RX_STATE_ALL;
261b1be4280SAmos Kong     } else {
262b1be4280SAmos Kong         info->unicast = RX_STATE_NORMAL;
263b1be4280SAmos Kong     }
264b1be4280SAmos Kong 
265b1be4280SAmos Kong     if (n->nomulti) {
266b1be4280SAmos Kong         info->multicast = RX_STATE_NONE;
267b1be4280SAmos Kong     } else if (n->allmulti) {
268b1be4280SAmos Kong         info->multicast = RX_STATE_ALL;
269b1be4280SAmos Kong     } else {
270b1be4280SAmos Kong         info->multicast = RX_STATE_NORMAL;
271b1be4280SAmos Kong     }
272b1be4280SAmos Kong 
273b1be4280SAmos Kong     info->broadcast_allowed = n->nobcast;
274b1be4280SAmos Kong     info->multicast_overflow = n->mac_table.multi_overflow;
275b1be4280SAmos Kong     info->unicast_overflow = n->mac_table.uni_overflow;
276b1be4280SAmos Kong 
277b1be4280SAmos Kong     info->main_mac = mac_strdup_printf(n->mac);
278b1be4280SAmos Kong 
279b1be4280SAmos Kong     str_list = NULL;
280b1be4280SAmos Kong     for (i = 0; i < n->mac_table.first_multi; i++) {
281b1be4280SAmos Kong         entry = g_malloc0(sizeof(*entry));
282b1be4280SAmos Kong         entry->value = mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
283b1be4280SAmos Kong         entry->next = str_list;
284b1be4280SAmos Kong         str_list = entry;
285b1be4280SAmos Kong     }
286b1be4280SAmos Kong     info->unicast_table = str_list;
287b1be4280SAmos Kong 
288b1be4280SAmos Kong     str_list = NULL;
289b1be4280SAmos Kong     for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
290b1be4280SAmos Kong         entry = g_malloc0(sizeof(*entry));
291b1be4280SAmos Kong         entry->value = mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
292b1be4280SAmos Kong         entry->next = str_list;
293b1be4280SAmos Kong         str_list = entry;
294b1be4280SAmos Kong     }
295b1be4280SAmos Kong     info->multicast_table = str_list;
296f7bc8ef8SAmos Kong     info->vlan_table = get_vlan_table(n);
297b1be4280SAmos Kong 
298f7bc8ef8SAmos Kong     if (!((1 << VIRTIO_NET_F_CTRL_VLAN) & vdev->guest_features)) {
299f7bc8ef8SAmos Kong         info->vlan = RX_STATE_ALL;
300f7bc8ef8SAmos Kong     } else if (!info->vlan_table) {
301f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NONE;
302f7bc8ef8SAmos Kong     } else {
303f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NORMAL;
304b1be4280SAmos Kong     }
305b1be4280SAmos Kong 
306b1be4280SAmos Kong     /* enable event notification after query */
307b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
308b1be4280SAmos Kong 
309b1be4280SAmos Kong     return info;
310b1be4280SAmos Kong }
311b1be4280SAmos Kong 
3126e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev)
3136e790746SPaolo Bonzini {
31417a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
3156e790746SPaolo Bonzini 
3166e790746SPaolo Bonzini     /* Reset back to compatibility mode */
3176e790746SPaolo Bonzini     n->promisc = 1;
3186e790746SPaolo Bonzini     n->allmulti = 0;
3196e790746SPaolo Bonzini     n->alluni = 0;
3206e790746SPaolo Bonzini     n->nomulti = 0;
3216e790746SPaolo Bonzini     n->nouni = 0;
3226e790746SPaolo Bonzini     n->nobcast = 0;
3236e790746SPaolo Bonzini     /* multiqueue is disabled by default */
3246e790746SPaolo Bonzini     n->curr_queues = 1;
3256e790746SPaolo Bonzini 
3266e790746SPaolo Bonzini     /* Flush any MAC and VLAN filter table state */
3276e790746SPaolo Bonzini     n->mac_table.in_use = 0;
3286e790746SPaolo Bonzini     n->mac_table.first_multi = 0;
3296e790746SPaolo Bonzini     n->mac_table.multi_overflow = 0;
3306e790746SPaolo Bonzini     n->mac_table.uni_overflow = 0;
3316e790746SPaolo Bonzini     memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
3326e790746SPaolo Bonzini     memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
333702d66a8SMichael S. Tsirkin     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
3346e790746SPaolo Bonzini     memset(n->vlans, 0, MAX_VLAN >> 3);
3356e790746SPaolo Bonzini }
3366e790746SPaolo Bonzini 
3376e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n)
3386e790746SPaolo Bonzini {
3396e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
3406e790746SPaolo Bonzini     if (!nc->peer) {
3416e790746SPaolo Bonzini         return;
3426e790746SPaolo Bonzini     }
3436e790746SPaolo Bonzini 
344d6085e3aSStefan Hajnoczi     n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
3456e790746SPaolo Bonzini }
3466e790746SPaolo Bonzini 
3476e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n)
3486e790746SPaolo Bonzini {
3496e790746SPaolo Bonzini     return n->has_vnet_hdr;
3506e790746SPaolo Bonzini }
3516e790746SPaolo Bonzini 
3526e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n)
3536e790746SPaolo Bonzini {
3546e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n))
3556e790746SPaolo Bonzini         return 0;
3566e790746SPaolo Bonzini 
357d6085e3aSStefan Hajnoczi     n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
3586e790746SPaolo Bonzini 
3596e790746SPaolo Bonzini     return n->has_ufo;
3606e790746SPaolo Bonzini }
3616e790746SPaolo Bonzini 
3626e790746SPaolo Bonzini static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs)
3636e790746SPaolo Bonzini {
3646e790746SPaolo Bonzini     int i;
3656e790746SPaolo Bonzini     NetClientState *nc;
3666e790746SPaolo Bonzini 
3676e790746SPaolo Bonzini     n->mergeable_rx_bufs = mergeable_rx_bufs;
3686e790746SPaolo Bonzini 
3696e790746SPaolo Bonzini     n->guest_hdr_len = n->mergeable_rx_bufs ?
3706e790746SPaolo Bonzini         sizeof(struct virtio_net_hdr_mrg_rxbuf) : sizeof(struct virtio_net_hdr);
3716e790746SPaolo Bonzini 
3726e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
3736e790746SPaolo Bonzini         nc = qemu_get_subqueue(n->nic, i);
3746e790746SPaolo Bonzini 
3756e790746SPaolo Bonzini         if (peer_has_vnet_hdr(n) &&
376d6085e3aSStefan Hajnoczi             qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
377d6085e3aSStefan Hajnoczi             qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
3786e790746SPaolo Bonzini             n->host_hdr_len = n->guest_hdr_len;
3796e790746SPaolo Bonzini         }
3806e790746SPaolo Bonzini     }
3816e790746SPaolo Bonzini }
3826e790746SPaolo Bonzini 
3836e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index)
3846e790746SPaolo Bonzini {
3856e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
3866e790746SPaolo Bonzini 
3876e790746SPaolo Bonzini     if (!nc->peer) {
3886e790746SPaolo Bonzini         return 0;
3896e790746SPaolo Bonzini     }
3906e790746SPaolo Bonzini 
3916e790746SPaolo Bonzini     if (nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
3926e790746SPaolo Bonzini         return 0;
3936e790746SPaolo Bonzini     }
3946e790746SPaolo Bonzini 
3956e790746SPaolo Bonzini     return tap_enable(nc->peer);
3966e790746SPaolo Bonzini }
3976e790746SPaolo Bonzini 
3986e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index)
3996e790746SPaolo Bonzini {
4006e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
4016e790746SPaolo Bonzini 
4026e790746SPaolo Bonzini     if (!nc->peer) {
4036e790746SPaolo Bonzini         return 0;
4046e790746SPaolo Bonzini     }
4056e790746SPaolo Bonzini 
4066e790746SPaolo Bonzini     if (nc->peer->info->type !=  NET_CLIENT_OPTIONS_KIND_TAP) {
4076e790746SPaolo Bonzini         return 0;
4086e790746SPaolo Bonzini     }
4096e790746SPaolo Bonzini 
4106e790746SPaolo Bonzini     return tap_disable(nc->peer);
4116e790746SPaolo Bonzini }
4126e790746SPaolo Bonzini 
4136e790746SPaolo Bonzini static void virtio_net_set_queues(VirtIONet *n)
4146e790746SPaolo Bonzini {
4156e790746SPaolo Bonzini     int i;
416ddfa83eaSJoel Stanley     int r;
4176e790746SPaolo Bonzini 
4186e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
4196e790746SPaolo Bonzini         if (i < n->curr_queues) {
420ddfa83eaSJoel Stanley             r = peer_attach(n, i);
421ddfa83eaSJoel Stanley             assert(!r);
4226e790746SPaolo Bonzini         } else {
423ddfa83eaSJoel Stanley             r = peer_detach(n, i);
424ddfa83eaSJoel Stanley             assert(!r);
4256e790746SPaolo Bonzini         }
4266e790746SPaolo Bonzini     }
4276e790746SPaolo Bonzini }
4286e790746SPaolo Bonzini 
429ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
4306e790746SPaolo Bonzini 
4316e790746SPaolo Bonzini static uint32_t virtio_net_get_features(VirtIODevice *vdev, uint32_t features)
4326e790746SPaolo Bonzini {
43317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
4346e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
4356e790746SPaolo Bonzini 
4366e790746SPaolo Bonzini     features |= (1 << VIRTIO_NET_F_MAC);
4376e790746SPaolo Bonzini 
4386e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n)) {
4396e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_CSUM);
4406e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_HOST_TSO4);
4416e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_HOST_TSO6);
4426e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_HOST_ECN);
4436e790746SPaolo Bonzini 
4446e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_GUEST_CSUM);
4456e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_GUEST_TSO4);
4466e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_GUEST_TSO6);
4476e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_GUEST_ECN);
4486e790746SPaolo Bonzini     }
4496e790746SPaolo Bonzini 
4506e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
4516e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_GUEST_UFO);
4526e790746SPaolo Bonzini         features &= ~(0x1 << VIRTIO_NET_F_HOST_UFO);
4536e790746SPaolo Bonzini     }
4546e790746SPaolo Bonzini 
4556e790746SPaolo Bonzini     if (!nc->peer || nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
4566e790746SPaolo Bonzini         return features;
4576e790746SPaolo Bonzini     }
4586e790746SPaolo Bonzini     if (!tap_get_vhost_net(nc->peer)) {
4596e790746SPaolo Bonzini         return features;
4606e790746SPaolo Bonzini     }
4616e790746SPaolo Bonzini     return vhost_net_get_features(tap_get_vhost_net(nc->peer), features);
4626e790746SPaolo Bonzini }
4636e790746SPaolo Bonzini 
4646e790746SPaolo Bonzini static uint32_t virtio_net_bad_features(VirtIODevice *vdev)
4656e790746SPaolo Bonzini {
4666e790746SPaolo Bonzini     uint32_t features = 0;
4676e790746SPaolo Bonzini 
4686e790746SPaolo Bonzini     /* Linux kernel 2.6.25.  It understood MAC (as everyone must),
4696e790746SPaolo Bonzini      * but also these: */
4706e790746SPaolo Bonzini     features |= (1 << VIRTIO_NET_F_MAC);
4716e790746SPaolo Bonzini     features |= (1 << VIRTIO_NET_F_CSUM);
4726e790746SPaolo Bonzini     features |= (1 << VIRTIO_NET_F_HOST_TSO4);
4736e790746SPaolo Bonzini     features |= (1 << VIRTIO_NET_F_HOST_TSO6);
4746e790746SPaolo Bonzini     features |= (1 << VIRTIO_NET_F_HOST_ECN);
4756e790746SPaolo Bonzini 
4766e790746SPaolo Bonzini     return features;
4776e790746SPaolo Bonzini }
4786e790746SPaolo Bonzini 
479644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n)
480644c9858SDmitry Fleytman {
481ad37bb3bSStefan Hajnoczi     qemu_set_offload(qemu_get_queue(n->nic)->peer,
482644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
483644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
484644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
485644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
486644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
487644c9858SDmitry Fleytman }
488644c9858SDmitry Fleytman 
489644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
490644c9858SDmitry Fleytman {
491644c9858SDmitry Fleytman     static const uint64_t guest_offloads_mask =
492644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
493644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
494644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
495644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_ECN)  |
496644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_UFO);
497644c9858SDmitry Fleytman 
498644c9858SDmitry Fleytman     return guest_offloads_mask & features;
499644c9858SDmitry Fleytman }
500644c9858SDmitry Fleytman 
501644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
502644c9858SDmitry Fleytman {
503644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
504644c9858SDmitry Fleytman     return virtio_net_guest_offloads_by_features(vdev->guest_features);
505644c9858SDmitry Fleytman }
506644c9858SDmitry Fleytman 
5076e790746SPaolo Bonzini static void virtio_net_set_features(VirtIODevice *vdev, uint32_t features)
5086e790746SPaolo Bonzini {
50917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
5106e790746SPaolo Bonzini     int i;
5116e790746SPaolo Bonzini 
512ec57db16SJason Wang     virtio_net_set_multiqueue(n, !!(features & (1 << VIRTIO_NET_F_MQ)));
5136e790746SPaolo Bonzini 
5146e790746SPaolo Bonzini     virtio_net_set_mrg_rx_bufs(n, !!(features & (1 << VIRTIO_NET_F_MRG_RXBUF)));
5156e790746SPaolo Bonzini 
5166e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
517644c9858SDmitry Fleytman         n->curr_guest_offloads =
518644c9858SDmitry Fleytman             virtio_net_guest_offloads_by_features(features);
519644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
5206e790746SPaolo Bonzini     }
5216e790746SPaolo Bonzini 
5226e790746SPaolo Bonzini     for (i = 0;  i < n->max_queues; i++) {
5236e790746SPaolo Bonzini         NetClientState *nc = qemu_get_subqueue(n->nic, i);
5246e790746SPaolo Bonzini 
5256e790746SPaolo Bonzini         if (!nc->peer || nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
5266e790746SPaolo Bonzini             continue;
5276e790746SPaolo Bonzini         }
5286e790746SPaolo Bonzini         if (!tap_get_vhost_net(nc->peer)) {
5296e790746SPaolo Bonzini             continue;
5306e790746SPaolo Bonzini         }
5316e790746SPaolo Bonzini         vhost_net_ack_features(tap_get_vhost_net(nc->peer), features);
5326e790746SPaolo Bonzini     }
5330b1eaa88SStefan Fritsch 
5340b1eaa88SStefan Fritsch     if ((1 << VIRTIO_NET_F_CTRL_VLAN) & features) {
5350b1eaa88SStefan Fritsch         memset(n->vlans, 0, MAX_VLAN >> 3);
5360b1eaa88SStefan Fritsch     } else {
5370b1eaa88SStefan Fritsch         memset(n->vlans, 0xff, MAX_VLAN >> 3);
5380b1eaa88SStefan Fritsch     }
5396e790746SPaolo Bonzini }
5406e790746SPaolo Bonzini 
5416e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
5426e790746SPaolo Bonzini                                      struct iovec *iov, unsigned int iov_cnt)
5436e790746SPaolo Bonzini {
5446e790746SPaolo Bonzini     uint8_t on;
5456e790746SPaolo Bonzini     size_t s;
546b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
5476e790746SPaolo Bonzini 
5486e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
5496e790746SPaolo Bonzini     if (s != sizeof(on)) {
5506e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
5516e790746SPaolo Bonzini     }
5526e790746SPaolo Bonzini 
5536e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
5546e790746SPaolo Bonzini         n->promisc = on;
5556e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
5566e790746SPaolo Bonzini         n->allmulti = on;
5576e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
5586e790746SPaolo Bonzini         n->alluni = on;
5596e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
5606e790746SPaolo Bonzini         n->nomulti = on;
5616e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
5626e790746SPaolo Bonzini         n->nouni = on;
5636e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
5646e790746SPaolo Bonzini         n->nobcast = on;
5656e790746SPaolo Bonzini     } else {
5666e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
5676e790746SPaolo Bonzini     }
5686e790746SPaolo Bonzini 
569b1be4280SAmos Kong     rxfilter_notify(nc);
570b1be4280SAmos Kong 
5716e790746SPaolo Bonzini     return VIRTIO_NET_OK;
5726e790746SPaolo Bonzini }
5736e790746SPaolo Bonzini 
574644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
575644c9858SDmitry Fleytman                                      struct iovec *iov, unsigned int iov_cnt)
576644c9858SDmitry Fleytman {
577644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
578644c9858SDmitry Fleytman     uint64_t offloads;
579644c9858SDmitry Fleytman     size_t s;
580644c9858SDmitry Fleytman 
581644c9858SDmitry Fleytman     if (!((1 << VIRTIO_NET_F_CTRL_GUEST_OFFLOADS) & vdev->guest_features)) {
582644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
583644c9858SDmitry Fleytman     }
584644c9858SDmitry Fleytman 
585644c9858SDmitry Fleytman     s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
586644c9858SDmitry Fleytman     if (s != sizeof(offloads)) {
587644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
588644c9858SDmitry Fleytman     }
589644c9858SDmitry Fleytman 
590644c9858SDmitry Fleytman     if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
591644c9858SDmitry Fleytman         uint64_t supported_offloads;
592644c9858SDmitry Fleytman 
593644c9858SDmitry Fleytman         if (!n->has_vnet_hdr) {
594644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
595644c9858SDmitry Fleytman         }
596644c9858SDmitry Fleytman 
597644c9858SDmitry Fleytman         supported_offloads = virtio_net_supported_guest_offloads(n);
598644c9858SDmitry Fleytman         if (offloads & ~supported_offloads) {
599644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
600644c9858SDmitry Fleytman         }
601644c9858SDmitry Fleytman 
602644c9858SDmitry Fleytman         n->curr_guest_offloads = offloads;
603644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
604644c9858SDmitry Fleytman 
605644c9858SDmitry Fleytman         return VIRTIO_NET_OK;
606644c9858SDmitry Fleytman     } else {
607644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
608644c9858SDmitry Fleytman     }
609644c9858SDmitry Fleytman }
610644c9858SDmitry Fleytman 
6116e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
6126e790746SPaolo Bonzini                                  struct iovec *iov, unsigned int iov_cnt)
6136e790746SPaolo Bonzini {
6146e790746SPaolo Bonzini     struct virtio_net_ctrl_mac mac_data;
6156e790746SPaolo Bonzini     size_t s;
616b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
6176e790746SPaolo Bonzini 
6186e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
6196e790746SPaolo Bonzini         if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
6206e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
6216e790746SPaolo Bonzini         }
6226e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
6236e790746SPaolo Bonzini         assert(s == sizeof(n->mac));
6246e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
625b1be4280SAmos Kong         rxfilter_notify(nc);
626b1be4280SAmos Kong 
6276e790746SPaolo Bonzini         return VIRTIO_NET_OK;
6286e790746SPaolo Bonzini     }
6296e790746SPaolo Bonzini 
6306e790746SPaolo Bonzini     if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
6316e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
6326e790746SPaolo Bonzini     }
6336e790746SPaolo Bonzini 
634cae2e556SAmos Kong     int in_use = 0;
635cae2e556SAmos Kong     int first_multi = 0;
636cae2e556SAmos Kong     uint8_t uni_overflow = 0;
637cae2e556SAmos Kong     uint8_t multi_overflow = 0;
638cae2e556SAmos Kong     uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
6396e790746SPaolo Bonzini 
6406e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
6416e790746SPaolo Bonzini                    sizeof(mac_data.entries));
6426e790746SPaolo Bonzini     mac_data.entries = ldl_p(&mac_data.entries);
6436e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
644b1be4280SAmos Kong         goto error;
6456e790746SPaolo Bonzini     }
6466e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
6476e790746SPaolo Bonzini 
6486e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
649b1be4280SAmos Kong         goto error;
6506e790746SPaolo Bonzini     }
6516e790746SPaolo Bonzini 
6526e790746SPaolo Bonzini     if (mac_data.entries <= MAC_TABLE_ENTRIES) {
653cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, macs,
6546e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
6556e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
656b1be4280SAmos Kong             goto error;
6576e790746SPaolo Bonzini         }
658cae2e556SAmos Kong         in_use += mac_data.entries;
6596e790746SPaolo Bonzini     } else {
660cae2e556SAmos Kong         uni_overflow = 1;
6616e790746SPaolo Bonzini     }
6626e790746SPaolo Bonzini 
6636e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
6646e790746SPaolo Bonzini 
665cae2e556SAmos Kong     first_multi = in_use;
6666e790746SPaolo Bonzini 
6676e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
6686e790746SPaolo Bonzini                    sizeof(mac_data.entries));
6696e790746SPaolo Bonzini     mac_data.entries = ldl_p(&mac_data.entries);
6706e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
671b1be4280SAmos Kong         goto error;
6726e790746SPaolo Bonzini     }
6736e790746SPaolo Bonzini 
6746e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
6756e790746SPaolo Bonzini 
6766e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
677b1be4280SAmos Kong         goto error;
6786e790746SPaolo Bonzini     }
6796e790746SPaolo Bonzini 
680*edc24385SMichael S. Tsirkin     if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
681cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
6826e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
6836e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
684b1be4280SAmos Kong             goto error;
6856e790746SPaolo Bonzini         }
686cae2e556SAmos Kong         in_use += mac_data.entries;
6876e790746SPaolo Bonzini     } else {
688cae2e556SAmos Kong         multi_overflow = 1;
6896e790746SPaolo Bonzini     }
6906e790746SPaolo Bonzini 
691cae2e556SAmos Kong     n->mac_table.in_use = in_use;
692cae2e556SAmos Kong     n->mac_table.first_multi = first_multi;
693cae2e556SAmos Kong     n->mac_table.uni_overflow = uni_overflow;
694cae2e556SAmos Kong     n->mac_table.multi_overflow = multi_overflow;
695cae2e556SAmos Kong     memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
696cae2e556SAmos Kong     g_free(macs);
697b1be4280SAmos Kong     rxfilter_notify(nc);
698b1be4280SAmos Kong 
6996e790746SPaolo Bonzini     return VIRTIO_NET_OK;
700b1be4280SAmos Kong 
701b1be4280SAmos Kong error:
702cae2e556SAmos Kong     g_free(macs);
703b1be4280SAmos Kong     return VIRTIO_NET_ERR;
7046e790746SPaolo Bonzini }
7056e790746SPaolo Bonzini 
7066e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
7076e790746SPaolo Bonzini                                         struct iovec *iov, unsigned int iov_cnt)
7086e790746SPaolo Bonzini {
7096e790746SPaolo Bonzini     uint16_t vid;
7106e790746SPaolo Bonzini     size_t s;
711b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
7126e790746SPaolo Bonzini 
7136e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
7146e790746SPaolo Bonzini     vid = lduw_p(&vid);
7156e790746SPaolo Bonzini     if (s != sizeof(vid)) {
7166e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
7176e790746SPaolo Bonzini     }
7186e790746SPaolo Bonzini 
7196e790746SPaolo Bonzini     if (vid >= MAX_VLAN)
7206e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
7216e790746SPaolo Bonzini 
7226e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
7236e790746SPaolo Bonzini         n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
7246e790746SPaolo Bonzini     else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
7256e790746SPaolo Bonzini         n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
7266e790746SPaolo Bonzini     else
7276e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
7286e790746SPaolo Bonzini 
729b1be4280SAmos Kong     rxfilter_notify(nc);
730b1be4280SAmos Kong 
7316e790746SPaolo Bonzini     return VIRTIO_NET_OK;
7326e790746SPaolo Bonzini }
7336e790746SPaolo Bonzini 
7346e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
7356e790746SPaolo Bonzini                                 struct iovec *iov, unsigned int iov_cnt)
7366e790746SPaolo Bonzini {
73717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
7386e790746SPaolo Bonzini     struct virtio_net_ctrl_mq mq;
7396e790746SPaolo Bonzini     size_t s;
7406e790746SPaolo Bonzini     uint16_t queues;
7416e790746SPaolo Bonzini 
7426e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
7436e790746SPaolo Bonzini     if (s != sizeof(mq)) {
7446e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
7456e790746SPaolo Bonzini     }
7466e790746SPaolo Bonzini 
7476e790746SPaolo Bonzini     if (cmd != VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
7486e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
7496e790746SPaolo Bonzini     }
7506e790746SPaolo Bonzini 
7516e790746SPaolo Bonzini     queues = lduw_p(&mq.virtqueue_pairs);
7526e790746SPaolo Bonzini 
7536e790746SPaolo Bonzini     if (queues < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
7546e790746SPaolo Bonzini         queues > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
7556e790746SPaolo Bonzini         queues > n->max_queues ||
7566e790746SPaolo Bonzini         !n->multiqueue) {
7576e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
7586e790746SPaolo Bonzini     }
7596e790746SPaolo Bonzini 
7606e790746SPaolo Bonzini     n->curr_queues = queues;
7616e790746SPaolo Bonzini     /* stop the backend before changing the number of queues to avoid handling a
7626e790746SPaolo Bonzini      * disabled queue */
76317a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
7646e790746SPaolo Bonzini     virtio_net_set_queues(n);
7656e790746SPaolo Bonzini 
7666e790746SPaolo Bonzini     return VIRTIO_NET_OK;
7676e790746SPaolo Bonzini }
7686e790746SPaolo Bonzini static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
7696e790746SPaolo Bonzini {
77017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
7716e790746SPaolo Bonzini     struct virtio_net_ctrl_hdr ctrl;
7726e790746SPaolo Bonzini     virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
7736e790746SPaolo Bonzini     VirtQueueElement elem;
7746e790746SPaolo Bonzini     size_t s;
7756e790746SPaolo Bonzini     struct iovec *iov;
7766e790746SPaolo Bonzini     unsigned int iov_cnt;
7776e790746SPaolo Bonzini 
7786e790746SPaolo Bonzini     while (virtqueue_pop(vq, &elem)) {
7796e790746SPaolo Bonzini         if (iov_size(elem.in_sg, elem.in_num) < sizeof(status) ||
7806e790746SPaolo Bonzini             iov_size(elem.out_sg, elem.out_num) < sizeof(ctrl)) {
7816e790746SPaolo Bonzini             error_report("virtio-net ctrl missing headers");
7826e790746SPaolo Bonzini             exit(1);
7836e790746SPaolo Bonzini         }
7846e790746SPaolo Bonzini 
7856e790746SPaolo Bonzini         iov = elem.out_sg;
7866e790746SPaolo Bonzini         iov_cnt = elem.out_num;
7876e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl));
7886e790746SPaolo Bonzini         iov_discard_front(&iov, &iov_cnt, sizeof(ctrl));
7896e790746SPaolo Bonzini         if (s != sizeof(ctrl)) {
7906e790746SPaolo Bonzini             status = VIRTIO_NET_ERR;
7916e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
7926e790746SPaolo Bonzini             status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt);
7936e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
7946e790746SPaolo Bonzini             status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt);
7956e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
7966e790746SPaolo Bonzini             status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt);
7976e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
7986e790746SPaolo Bonzini             status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt);
799644c9858SDmitry Fleytman         } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
800644c9858SDmitry Fleytman             status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt);
8016e790746SPaolo Bonzini         }
8026e790746SPaolo Bonzini 
8036e790746SPaolo Bonzini         s = iov_from_buf(elem.in_sg, elem.in_num, 0, &status, sizeof(status));
8046e790746SPaolo Bonzini         assert(s == sizeof(status));
8056e790746SPaolo Bonzini 
8066e790746SPaolo Bonzini         virtqueue_push(vq, &elem, sizeof(status));
8076e790746SPaolo Bonzini         virtio_notify(vdev, vq);
8086e790746SPaolo Bonzini     }
8096e790746SPaolo Bonzini }
8106e790746SPaolo Bonzini 
8116e790746SPaolo Bonzini /* RX */
8126e790746SPaolo Bonzini 
8136e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
8146e790746SPaolo Bonzini {
81517a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
8166e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(vq));
8176e790746SPaolo Bonzini 
8186e790746SPaolo Bonzini     qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
8196e790746SPaolo Bonzini }
8206e790746SPaolo Bonzini 
8216e790746SPaolo Bonzini static int virtio_net_can_receive(NetClientState *nc)
8226e790746SPaolo Bonzini {
8236e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
82417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
8256e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
8266e790746SPaolo Bonzini 
82717a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
8286e790746SPaolo Bonzini         return 0;
8296e790746SPaolo Bonzini     }
8306e790746SPaolo Bonzini 
8316e790746SPaolo Bonzini     if (nc->queue_index >= n->curr_queues) {
8326e790746SPaolo Bonzini         return 0;
8336e790746SPaolo Bonzini     }
8346e790746SPaolo Bonzini 
8356e790746SPaolo Bonzini     if (!virtio_queue_ready(q->rx_vq) ||
83617a0ca55SKONRAD Frederic         !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
8376e790746SPaolo Bonzini         return 0;
8386e790746SPaolo Bonzini     }
8396e790746SPaolo Bonzini 
8406e790746SPaolo Bonzini     return 1;
8416e790746SPaolo Bonzini }
8426e790746SPaolo Bonzini 
8436e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
8446e790746SPaolo Bonzini {
8456e790746SPaolo Bonzini     VirtIONet *n = q->n;
8466e790746SPaolo Bonzini     if (virtio_queue_empty(q->rx_vq) ||
8476e790746SPaolo Bonzini         (n->mergeable_rx_bufs &&
8486e790746SPaolo Bonzini          !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
8496e790746SPaolo Bonzini         virtio_queue_set_notification(q->rx_vq, 1);
8506e790746SPaolo Bonzini 
8516e790746SPaolo Bonzini         /* To avoid a race condition where the guest has made some buffers
8526e790746SPaolo Bonzini          * available after the above check but before notification was
8536e790746SPaolo Bonzini          * enabled, check for available buffers again.
8546e790746SPaolo Bonzini          */
8556e790746SPaolo Bonzini         if (virtio_queue_empty(q->rx_vq) ||
8566e790746SPaolo Bonzini             (n->mergeable_rx_bufs &&
8576e790746SPaolo Bonzini              !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
8586e790746SPaolo Bonzini             return 0;
8596e790746SPaolo Bonzini         }
8606e790746SPaolo Bonzini     }
8616e790746SPaolo Bonzini 
8626e790746SPaolo Bonzini     virtio_queue_set_notification(q->rx_vq, 0);
8636e790746SPaolo Bonzini     return 1;
8646e790746SPaolo Bonzini }
8656e790746SPaolo Bonzini 
8666e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
8676e790746SPaolo Bonzini  * it never finds out that the packets don't have valid checksums.  This
8686e790746SPaolo Bonzini  * causes dhclient to get upset.  Fedora's carried a patch for ages to
8696e790746SPaolo Bonzini  * fix this with Xen but it hasn't appeared in an upstream release of
8706e790746SPaolo Bonzini  * dhclient yet.
8716e790746SPaolo Bonzini  *
8726e790746SPaolo Bonzini  * To avoid breaking existing guests, we catch udp packets and add
8736e790746SPaolo Bonzini  * checksums.  This is terrible but it's better than hacking the guest
8746e790746SPaolo Bonzini  * kernels.
8756e790746SPaolo Bonzini  *
8766e790746SPaolo Bonzini  * N.B. if we introduce a zero-copy API, this operation is no longer free so
8776e790746SPaolo Bonzini  * we should provide a mechanism to disable it to avoid polluting the host
8786e790746SPaolo Bonzini  * cache.
8796e790746SPaolo Bonzini  */
8806e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
8816e790746SPaolo Bonzini                                         uint8_t *buf, size_t size)
8826e790746SPaolo Bonzini {
8836e790746SPaolo Bonzini     if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
8846e790746SPaolo Bonzini         (size > 27 && size < 1500) && /* normal sized MTU */
8856e790746SPaolo Bonzini         (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
8866e790746SPaolo Bonzini         (buf[23] == 17) && /* ip.protocol == UDP */
8876e790746SPaolo Bonzini         (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
8886e790746SPaolo Bonzini         net_checksum_calculate(buf, size);
8896e790746SPaolo Bonzini         hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
8906e790746SPaolo Bonzini     }
8916e790746SPaolo Bonzini }
8926e790746SPaolo Bonzini 
8936e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
8946e790746SPaolo Bonzini                            const void *buf, size_t size)
8956e790746SPaolo Bonzini {
8966e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
8976e790746SPaolo Bonzini         /* FIXME this cast is evil */
8986e790746SPaolo Bonzini         void *wbuf = (void *)buf;
8996e790746SPaolo Bonzini         work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
9006e790746SPaolo Bonzini                                     size - n->host_hdr_len);
9016e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
9026e790746SPaolo Bonzini     } else {
9036e790746SPaolo Bonzini         struct virtio_net_hdr hdr = {
9046e790746SPaolo Bonzini             .flags = 0,
9056e790746SPaolo Bonzini             .gso_type = VIRTIO_NET_HDR_GSO_NONE
9066e790746SPaolo Bonzini         };
9076e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
9086e790746SPaolo Bonzini     }
9096e790746SPaolo Bonzini }
9106e790746SPaolo Bonzini 
9116e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
9126e790746SPaolo Bonzini {
9136e790746SPaolo Bonzini     static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
9146e790746SPaolo Bonzini     static const uint8_t vlan[] = {0x81, 0x00};
9156e790746SPaolo Bonzini     uint8_t *ptr = (uint8_t *)buf;
9166e790746SPaolo Bonzini     int i;
9176e790746SPaolo Bonzini 
9186e790746SPaolo Bonzini     if (n->promisc)
9196e790746SPaolo Bonzini         return 1;
9206e790746SPaolo Bonzini 
9216e790746SPaolo Bonzini     ptr += n->host_hdr_len;
9226e790746SPaolo Bonzini 
9236e790746SPaolo Bonzini     if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
9246e790746SPaolo Bonzini         int vid = be16_to_cpup((uint16_t *)(ptr + 14)) & 0xfff;
9256e790746SPaolo Bonzini         if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
9266e790746SPaolo Bonzini             return 0;
9276e790746SPaolo Bonzini     }
9286e790746SPaolo Bonzini 
9296e790746SPaolo Bonzini     if (ptr[0] & 1) { // multicast
9306e790746SPaolo Bonzini         if (!memcmp(ptr, bcast, sizeof(bcast))) {
9316e790746SPaolo Bonzini             return !n->nobcast;
9326e790746SPaolo Bonzini         } else if (n->nomulti) {
9336e790746SPaolo Bonzini             return 0;
9346e790746SPaolo Bonzini         } else if (n->allmulti || n->mac_table.multi_overflow) {
9356e790746SPaolo Bonzini             return 1;
9366e790746SPaolo Bonzini         }
9376e790746SPaolo Bonzini 
9386e790746SPaolo Bonzini         for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
9396e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
9406e790746SPaolo Bonzini                 return 1;
9416e790746SPaolo Bonzini             }
9426e790746SPaolo Bonzini         }
9436e790746SPaolo Bonzini     } else { // unicast
9446e790746SPaolo Bonzini         if (n->nouni) {
9456e790746SPaolo Bonzini             return 0;
9466e790746SPaolo Bonzini         } else if (n->alluni || n->mac_table.uni_overflow) {
9476e790746SPaolo Bonzini             return 1;
9486e790746SPaolo Bonzini         } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
9496e790746SPaolo Bonzini             return 1;
9506e790746SPaolo Bonzini         }
9516e790746SPaolo Bonzini 
9526e790746SPaolo Bonzini         for (i = 0; i < n->mac_table.first_multi; i++) {
9536e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
9546e790746SPaolo Bonzini                 return 1;
9556e790746SPaolo Bonzini             }
9566e790746SPaolo Bonzini         }
9576e790746SPaolo Bonzini     }
9586e790746SPaolo Bonzini 
9596e790746SPaolo Bonzini     return 0;
9606e790746SPaolo Bonzini }
9616e790746SPaolo Bonzini 
9626e790746SPaolo Bonzini static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, size_t size)
9636e790746SPaolo Bonzini {
9646e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
9656e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
96617a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
9676e790746SPaolo Bonzini     struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
9686e790746SPaolo Bonzini     struct virtio_net_hdr_mrg_rxbuf mhdr;
9696e790746SPaolo Bonzini     unsigned mhdr_cnt = 0;
9706e790746SPaolo Bonzini     size_t offset, i, guest_offset;
9716e790746SPaolo Bonzini 
9726e790746SPaolo Bonzini     if (!virtio_net_can_receive(nc)) {
9736e790746SPaolo Bonzini         return -1;
9746e790746SPaolo Bonzini     }
9756e790746SPaolo Bonzini 
9766e790746SPaolo Bonzini     /* hdr_len refers to the header we supply to the guest */
9776e790746SPaolo Bonzini     if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
9786e790746SPaolo Bonzini         return 0;
9796e790746SPaolo Bonzini     }
9806e790746SPaolo Bonzini 
9816e790746SPaolo Bonzini     if (!receive_filter(n, buf, size))
9826e790746SPaolo Bonzini         return size;
9836e790746SPaolo Bonzini 
9846e790746SPaolo Bonzini     offset = i = 0;
9856e790746SPaolo Bonzini 
9866e790746SPaolo Bonzini     while (offset < size) {
9876e790746SPaolo Bonzini         VirtQueueElement elem;
9886e790746SPaolo Bonzini         int len, total;
9896e790746SPaolo Bonzini         const struct iovec *sg = elem.in_sg;
9906e790746SPaolo Bonzini 
9916e790746SPaolo Bonzini         total = 0;
9926e790746SPaolo Bonzini 
9936e790746SPaolo Bonzini         if (virtqueue_pop(q->rx_vq, &elem) == 0) {
9946e790746SPaolo Bonzini             if (i == 0)
9956e790746SPaolo Bonzini                 return -1;
9966e790746SPaolo Bonzini             error_report("virtio-net unexpected empty queue: "
9976e790746SPaolo Bonzini                     "i %zd mergeable %d offset %zd, size %zd, "
9986e790746SPaolo Bonzini                     "guest hdr len %zd, host hdr len %zd guest features 0x%x",
9996e790746SPaolo Bonzini                     i, n->mergeable_rx_bufs, offset, size,
100017a0ca55SKONRAD Frederic                     n->guest_hdr_len, n->host_hdr_len, vdev->guest_features);
10016e790746SPaolo Bonzini             exit(1);
10026e790746SPaolo Bonzini         }
10036e790746SPaolo Bonzini 
10046e790746SPaolo Bonzini         if (elem.in_num < 1) {
10056e790746SPaolo Bonzini             error_report("virtio-net receive queue contains no in buffers");
10066e790746SPaolo Bonzini             exit(1);
10076e790746SPaolo Bonzini         }
10086e790746SPaolo Bonzini 
10096e790746SPaolo Bonzini         if (i == 0) {
10106e790746SPaolo Bonzini             assert(offset == 0);
10116e790746SPaolo Bonzini             if (n->mergeable_rx_bufs) {
10126e790746SPaolo Bonzini                 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
10136e790746SPaolo Bonzini                                     sg, elem.in_num,
10146e790746SPaolo Bonzini                                     offsetof(typeof(mhdr), num_buffers),
10156e790746SPaolo Bonzini                                     sizeof(mhdr.num_buffers));
10166e790746SPaolo Bonzini             }
10176e790746SPaolo Bonzini 
10186e790746SPaolo Bonzini             receive_header(n, sg, elem.in_num, buf, size);
10196e790746SPaolo Bonzini             offset = n->host_hdr_len;
10206e790746SPaolo Bonzini             total += n->guest_hdr_len;
10216e790746SPaolo Bonzini             guest_offset = n->guest_hdr_len;
10226e790746SPaolo Bonzini         } else {
10236e790746SPaolo Bonzini             guest_offset = 0;
10246e790746SPaolo Bonzini         }
10256e790746SPaolo Bonzini 
10266e790746SPaolo Bonzini         /* copy in packet.  ugh */
10276e790746SPaolo Bonzini         len = iov_from_buf(sg, elem.in_num, guest_offset,
10286e790746SPaolo Bonzini                            buf + offset, size - offset);
10296e790746SPaolo Bonzini         total += len;
10306e790746SPaolo Bonzini         offset += len;
10316e790746SPaolo Bonzini         /* If buffers can't be merged, at this point we
10326e790746SPaolo Bonzini          * must have consumed the complete packet.
10336e790746SPaolo Bonzini          * Otherwise, drop it. */
10346e790746SPaolo Bonzini         if (!n->mergeable_rx_bufs && offset < size) {
10356e790746SPaolo Bonzini #if 0
10366e790746SPaolo Bonzini             error_report("virtio-net truncated non-mergeable packet: "
10376e790746SPaolo Bonzini                          "i %zd mergeable %d offset %zd, size %zd, "
10386e790746SPaolo Bonzini                          "guest hdr len %zd, host hdr len %zd",
10396e790746SPaolo Bonzini                          i, n->mergeable_rx_bufs,
10406e790746SPaolo Bonzini                          offset, size, n->guest_hdr_len, n->host_hdr_len);
10416e790746SPaolo Bonzini #endif
10426e790746SPaolo Bonzini             return size;
10436e790746SPaolo Bonzini         }
10446e790746SPaolo Bonzini 
10456e790746SPaolo Bonzini         /* signal other side */
10466e790746SPaolo Bonzini         virtqueue_fill(q->rx_vq, &elem, total, i++);
10476e790746SPaolo Bonzini     }
10486e790746SPaolo Bonzini 
10496e790746SPaolo Bonzini     if (mhdr_cnt) {
10506e790746SPaolo Bonzini         stw_p(&mhdr.num_buffers, i);
10516e790746SPaolo Bonzini         iov_from_buf(mhdr_sg, mhdr_cnt,
10526e790746SPaolo Bonzini                      0,
10536e790746SPaolo Bonzini                      &mhdr.num_buffers, sizeof mhdr.num_buffers);
10546e790746SPaolo Bonzini     }
10556e790746SPaolo Bonzini 
10566e790746SPaolo Bonzini     virtqueue_flush(q->rx_vq, i);
105717a0ca55SKONRAD Frederic     virtio_notify(vdev, q->rx_vq);
10586e790746SPaolo Bonzini 
10596e790746SPaolo Bonzini     return size;
10606e790746SPaolo Bonzini }
10616e790746SPaolo Bonzini 
10626e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
10636e790746SPaolo Bonzini 
10646e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
10656e790746SPaolo Bonzini {
10666e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
10676e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
106817a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
10696e790746SPaolo Bonzini 
10706e790746SPaolo Bonzini     virtqueue_push(q->tx_vq, &q->async_tx.elem, 0);
107117a0ca55SKONRAD Frederic     virtio_notify(vdev, q->tx_vq);
10726e790746SPaolo Bonzini 
10736e790746SPaolo Bonzini     q->async_tx.elem.out_num = q->async_tx.len = 0;
10746e790746SPaolo Bonzini 
10756e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
10766e790746SPaolo Bonzini     virtio_net_flush_tx(q);
10776e790746SPaolo Bonzini }
10786e790746SPaolo Bonzini 
10796e790746SPaolo Bonzini /* TX */
10806e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
10816e790746SPaolo Bonzini {
10826e790746SPaolo Bonzini     VirtIONet *n = q->n;
108317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
10846e790746SPaolo Bonzini     VirtQueueElement elem;
10856e790746SPaolo Bonzini     int32_t num_packets = 0;
10866e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
108717a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
10886e790746SPaolo Bonzini         return num_packets;
10896e790746SPaolo Bonzini     }
10906e790746SPaolo Bonzini 
109117a0ca55SKONRAD Frederic     assert(vdev->vm_running);
10926e790746SPaolo Bonzini 
10936e790746SPaolo Bonzini     if (q->async_tx.elem.out_num) {
10946e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
10956e790746SPaolo Bonzini         return num_packets;
10966e790746SPaolo Bonzini     }
10976e790746SPaolo Bonzini 
10986e790746SPaolo Bonzini     while (virtqueue_pop(q->tx_vq, &elem)) {
10996e790746SPaolo Bonzini         ssize_t ret, len;
11006e790746SPaolo Bonzini         unsigned int out_num = elem.out_num;
11016e790746SPaolo Bonzini         struct iovec *out_sg = &elem.out_sg[0];
11026e790746SPaolo Bonzini         struct iovec sg[VIRTQUEUE_MAX_SIZE];
11036e790746SPaolo Bonzini 
11046e790746SPaolo Bonzini         if (out_num < 1) {
11056e790746SPaolo Bonzini             error_report("virtio-net header not in first element");
11066e790746SPaolo Bonzini             exit(1);
11076e790746SPaolo Bonzini         }
11086e790746SPaolo Bonzini 
11096e790746SPaolo Bonzini         /*
11106e790746SPaolo Bonzini          * If host wants to see the guest header as is, we can
11116e790746SPaolo Bonzini          * pass it on unchanged. Otherwise, copy just the parts
11126e790746SPaolo Bonzini          * that host is interested in.
11136e790746SPaolo Bonzini          */
11146e790746SPaolo Bonzini         assert(n->host_hdr_len <= n->guest_hdr_len);
11156e790746SPaolo Bonzini         if (n->host_hdr_len != n->guest_hdr_len) {
11166e790746SPaolo Bonzini             unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
11176e790746SPaolo Bonzini                                        out_sg, out_num,
11186e790746SPaolo Bonzini                                        0, n->host_hdr_len);
11196e790746SPaolo Bonzini             sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
11206e790746SPaolo Bonzini                              out_sg, out_num,
11216e790746SPaolo Bonzini                              n->guest_hdr_len, -1);
11226e790746SPaolo Bonzini             out_num = sg_num;
11236e790746SPaolo Bonzini             out_sg = sg;
11246e790746SPaolo Bonzini         }
11256e790746SPaolo Bonzini 
11266e790746SPaolo Bonzini         len = n->guest_hdr_len;
11276e790746SPaolo Bonzini 
11286e790746SPaolo Bonzini         ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
11296e790746SPaolo Bonzini                                       out_sg, out_num, virtio_net_tx_complete);
11306e790746SPaolo Bonzini         if (ret == 0) {
11316e790746SPaolo Bonzini             virtio_queue_set_notification(q->tx_vq, 0);
11326e790746SPaolo Bonzini             q->async_tx.elem = elem;
11336e790746SPaolo Bonzini             q->async_tx.len  = len;
11346e790746SPaolo Bonzini             return -EBUSY;
11356e790746SPaolo Bonzini         }
11366e790746SPaolo Bonzini 
11376e790746SPaolo Bonzini         len += ret;
11386e790746SPaolo Bonzini 
11396e790746SPaolo Bonzini         virtqueue_push(q->tx_vq, &elem, 0);
114017a0ca55SKONRAD Frederic         virtio_notify(vdev, q->tx_vq);
11416e790746SPaolo Bonzini 
11426e790746SPaolo Bonzini         if (++num_packets >= n->tx_burst) {
11436e790746SPaolo Bonzini             break;
11446e790746SPaolo Bonzini         }
11456e790746SPaolo Bonzini     }
11466e790746SPaolo Bonzini     return num_packets;
11476e790746SPaolo Bonzini }
11486e790746SPaolo Bonzini 
11496e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
11506e790746SPaolo Bonzini {
115117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
11526e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
11536e790746SPaolo Bonzini 
11546e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
115517a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
11566e790746SPaolo Bonzini         q->tx_waiting = 1;
11576e790746SPaolo Bonzini         return;
11586e790746SPaolo Bonzini     }
11596e790746SPaolo Bonzini 
11606e790746SPaolo Bonzini     if (q->tx_waiting) {
11616e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 1);
1162bc72ad67SAlex Bligh         timer_del(q->tx_timer);
11636e790746SPaolo Bonzini         q->tx_waiting = 0;
11646e790746SPaolo Bonzini         virtio_net_flush_tx(q);
11656e790746SPaolo Bonzini     } else {
1166bc72ad67SAlex Bligh         timer_mod(q->tx_timer,
1167bc72ad67SAlex Bligh                        qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
11686e790746SPaolo Bonzini         q->tx_waiting = 1;
11696e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 0);
11706e790746SPaolo Bonzini     }
11716e790746SPaolo Bonzini }
11726e790746SPaolo Bonzini 
11736e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
11746e790746SPaolo Bonzini {
117517a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
11766e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
11776e790746SPaolo Bonzini 
11786e790746SPaolo Bonzini     if (unlikely(q->tx_waiting)) {
11796e790746SPaolo Bonzini         return;
11806e790746SPaolo Bonzini     }
11816e790746SPaolo Bonzini     q->tx_waiting = 1;
11826e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
118317a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
11846e790746SPaolo Bonzini         return;
11856e790746SPaolo Bonzini     }
11866e790746SPaolo Bonzini     virtio_queue_set_notification(vq, 0);
11876e790746SPaolo Bonzini     qemu_bh_schedule(q->tx_bh);
11886e790746SPaolo Bonzini }
11896e790746SPaolo Bonzini 
11906e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque)
11916e790746SPaolo Bonzini {
11926e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
11936e790746SPaolo Bonzini     VirtIONet *n = q->n;
119417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
119517a0ca55SKONRAD Frederic     assert(vdev->vm_running);
11966e790746SPaolo Bonzini 
11976e790746SPaolo Bonzini     q->tx_waiting = 0;
11986e790746SPaolo Bonzini 
11996e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
120017a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
12016e790746SPaolo Bonzini         return;
120217a0ca55SKONRAD Frederic     }
12036e790746SPaolo Bonzini 
12046e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
12056e790746SPaolo Bonzini     virtio_net_flush_tx(q);
12066e790746SPaolo Bonzini }
12076e790746SPaolo Bonzini 
12086e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque)
12096e790746SPaolo Bonzini {
12106e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
12116e790746SPaolo Bonzini     VirtIONet *n = q->n;
121217a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
12136e790746SPaolo Bonzini     int32_t ret;
12146e790746SPaolo Bonzini 
121517a0ca55SKONRAD Frederic     assert(vdev->vm_running);
12166e790746SPaolo Bonzini 
12176e790746SPaolo Bonzini     q->tx_waiting = 0;
12186e790746SPaolo Bonzini 
12196e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
122017a0ca55SKONRAD Frederic     if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
12216e790746SPaolo Bonzini         return;
122217a0ca55SKONRAD Frederic     }
12236e790746SPaolo Bonzini 
12246e790746SPaolo Bonzini     ret = virtio_net_flush_tx(q);
12256e790746SPaolo Bonzini     if (ret == -EBUSY) {
12266e790746SPaolo Bonzini         return; /* Notification re-enable handled by tx_complete */
12276e790746SPaolo Bonzini     }
12286e790746SPaolo Bonzini 
12296e790746SPaolo Bonzini     /* If we flush a full burst of packets, assume there are
12306e790746SPaolo Bonzini      * more coming and immediately reschedule */
12316e790746SPaolo Bonzini     if (ret >= n->tx_burst) {
12326e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
12336e790746SPaolo Bonzini         q->tx_waiting = 1;
12346e790746SPaolo Bonzini         return;
12356e790746SPaolo Bonzini     }
12366e790746SPaolo Bonzini 
12376e790746SPaolo Bonzini     /* If less than a full burst, re-enable notification and flush
12386e790746SPaolo Bonzini      * anything that may have come in while we weren't looking.  If
12396e790746SPaolo Bonzini      * we find something, assume the guest is still active and reschedule */
12406e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
12416e790746SPaolo Bonzini     if (virtio_net_flush_tx(q) > 0) {
12426e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
12436e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
12446e790746SPaolo Bonzini         q->tx_waiting = 1;
12456e790746SPaolo Bonzini     }
12466e790746SPaolo Bonzini }
12476e790746SPaolo Bonzini 
1248ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
12496e790746SPaolo Bonzini {
125017a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
12516e790746SPaolo Bonzini     int i, max = multiqueue ? n->max_queues : 1;
12526e790746SPaolo Bonzini 
12536e790746SPaolo Bonzini     n->multiqueue = multiqueue;
12546e790746SPaolo Bonzini 
12556e790746SPaolo Bonzini     for (i = 2; i <= n->max_queues * 2 + 1; i++) {
12566e790746SPaolo Bonzini         virtio_del_queue(vdev, i);
12576e790746SPaolo Bonzini     }
12586e790746SPaolo Bonzini 
12596e790746SPaolo Bonzini     for (i = 1; i < max; i++) {
12606e790746SPaolo Bonzini         n->vqs[i].rx_vq = virtio_add_queue(vdev, 256, virtio_net_handle_rx);
12616e790746SPaolo Bonzini         if (n->vqs[i].tx_timer) {
12626e790746SPaolo Bonzini             n->vqs[i].tx_vq =
12636e790746SPaolo Bonzini                 virtio_add_queue(vdev, 256, virtio_net_handle_tx_timer);
1264bc72ad67SAlex Bligh             n->vqs[i].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
12656e790746SPaolo Bonzini                                                    virtio_net_tx_timer,
12666e790746SPaolo Bonzini                                                    &n->vqs[i]);
12676e790746SPaolo Bonzini         } else {
12686e790746SPaolo Bonzini             n->vqs[i].tx_vq =
12696e790746SPaolo Bonzini                 virtio_add_queue(vdev, 256, virtio_net_handle_tx_bh);
12706e790746SPaolo Bonzini             n->vqs[i].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[i]);
12716e790746SPaolo Bonzini         }
12726e790746SPaolo Bonzini 
12736e790746SPaolo Bonzini         n->vqs[i].tx_waiting = 0;
12746e790746SPaolo Bonzini         n->vqs[i].n = n;
12756e790746SPaolo Bonzini     }
12766e790746SPaolo Bonzini 
1277ec57db16SJason Wang     /* Note: Minux Guests (version 3.2.1) use ctrl vq but don't ack
1278ec57db16SJason Wang      * VIRTIO_NET_F_CTRL_VQ. Create ctrl vq unconditionally to avoid
1279ec57db16SJason Wang      * breaking them.
1280ec57db16SJason Wang      */
12816e790746SPaolo Bonzini     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
12826e790746SPaolo Bonzini 
12836e790746SPaolo Bonzini     virtio_net_set_queues(n);
12846e790746SPaolo Bonzini }
12856e790746SPaolo Bonzini 
12866e790746SPaolo Bonzini static void virtio_net_save(QEMUFile *f, void *opaque)
12876e790746SPaolo Bonzini {
12886e790746SPaolo Bonzini     int i;
12896e790746SPaolo Bonzini     VirtIONet *n = opaque;
129017a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
12916e790746SPaolo Bonzini 
12926e790746SPaolo Bonzini     /* At this point, backend must be stopped, otherwise
12936e790746SPaolo Bonzini      * it might keep writing to memory. */
12946e790746SPaolo Bonzini     assert(!n->vhost_started);
129517a0ca55SKONRAD Frederic     virtio_save(vdev, f);
12966e790746SPaolo Bonzini 
12976e790746SPaolo Bonzini     qemu_put_buffer(f, n->mac, ETH_ALEN);
12986e790746SPaolo Bonzini     qemu_put_be32(f, n->vqs[0].tx_waiting);
12996e790746SPaolo Bonzini     qemu_put_be32(f, n->mergeable_rx_bufs);
13006e790746SPaolo Bonzini     qemu_put_be16(f, n->status);
13016e790746SPaolo Bonzini     qemu_put_byte(f, n->promisc);
13026e790746SPaolo Bonzini     qemu_put_byte(f, n->allmulti);
13036e790746SPaolo Bonzini     qemu_put_be32(f, n->mac_table.in_use);
13046e790746SPaolo Bonzini     qemu_put_buffer(f, n->mac_table.macs, n->mac_table.in_use * ETH_ALEN);
13056e790746SPaolo Bonzini     qemu_put_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
13066e790746SPaolo Bonzini     qemu_put_be32(f, n->has_vnet_hdr);
13076e790746SPaolo Bonzini     qemu_put_byte(f, n->mac_table.multi_overflow);
13086e790746SPaolo Bonzini     qemu_put_byte(f, n->mac_table.uni_overflow);
13096e790746SPaolo Bonzini     qemu_put_byte(f, n->alluni);
13106e790746SPaolo Bonzini     qemu_put_byte(f, n->nomulti);
13116e790746SPaolo Bonzini     qemu_put_byte(f, n->nouni);
13126e790746SPaolo Bonzini     qemu_put_byte(f, n->nobcast);
13136e790746SPaolo Bonzini     qemu_put_byte(f, n->has_ufo);
13146e790746SPaolo Bonzini     if (n->max_queues > 1) {
13156e790746SPaolo Bonzini         qemu_put_be16(f, n->max_queues);
13166e790746SPaolo Bonzini         qemu_put_be16(f, n->curr_queues);
13176e790746SPaolo Bonzini         for (i = 1; i < n->curr_queues; i++) {
13186e790746SPaolo Bonzini             qemu_put_be32(f, n->vqs[i].tx_waiting);
13196e790746SPaolo Bonzini         }
13206e790746SPaolo Bonzini     }
1321644c9858SDmitry Fleytman 
1322644c9858SDmitry Fleytman     if ((1 << VIRTIO_NET_F_CTRL_GUEST_OFFLOADS) & vdev->guest_features) {
1323644c9858SDmitry Fleytman         qemu_put_be64(f, n->curr_guest_offloads);
1324644c9858SDmitry Fleytman     }
13256e790746SPaolo Bonzini }
13266e790746SPaolo Bonzini 
13276e790746SPaolo Bonzini static int virtio_net_load(QEMUFile *f, void *opaque, int version_id)
13286e790746SPaolo Bonzini {
13296e790746SPaolo Bonzini     VirtIONet *n = opaque;
133017a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
13316e790746SPaolo Bonzini     int ret, i, link_down;
13326e790746SPaolo Bonzini 
13336e790746SPaolo Bonzini     if (version_id < 2 || version_id > VIRTIO_NET_VM_VERSION)
13346e790746SPaolo Bonzini         return -EINVAL;
13356e790746SPaolo Bonzini 
133617a0ca55SKONRAD Frederic     ret = virtio_load(vdev, f);
13376e790746SPaolo Bonzini     if (ret) {
13386e790746SPaolo Bonzini         return ret;
13396e790746SPaolo Bonzini     }
13406e790746SPaolo Bonzini 
13416e790746SPaolo Bonzini     qemu_get_buffer(f, n->mac, ETH_ALEN);
13426e790746SPaolo Bonzini     n->vqs[0].tx_waiting = qemu_get_be32(f);
13436e790746SPaolo Bonzini 
13446e790746SPaolo Bonzini     virtio_net_set_mrg_rx_bufs(n, qemu_get_be32(f));
13456e790746SPaolo Bonzini 
13466e790746SPaolo Bonzini     if (version_id >= 3)
13476e790746SPaolo Bonzini         n->status = qemu_get_be16(f);
13486e790746SPaolo Bonzini 
13496e790746SPaolo Bonzini     if (version_id >= 4) {
13506e790746SPaolo Bonzini         if (version_id < 8) {
13516e790746SPaolo Bonzini             n->promisc = qemu_get_be32(f);
13526e790746SPaolo Bonzini             n->allmulti = qemu_get_be32(f);
13536e790746SPaolo Bonzini         } else {
13546e790746SPaolo Bonzini             n->promisc = qemu_get_byte(f);
13556e790746SPaolo Bonzini             n->allmulti = qemu_get_byte(f);
13566e790746SPaolo Bonzini         }
13576e790746SPaolo Bonzini     }
13586e790746SPaolo Bonzini 
13596e790746SPaolo Bonzini     if (version_id >= 5) {
13606e790746SPaolo Bonzini         n->mac_table.in_use = qemu_get_be32(f);
13616e790746SPaolo Bonzini         /* MAC_TABLE_ENTRIES may be different from the saved image */
13626e790746SPaolo Bonzini         if (n->mac_table.in_use <= MAC_TABLE_ENTRIES) {
13636e790746SPaolo Bonzini             qemu_get_buffer(f, n->mac_table.macs,
13646e790746SPaolo Bonzini                             n->mac_table.in_use * ETH_ALEN);
13656e790746SPaolo Bonzini         } else if (n->mac_table.in_use) {
13666e790746SPaolo Bonzini             uint8_t *buf = g_malloc0(n->mac_table.in_use);
13676e790746SPaolo Bonzini             qemu_get_buffer(f, buf, n->mac_table.in_use * ETH_ALEN);
13686e790746SPaolo Bonzini             g_free(buf);
13696e790746SPaolo Bonzini             n->mac_table.multi_overflow = n->mac_table.uni_overflow = 1;
13706e790746SPaolo Bonzini             n->mac_table.in_use = 0;
13716e790746SPaolo Bonzini         }
13726e790746SPaolo Bonzini     }
13736e790746SPaolo Bonzini 
13746e790746SPaolo Bonzini     if (version_id >= 6)
13756e790746SPaolo Bonzini         qemu_get_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
13766e790746SPaolo Bonzini 
13776e790746SPaolo Bonzini     if (version_id >= 7) {
13786e790746SPaolo Bonzini         if (qemu_get_be32(f) && !peer_has_vnet_hdr(n)) {
13796e790746SPaolo Bonzini             error_report("virtio-net: saved image requires vnet_hdr=on");
13806e790746SPaolo Bonzini             return -1;
13816e790746SPaolo Bonzini         }
13826e790746SPaolo Bonzini     }
13836e790746SPaolo Bonzini 
13846e790746SPaolo Bonzini     if (version_id >= 9) {
13856e790746SPaolo Bonzini         n->mac_table.multi_overflow = qemu_get_byte(f);
13866e790746SPaolo Bonzini         n->mac_table.uni_overflow = qemu_get_byte(f);
13876e790746SPaolo Bonzini     }
13886e790746SPaolo Bonzini 
13896e790746SPaolo Bonzini     if (version_id >= 10) {
13906e790746SPaolo Bonzini         n->alluni = qemu_get_byte(f);
13916e790746SPaolo Bonzini         n->nomulti = qemu_get_byte(f);
13926e790746SPaolo Bonzini         n->nouni = qemu_get_byte(f);
13936e790746SPaolo Bonzini         n->nobcast = qemu_get_byte(f);
13946e790746SPaolo Bonzini     }
13956e790746SPaolo Bonzini 
13966e790746SPaolo Bonzini     if (version_id >= 11) {
13976e790746SPaolo Bonzini         if (qemu_get_byte(f) && !peer_has_ufo(n)) {
13986e790746SPaolo Bonzini             error_report("virtio-net: saved image requires TUN_F_UFO support");
13996e790746SPaolo Bonzini             return -1;
14006e790746SPaolo Bonzini         }
14016e790746SPaolo Bonzini     }
14026e790746SPaolo Bonzini 
14036e790746SPaolo Bonzini     if (n->max_queues > 1) {
14046e790746SPaolo Bonzini         if (n->max_queues != qemu_get_be16(f)) {
14056e790746SPaolo Bonzini             error_report("virtio-net: different max_queues ");
14066e790746SPaolo Bonzini             return -1;
14076e790746SPaolo Bonzini         }
14086e790746SPaolo Bonzini 
14096e790746SPaolo Bonzini         n->curr_queues = qemu_get_be16(f);
14106e790746SPaolo Bonzini         for (i = 1; i < n->curr_queues; i++) {
14116e790746SPaolo Bonzini             n->vqs[i].tx_waiting = qemu_get_be32(f);
14126e790746SPaolo Bonzini         }
14136e790746SPaolo Bonzini     }
14146e790746SPaolo Bonzini 
1415644c9858SDmitry Fleytman     if ((1 << VIRTIO_NET_F_CTRL_GUEST_OFFLOADS) & vdev->guest_features) {
1416644c9858SDmitry Fleytman         n->curr_guest_offloads = qemu_get_be64(f);
1417644c9858SDmitry Fleytman     } else {
1418644c9858SDmitry Fleytman         n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
1419644c9858SDmitry Fleytman     }
1420644c9858SDmitry Fleytman 
1421644c9858SDmitry Fleytman     if (peer_has_vnet_hdr(n)) {
1422644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
1423644c9858SDmitry Fleytman     }
1424644c9858SDmitry Fleytman 
14256e790746SPaolo Bonzini     virtio_net_set_queues(n);
14266e790746SPaolo Bonzini 
14276e790746SPaolo Bonzini     /* Find the first multicast entry in the saved MAC filter */
14286e790746SPaolo Bonzini     for (i = 0; i < n->mac_table.in_use; i++) {
14296e790746SPaolo Bonzini         if (n->mac_table.macs[i * ETH_ALEN] & 1) {
14306e790746SPaolo Bonzini             break;
14316e790746SPaolo Bonzini         }
14326e790746SPaolo Bonzini     }
14336e790746SPaolo Bonzini     n->mac_table.first_multi = i;
14346e790746SPaolo Bonzini 
14356e790746SPaolo Bonzini     /* nc.link_down can't be migrated, so infer link_down according
14366e790746SPaolo Bonzini      * to link status bit in n->status */
14376e790746SPaolo Bonzini     link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
14386e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
14396e790746SPaolo Bonzini         qemu_get_subqueue(n->nic, i)->link_down = link_down;
14406e790746SPaolo Bonzini     }
14416e790746SPaolo Bonzini 
14426e790746SPaolo Bonzini     return 0;
14436e790746SPaolo Bonzini }
14446e790746SPaolo Bonzini 
14456e790746SPaolo Bonzini static void virtio_net_cleanup(NetClientState *nc)
14466e790746SPaolo Bonzini {
14476e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
14486e790746SPaolo Bonzini 
14496e790746SPaolo Bonzini     n->nic = NULL;
14506e790746SPaolo Bonzini }
14516e790746SPaolo Bonzini 
14526e790746SPaolo Bonzini static NetClientInfo net_virtio_info = {
14536e790746SPaolo Bonzini     .type = NET_CLIENT_OPTIONS_KIND_NIC,
14546e790746SPaolo Bonzini     .size = sizeof(NICState),
14556e790746SPaolo Bonzini     .can_receive = virtio_net_can_receive,
14566e790746SPaolo Bonzini     .receive = virtio_net_receive,
14576e790746SPaolo Bonzini     .cleanup = virtio_net_cleanup,
14586e790746SPaolo Bonzini     .link_status_changed = virtio_net_set_link_status,
1459b1be4280SAmos Kong     .query_rx_filter = virtio_net_query_rxfilter,
14606e790746SPaolo Bonzini };
14616e790746SPaolo Bonzini 
14626e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
14636e790746SPaolo Bonzini {
146417a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
14656e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
14666e790746SPaolo Bonzini     assert(n->vhost_started);
14676e790746SPaolo Bonzini     return vhost_net_virtqueue_pending(tap_get_vhost_net(nc->peer), idx);
14686e790746SPaolo Bonzini }
14696e790746SPaolo Bonzini 
14706e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
14716e790746SPaolo Bonzini                                            bool mask)
14726e790746SPaolo Bonzini {
147317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
14746e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
14756e790746SPaolo Bonzini     assert(n->vhost_started);
14766e790746SPaolo Bonzini     vhost_net_virtqueue_mask(tap_get_vhost_net(nc->peer),
14776e790746SPaolo Bonzini                              vdev, idx, mask);
14786e790746SPaolo Bonzini }
14796e790746SPaolo Bonzini 
148017ec5a86SKONRAD Frederic void virtio_net_set_config_size(VirtIONet *n, uint32_t host_features)
14816e790746SPaolo Bonzini {
14826e790746SPaolo Bonzini     int i, config_size = 0;
1483e9016ee2SJason Wang     host_features |= (1 << VIRTIO_NET_F_MAC);
14846e790746SPaolo Bonzini     for (i = 0; feature_sizes[i].flags != 0; i++) {
14856e790746SPaolo Bonzini         if (host_features & feature_sizes[i].flags) {
14866e790746SPaolo Bonzini             config_size = MAX(feature_sizes[i].end, config_size);
14876e790746SPaolo Bonzini         }
14886e790746SPaolo Bonzini     }
148917ec5a86SKONRAD Frederic     n->config_size = config_size;
149017ec5a86SKONRAD Frederic }
14916e790746SPaolo Bonzini 
14928a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
14938a253ec2SKONRAD Frederic                                    const char *type)
14948a253ec2SKONRAD Frederic {
14958a253ec2SKONRAD Frederic     /*
14968a253ec2SKONRAD Frederic      * The name can be NULL, the netclient name will be type.x.
14978a253ec2SKONRAD Frederic      */
14988a253ec2SKONRAD Frederic     assert(type != NULL);
14998a253ec2SKONRAD Frederic 
15008a253ec2SKONRAD Frederic     if (n->netclient_name) {
15018a253ec2SKONRAD Frederic         g_free(n->netclient_name);
15028a253ec2SKONRAD Frederic         n->netclient_name = NULL;
15038a253ec2SKONRAD Frederic     }
15048a253ec2SKONRAD Frederic     if (n->netclient_type) {
15058a253ec2SKONRAD Frederic         g_free(n->netclient_type);
15068a253ec2SKONRAD Frederic         n->netclient_type = NULL;
15078a253ec2SKONRAD Frederic     }
15088a253ec2SKONRAD Frederic 
15098a253ec2SKONRAD Frederic     if (name != NULL) {
15108a253ec2SKONRAD Frederic         n->netclient_name = g_strdup(name);
15118a253ec2SKONRAD Frederic     }
15128a253ec2SKONRAD Frederic     n->netclient_type = g_strdup(type);
15138a253ec2SKONRAD Frederic }
15148a253ec2SKONRAD Frederic 
1515e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp)
151617ec5a86SKONRAD Frederic {
1517e6f746b3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
1518284a32f0SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
1519284a32f0SAndreas Färber     NetClientState *nc;
15201773d9eeSKONRAD Frederic     int i;
152117ec5a86SKONRAD Frederic 
1522284a32f0SAndreas Färber     virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size);
152317ec5a86SKONRAD Frederic 
15241773d9eeSKONRAD Frederic     n->max_queues = MAX(n->nic_conf.queues, 1);
15256e790746SPaolo Bonzini     n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queues);
152617a0ca55SKONRAD Frederic     n->vqs[0].rx_vq = virtio_add_queue(vdev, 256, virtio_net_handle_rx);
15276e790746SPaolo Bonzini     n->curr_queues = 1;
15286e790746SPaolo Bonzini     n->vqs[0].n = n;
15291773d9eeSKONRAD Frederic     n->tx_timeout = n->net_conf.txtimer;
15306e790746SPaolo Bonzini 
15311773d9eeSKONRAD Frederic     if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
15321773d9eeSKONRAD Frederic                        && strcmp(n->net_conf.tx, "bh")) {
15336e790746SPaolo Bonzini         error_report("virtio-net: "
15346e790746SPaolo Bonzini                      "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
15351773d9eeSKONRAD Frederic                      n->net_conf.tx);
15366e790746SPaolo Bonzini         error_report("Defaulting to \"bh\"");
15376e790746SPaolo Bonzini     }
15386e790746SPaolo Bonzini 
15391773d9eeSKONRAD Frederic     if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
154017a0ca55SKONRAD Frederic         n->vqs[0].tx_vq = virtio_add_queue(vdev, 256,
15416e790746SPaolo Bonzini                                            virtio_net_handle_tx_timer);
1542bc72ad67SAlex Bligh         n->vqs[0].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, virtio_net_tx_timer,
15436e790746SPaolo Bonzini                                                &n->vqs[0]);
15446e790746SPaolo Bonzini     } else {
154517a0ca55SKONRAD Frederic         n->vqs[0].tx_vq = virtio_add_queue(vdev, 256,
15466e790746SPaolo Bonzini                                            virtio_net_handle_tx_bh);
15476e790746SPaolo Bonzini         n->vqs[0].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[0]);
15486e790746SPaolo Bonzini     }
154917a0ca55SKONRAD Frederic     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
15501773d9eeSKONRAD Frederic     qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
15511773d9eeSKONRAD Frederic     memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
15526e790746SPaolo Bonzini     n->status = VIRTIO_NET_S_LINK_UP;
15536e790746SPaolo Bonzini 
15548a253ec2SKONRAD Frederic     if (n->netclient_type) {
15558a253ec2SKONRAD Frederic         /*
15568a253ec2SKONRAD Frederic          * Happen when virtio_net_set_netclient_name has been called.
15578a253ec2SKONRAD Frederic          */
15588a253ec2SKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
15598a253ec2SKONRAD Frederic                               n->netclient_type, n->netclient_name, n);
15608a253ec2SKONRAD Frederic     } else {
15611773d9eeSKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
1562284a32f0SAndreas Färber                               object_get_typename(OBJECT(dev)), dev->id, n);
15638a253ec2SKONRAD Frederic     }
15648a253ec2SKONRAD Frederic 
15656e790746SPaolo Bonzini     peer_test_vnet_hdr(n);
15666e790746SPaolo Bonzini     if (peer_has_vnet_hdr(n)) {
15676e790746SPaolo Bonzini         for (i = 0; i < n->max_queues; i++) {
1568d6085e3aSStefan Hajnoczi             qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
15696e790746SPaolo Bonzini         }
15706e790746SPaolo Bonzini         n->host_hdr_len = sizeof(struct virtio_net_hdr);
15716e790746SPaolo Bonzini     } else {
15726e790746SPaolo Bonzini         n->host_hdr_len = 0;
15736e790746SPaolo Bonzini     }
15746e790746SPaolo Bonzini 
15751773d9eeSKONRAD Frederic     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
15766e790746SPaolo Bonzini 
15776e790746SPaolo Bonzini     n->vqs[0].tx_waiting = 0;
15781773d9eeSKONRAD Frederic     n->tx_burst = n->net_conf.txburst;
15796e790746SPaolo Bonzini     virtio_net_set_mrg_rx_bufs(n, 0);
15806e790746SPaolo Bonzini     n->promisc = 1; /* for compatibility */
15816e790746SPaolo Bonzini 
15826e790746SPaolo Bonzini     n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
15836e790746SPaolo Bonzini 
15846e790746SPaolo Bonzini     n->vlans = g_malloc0(MAX_VLAN >> 3);
15856e790746SPaolo Bonzini 
1586b1be4280SAmos Kong     nc = qemu_get_queue(n->nic);
1587b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
1588b1be4280SAmos Kong 
1589284a32f0SAndreas Färber     n->qdev = dev;
1590284a32f0SAndreas Färber     register_savevm(dev, "virtio-net", -1, VIRTIO_NET_VM_VERSION,
15916e790746SPaolo Bonzini                     virtio_net_save, virtio_net_load, n);
15926e790746SPaolo Bonzini 
1593284a32f0SAndreas Färber     add_boot_device_path(n->nic_conf.bootindex, dev, "/ethernet-phy@0");
159417ec5a86SKONRAD Frederic }
159517ec5a86SKONRAD Frederic 
1596306ec6c3SAndreas Färber static void virtio_net_device_unrealize(DeviceState *dev, Error **errp)
159717ec5a86SKONRAD Frederic {
1598306ec6c3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
1599306ec6c3SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
160017ec5a86SKONRAD Frederic     int i;
160117ec5a86SKONRAD Frederic 
160217ec5a86SKONRAD Frederic     /* This will stop vhost backend if appropriate. */
160317ec5a86SKONRAD Frederic     virtio_net_set_status(vdev, 0);
160417ec5a86SKONRAD Frederic 
1605306ec6c3SAndreas Färber     unregister_savevm(dev, "virtio-net", n);
160617ec5a86SKONRAD Frederic 
16078a253ec2SKONRAD Frederic     if (n->netclient_name) {
16088a253ec2SKONRAD Frederic         g_free(n->netclient_name);
16098a253ec2SKONRAD Frederic         n->netclient_name = NULL;
16108a253ec2SKONRAD Frederic     }
16118a253ec2SKONRAD Frederic     if (n->netclient_type) {
16128a253ec2SKONRAD Frederic         g_free(n->netclient_type);
16138a253ec2SKONRAD Frederic         n->netclient_type = NULL;
16148a253ec2SKONRAD Frederic     }
16158a253ec2SKONRAD Frederic 
161617ec5a86SKONRAD Frederic     g_free(n->mac_table.macs);
161717ec5a86SKONRAD Frederic     g_free(n->vlans);
161817ec5a86SKONRAD Frederic 
161917ec5a86SKONRAD Frederic     for (i = 0; i < n->max_queues; i++) {
162017ec5a86SKONRAD Frederic         VirtIONetQueue *q = &n->vqs[i];
162117ec5a86SKONRAD Frederic         NetClientState *nc = qemu_get_subqueue(n->nic, i);
162217ec5a86SKONRAD Frederic 
162317ec5a86SKONRAD Frederic         qemu_purge_queued_packets(nc);
162417ec5a86SKONRAD Frederic 
162517ec5a86SKONRAD Frederic         if (q->tx_timer) {
1626bc72ad67SAlex Bligh             timer_del(q->tx_timer);
1627bc72ad67SAlex Bligh             timer_free(q->tx_timer);
1628fe2dafa0SJason Wang         } else if (q->tx_bh) {
162917ec5a86SKONRAD Frederic             qemu_bh_delete(q->tx_bh);
163017ec5a86SKONRAD Frederic         }
163117ec5a86SKONRAD Frederic     }
163217ec5a86SKONRAD Frederic 
163317ec5a86SKONRAD Frederic     g_free(n->vqs);
163417ec5a86SKONRAD Frederic     qemu_del_nic(n->nic);
16356a1a8cc7SKONRAD Frederic     virtio_cleanup(vdev);
163617ec5a86SKONRAD Frederic }
163717ec5a86SKONRAD Frederic 
163817ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj)
163917ec5a86SKONRAD Frederic {
164017ec5a86SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(obj);
164117ec5a86SKONRAD Frederic 
164217ec5a86SKONRAD Frederic     /*
164317ec5a86SKONRAD Frederic      * The default config_size is sizeof(struct virtio_net_config).
164417ec5a86SKONRAD Frederic      * Can be overriden with virtio_net_set_config_size.
164517ec5a86SKONRAD Frederic      */
164617ec5a86SKONRAD Frederic     n->config_size = sizeof(struct virtio_net_config);
164717ec5a86SKONRAD Frederic }
164817ec5a86SKONRAD Frederic 
164917ec5a86SKONRAD Frederic static Property virtio_net_properties[] = {
165017ec5a86SKONRAD Frederic     DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
165117ec5a86SKONRAD Frederic     DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
165217ec5a86SKONRAD Frederic                                                TX_TIMER_INTERVAL),
165317ec5a86SKONRAD Frederic     DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
165417ec5a86SKONRAD Frederic     DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
165517ec5a86SKONRAD Frederic     DEFINE_PROP_END_OF_LIST(),
165617ec5a86SKONRAD Frederic };
165717ec5a86SKONRAD Frederic 
165817ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data)
165917ec5a86SKONRAD Frederic {
166017ec5a86SKONRAD Frederic     DeviceClass *dc = DEVICE_CLASS(klass);
166117ec5a86SKONRAD Frederic     VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
1662e6f746b3SAndreas Färber 
166317ec5a86SKONRAD Frederic     dc->props = virtio_net_properties;
1664125ee0edSMarcel Apfelbaum     set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
1665e6f746b3SAndreas Färber     vdc->realize = virtio_net_device_realize;
1666306ec6c3SAndreas Färber     vdc->unrealize = virtio_net_device_unrealize;
166717ec5a86SKONRAD Frederic     vdc->get_config = virtio_net_get_config;
166817ec5a86SKONRAD Frederic     vdc->set_config = virtio_net_set_config;
166917ec5a86SKONRAD Frederic     vdc->get_features = virtio_net_get_features;
167017ec5a86SKONRAD Frederic     vdc->set_features = virtio_net_set_features;
167117ec5a86SKONRAD Frederic     vdc->bad_features = virtio_net_bad_features;
167217ec5a86SKONRAD Frederic     vdc->reset = virtio_net_reset;
167317ec5a86SKONRAD Frederic     vdc->set_status = virtio_net_set_status;
167417ec5a86SKONRAD Frederic     vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
167517ec5a86SKONRAD Frederic     vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
167617ec5a86SKONRAD Frederic }
167717ec5a86SKONRAD Frederic 
167817ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = {
167917ec5a86SKONRAD Frederic     .name = TYPE_VIRTIO_NET,
168017ec5a86SKONRAD Frederic     .parent = TYPE_VIRTIO_DEVICE,
168117ec5a86SKONRAD Frederic     .instance_size = sizeof(VirtIONet),
168217ec5a86SKONRAD Frederic     .instance_init = virtio_net_instance_init,
168317ec5a86SKONRAD Frederic     .class_init = virtio_net_class_init,
168417ec5a86SKONRAD Frederic };
168517ec5a86SKONRAD Frederic 
168617ec5a86SKONRAD Frederic static void virtio_register_types(void)
168717ec5a86SKONRAD Frederic {
168817ec5a86SKONRAD Frederic     type_register_static(&virtio_net_info);
168917ec5a86SKONRAD Frederic }
169017ec5a86SKONRAD Frederic 
169117ec5a86SKONRAD Frederic type_init(virtio_register_types)
1692