xref: /openbmc/qemu/hw/net/virtio-net.c (revision f574633529926697ced51b6865e5c50bbb78bf1b)
/*
 * Virtio Network Device
 *
 * Copyright IBM, Corp. 2007
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */

136e790746SPaolo Bonzini 
149b8bfe21SPeter Maydell #include "qemu/osdep.h"
159711cd0dSJens Freimann #include "qemu/atomic.h"
166e790746SPaolo Bonzini #include "qemu/iov.h"
17db725815SMarkus Armbruster #include "qemu/main-loop.h"
180b8fa32fSMarkus Armbruster #include "qemu/module.h"
196e790746SPaolo Bonzini #include "hw/virtio/virtio.h"
206e790746SPaolo Bonzini #include "net/net.h"
216e790746SPaolo Bonzini #include "net/checksum.h"
226e790746SPaolo Bonzini #include "net/tap.h"
236e790746SPaolo Bonzini #include "qemu/error-report.h"
246e790746SPaolo Bonzini #include "qemu/timer.h"
259711cd0dSJens Freimann #include "qemu/option.h"
269711cd0dSJens Freimann #include "qemu/option_int.h"
279711cd0dSJens Freimann #include "qemu/config-file.h"
289711cd0dSJens Freimann #include "qapi/qmp/qdict.h"
296e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h"
306e790746SPaolo Bonzini #include "net/vhost_net.h"
319d8c6a25SDr. David Alan Gilbert #include "net/announce.h"
3217ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h"
33e688df6bSMarkus Armbruster #include "qapi/error.h"
349af23989SMarkus Armbruster #include "qapi/qapi-events-net.h"
35a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h"
369711cd0dSJens Freimann #include "qapi/qapi-types-migration.h"
379711cd0dSJens Freimann #include "qapi/qapi-events-migration.h"
381399c60dSRusty Russell #include "hw/virtio/virtio-access.h"
39f8d806c9SJuan Quintela #include "migration/misc.h"
409473939eSJason Baron #include "standard-headers/linux/ethtool.h"
412f780b6aSMarkus Armbruster #include "sysemu/sysemu.h"
429d8c6a25SDr. David Alan Gilbert #include "trace.h"
439711cd0dSJens Freimann #include "monitor/qdev.h"
449711cd0dSJens Freimann #include "hw/pci/pci.h"
454474e37aSYuri Benditovich #include "net_rx_pkt.h"
46108a6481SCindy Lu #include "hw/virtio/vhost.h"
476e790746SPaolo Bonzini 
#define VIRTIO_NET_VM_VERSION               11

#define MAC_TABLE_ENTRIES                   64
#define MAX_VLAN                            (1 << 12)   /* Per 802.1Q definition */

/* Default ring sizes (256 is the previously fixed value). */
#define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE    256
#define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE    256

/*
 * For now only larger queues are allowed, so the minimum equals the
 * default; with virtio-1 the guest can downsize.
 */
#define VIRTIO_NET_RX_QUEUE_MIN_SIZE        VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
#define VIRTIO_NET_TX_QUEUE_MIN_SIZE        VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE

/* IPv4 source address + destination address, in bytes. */
#define VIRTIO_NET_IP4_ADDR_SIZE            8

#define VIRTIO_NET_TCP_FLAG                 0x3F
#define VIRTIO_NET_TCP_HDR_LENGTH           0xF000

/* IPv4 maximum payload: the length field in the header is 16 bits wide. */
#define VIRTIO_NET_MAX_IP4_PAYLOAD          (65535 - sizeof(struct ip_header))
#define VIRTIO_NET_MAX_TCP_PAYLOAD          65535

/* Value of the IPv4 header-length field when the header has no options. */
#define VIRTIO_NET_IP4_HEADER_LENGTH        5

/* IPv6 source address + destination address, in bytes. */
#define VIRTIO_NET_IP6_ADDR_SIZE            32
#define VIRTIO_NET_MAX_IP6_PAYLOAD          VIRTIO_NET_MAX_TCP_PAYLOAD

/*
 * Interval of the timer that purges coalesced packets.  This value has a
 * large impact on performance and should be tuned carefully: '300000'
 * (300us) is the recommended value to pass the WHQL test, while '50000'
 * can gain 2x netperf throughput with tso/gso/gro 'off'.
 */
#define VIRTIO_NET_RSC_DEFAULT_INTERVAL     300000

/* Union of every RSS hash type reported as supported in the config space. */
#define VIRTIO_NET_RSS_SUPPORTED_HASHES     \
    (VIRTIO_NET_RSS_HASH_TYPE_IPv4   |      \
     VIRTIO_NET_RSS_HASH_TYPE_TCPv4  |      \
     VIRTIO_NET_RSS_HASH_TYPE_UDPv4  |      \
     VIRTIO_NET_RSS_HASH_TYPE_IPv6   |      \
     VIRTIO_NET_RSS_HASH_TYPE_TCPv6  |      \
     VIRTIO_NET_RSS_HASH_TYPE_UDPv6  |      \
     VIRTIO_NET_RSS_HASH_TYPE_IP_EX  |      \
     VIRTIO_NET_RSS_HASH_TYPE_TCP_EX |      \
     VIRTIO_NET_RSS_HASH_TYPE_UDP_EX)

9159079029SYuri Benditovich 
926e790746SPaolo Bonzini static VirtIOFeature feature_sizes[] = {
93127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MAC,
945d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mac)},
95127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_STATUS,
965d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, status)},
97127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MQ,
985d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
99127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MTU,
1005d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mtu)},
1019473939eSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX,
1025d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, duplex)},
103e22f0603SYuri Benditovich     {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT),
10459079029SYuri Benditovich      .end = endof(struct virtio_net_config, supported_hash_types)},
1056e790746SPaolo Bonzini     {}
1066e790746SPaolo Bonzini };
1076e790746SPaolo Bonzini 
1086e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
1096e790746SPaolo Bonzini {
1106e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1116e790746SPaolo Bonzini 
1126e790746SPaolo Bonzini     return &n->vqs[nc->queue_index];
1136e790746SPaolo Bonzini }
1146e790746SPaolo Bonzini 
/*
 * Convert a virtqueue index into a queue index by halving it
 * (integer division, truncating towards zero).
 */
static int vq2q(int queue_index)
{
    const int vqs_per_queue = 2;
    int pair = queue_index / vqs_per_queue;

    return pair;
}
1196e790746SPaolo Bonzini 
/* TODO
 * - we could suppress RX interrupt if we were so inclined.
 */
1236e790746SPaolo Bonzini 
1246e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
1256e790746SPaolo Bonzini {
12617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1276e790746SPaolo Bonzini     struct virtio_net_config netcfg;
128c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
1296e790746SPaolo Bonzini 
130108a6481SCindy Lu     int ret = 0;
131108a6481SCindy Lu     memset(&netcfg, 0 , sizeof(struct virtio_net_config));
1321399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.status, n->status);
1331399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queues);
134a93e599dSMaxime Coquelin     virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu);
1356e790746SPaolo Bonzini     memcpy(netcfg.mac, n->mac, ETH_ALEN);
1369473939eSJason Baron     virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed);
1379473939eSJason Baron     netcfg.duplex = n->net_conf.duplex;
13859079029SYuri Benditovich     netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE;
13959079029SYuri Benditovich     virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length,
140e22f0603SYuri Benditovich                  virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ?
141e22f0603SYuri Benditovich                  VIRTIO_NET_RSS_MAX_TABLE_LEN : 1);
14259079029SYuri Benditovich     virtio_stl_p(vdev, &netcfg.supported_hash_types,
14359079029SYuri Benditovich                  VIRTIO_NET_RSS_SUPPORTED_HASHES);
1446e790746SPaolo Bonzini     memcpy(config, &netcfg, n->config_size);
145108a6481SCindy Lu 
146c546ecf2SJason Wang     /*
147c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
148c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
149c546ecf2SJason Wang      */
150c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
151108a6481SCindy Lu         ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg,
152108a6481SCindy Lu                                    n->config_size);
153108a6481SCindy Lu         if (ret != -1) {
154108a6481SCindy Lu             memcpy(config, &netcfg, n->config_size);
155108a6481SCindy Lu         }
156108a6481SCindy Lu     }
1576e790746SPaolo Bonzini }
1586e790746SPaolo Bonzini 
1596e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
1606e790746SPaolo Bonzini {
16117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1626e790746SPaolo Bonzini     struct virtio_net_config netcfg = {};
163c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
1646e790746SPaolo Bonzini 
1656e790746SPaolo Bonzini     memcpy(&netcfg, config, n->config_size);
1666e790746SPaolo Bonzini 
16795129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) &&
16895129d6fSCornelia Huck         !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) &&
1696e790746SPaolo Bonzini         memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
1706e790746SPaolo Bonzini         memcpy(n->mac, netcfg.mac, ETH_ALEN);
1716e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1726e790746SPaolo Bonzini     }
173108a6481SCindy Lu 
174c546ecf2SJason Wang     /*
175c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
176c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
177c546ecf2SJason Wang      */
178c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
179c546ecf2SJason Wang         vhost_net_set_config(get_vhost_net(nc->peer),
180c546ecf2SJason Wang                              (uint8_t *)&netcfg, 0, n->config_size,
181108a6481SCindy Lu                              VHOST_SET_CONFIG_TYPE_MASTER);
182108a6481SCindy Lu       }
1836e790746SPaolo Bonzini }
1846e790746SPaolo Bonzini 
1856e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status)
1866e790746SPaolo Bonzini {
18717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1886e790746SPaolo Bonzini     return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
18917a0ca55SKONRAD Frederic         (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
1906e790746SPaolo Bonzini }
1916e790746SPaolo Bonzini 
192b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net)
193b2c929f0SDr. David Alan Gilbert {
194b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(net);
195b2c929f0SDr. David Alan Gilbert     trace_virtio_net_announce_notify();
196b2c929f0SDr. David Alan Gilbert 
197b2c929f0SDr. David Alan Gilbert     net->status |= VIRTIO_NET_S_ANNOUNCE;
198b2c929f0SDr. David Alan Gilbert     virtio_notify_config(vdev);
199b2c929f0SDr. David Alan Gilbert }
200b2c929f0SDr. David Alan Gilbert 
201f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque)
202f57fcf70SJason Wang {
203f57fcf70SJason Wang     VirtIONet *n = opaque;
2049d8c6a25SDr. David Alan Gilbert     trace_virtio_net_announce_timer(n->announce_timer.round);
205f57fcf70SJason Wang 
2069d8c6a25SDr. David Alan Gilbert     n->announce_timer.round--;
207b2c929f0SDr. David Alan Gilbert     virtio_net_announce_notify(n);
208b2c929f0SDr. David Alan Gilbert }
209b2c929f0SDr. David Alan Gilbert 
210b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc)
211b2c929f0SDr. David Alan Gilbert {
212b2c929f0SDr. David Alan Gilbert     VirtIONet *n = qemu_get_nic_opaque(nc);
213b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
214b2c929f0SDr. David Alan Gilbert 
215b2c929f0SDr. David Alan Gilbert     /*
216b2c929f0SDr. David Alan Gilbert      * Make sure the virtio migration announcement timer isn't running
217b2c929f0SDr. David Alan Gilbert      * If it is, let it trigger announcement so that we do not cause
218b2c929f0SDr. David Alan Gilbert      * confusion.
219b2c929f0SDr. David Alan Gilbert      */
220b2c929f0SDr. David Alan Gilbert     if (n->announce_timer.round) {
221b2c929f0SDr. David Alan Gilbert         return;
222b2c929f0SDr. David Alan Gilbert     }
223b2c929f0SDr. David Alan Gilbert 
224b2c929f0SDr. David Alan Gilbert     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
225b2c929f0SDr. David Alan Gilbert         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
226b2c929f0SDr. David Alan Gilbert             virtio_net_announce_notify(n);
227b2c929f0SDr. David Alan Gilbert     }
228f57fcf70SJason Wang }
229f57fcf70SJason Wang 
2306e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
2316e790746SPaolo Bonzini {
23217a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2336e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
2346e790746SPaolo Bonzini     int queues = n->multiqueue ? n->max_queues : 1;
2356e790746SPaolo Bonzini 
236ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
2376e790746SPaolo Bonzini         return;
2386e790746SPaolo Bonzini     }
2396e790746SPaolo Bonzini 
2408c1ac475SRadim Krčmář     if ((virtio_net_started(n, status) && !nc->peer->link_down) ==
2418c1ac475SRadim Krčmář         !!n->vhost_started) {
2426e790746SPaolo Bonzini         return;
2436e790746SPaolo Bonzini     }
2446e790746SPaolo Bonzini     if (!n->vhost_started) {
245086abc1cSMichael S. Tsirkin         int r, i;
246086abc1cSMichael S. Tsirkin 
2471bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
2481bfa316cSGreg Kurz             error_report("backend does not support %s vnet headers; "
2491bfa316cSGreg Kurz                          "falling back on userspace virtio",
2501bfa316cSGreg Kurz                          virtio_is_big_endian(vdev) ? "BE" : "LE");
2511bfa316cSGreg Kurz             return;
2521bfa316cSGreg Kurz         }
2531bfa316cSGreg Kurz 
254086abc1cSMichael S. Tsirkin         /* Any packets outstanding? Purge them to avoid touching rings
255086abc1cSMichael S. Tsirkin          * when vhost is running.
256086abc1cSMichael S. Tsirkin          */
257086abc1cSMichael S. Tsirkin         for (i = 0;  i < queues; i++) {
258086abc1cSMichael S. Tsirkin             NetClientState *qnc = qemu_get_subqueue(n->nic, i);
259086abc1cSMichael S. Tsirkin 
260086abc1cSMichael S. Tsirkin             /* Purge both directions: TX and RX. */
261086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->peer->incoming_queue, qnc);
262086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->incoming_queue, qnc->peer);
263086abc1cSMichael S. Tsirkin         }
264086abc1cSMichael S. Tsirkin 
265a93e599dSMaxime Coquelin         if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) {
266a93e599dSMaxime Coquelin             r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu);
267a93e599dSMaxime Coquelin             if (r < 0) {
268a93e599dSMaxime Coquelin                 error_report("%uBytes MTU not supported by the backend",
269a93e599dSMaxime Coquelin                              n->net_conf.mtu);
270a93e599dSMaxime Coquelin 
271a93e599dSMaxime Coquelin                 return;
272a93e599dSMaxime Coquelin             }
273a93e599dSMaxime Coquelin         }
274a93e599dSMaxime Coquelin 
2756e790746SPaolo Bonzini         n->vhost_started = 1;
27617a0ca55SKONRAD Frederic         r = vhost_net_start(vdev, n->nic->ncs, queues);
2776e790746SPaolo Bonzini         if (r < 0) {
2786e790746SPaolo Bonzini             error_report("unable to start vhost net: %d: "
2796e790746SPaolo Bonzini                          "falling back on userspace virtio", -r);
2806e790746SPaolo Bonzini             n->vhost_started = 0;
2816e790746SPaolo Bonzini         }
2826e790746SPaolo Bonzini     } else {
28317a0ca55SKONRAD Frederic         vhost_net_stop(vdev, n->nic->ncs, queues);
2846e790746SPaolo Bonzini         n->vhost_started = 0;
2856e790746SPaolo Bonzini     }
2866e790746SPaolo Bonzini }
2876e790746SPaolo Bonzini 
2881bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev,
2891bfa316cSGreg Kurz                                           NetClientState *peer,
2901bfa316cSGreg Kurz                                           bool enable)
2911bfa316cSGreg Kurz {
2921bfa316cSGreg Kurz     if (virtio_is_big_endian(vdev)) {
2931bfa316cSGreg Kurz         return qemu_set_vnet_be(peer, enable);
2941bfa316cSGreg Kurz     } else {
2951bfa316cSGreg Kurz         return qemu_set_vnet_le(peer, enable);
2961bfa316cSGreg Kurz     }
2971bfa316cSGreg Kurz }
2981bfa316cSGreg Kurz 
2991bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs,
3001bfa316cSGreg Kurz                                        int queues, bool enable)
3011bfa316cSGreg Kurz {
3021bfa316cSGreg Kurz     int i;
3031bfa316cSGreg Kurz 
3041bfa316cSGreg Kurz     for (i = 0; i < queues; i++) {
3051bfa316cSGreg Kurz         if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 &&
3061bfa316cSGreg Kurz             enable) {
3071bfa316cSGreg Kurz             while (--i >= 0) {
3081bfa316cSGreg Kurz                 virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false);
3091bfa316cSGreg Kurz             }
3101bfa316cSGreg Kurz 
3111bfa316cSGreg Kurz             return true;
3121bfa316cSGreg Kurz         }
3131bfa316cSGreg Kurz     }
3141bfa316cSGreg Kurz 
3151bfa316cSGreg Kurz     return false;
3161bfa316cSGreg Kurz }
3171bfa316cSGreg Kurz 
3181bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status)
3191bfa316cSGreg Kurz {
3201bfa316cSGreg Kurz     VirtIODevice *vdev = VIRTIO_DEVICE(n);
3211bfa316cSGreg Kurz     int queues = n->multiqueue ? n->max_queues : 1;
3221bfa316cSGreg Kurz 
3231bfa316cSGreg Kurz     if (virtio_net_started(n, status)) {
3241bfa316cSGreg Kurz         /* Before using the device, we tell the network backend about the
3251bfa316cSGreg Kurz          * endianness to use when parsing vnet headers. If the backend
3261bfa316cSGreg Kurz          * can't do it, we fallback onto fixing the headers in the core
3271bfa316cSGreg Kurz          * virtio-net code.
3281bfa316cSGreg Kurz          */
3291bfa316cSGreg Kurz         n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs,
3301bfa316cSGreg Kurz                                                             queues, true);
3311bfa316cSGreg Kurz     } else if (virtio_net_started(n, vdev->status)) {
3321bfa316cSGreg Kurz         /* After using the device, we need to reset the network backend to
3331bfa316cSGreg Kurz          * the default (guest native endianness), otherwise the guest may
3341bfa316cSGreg Kurz          * lose network connectivity if it is rebooted into a different
3351bfa316cSGreg Kurz          * endianness.
3361bfa316cSGreg Kurz          */
3371bfa316cSGreg Kurz         virtio_net_set_vnet_endian(vdev, n->nic->ncs, queues, false);
3381bfa316cSGreg Kurz     }
3391bfa316cSGreg Kurz }
3401bfa316cSGreg Kurz 
341283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq)
342283e2c2aSYuri Benditovich {
343283e2c2aSYuri Benditovich     unsigned int dropped = virtqueue_drop_all(vq);
344283e2c2aSYuri Benditovich     if (dropped) {
345283e2c2aSYuri Benditovich         virtio_notify(vdev, vq);
346283e2c2aSYuri Benditovich     }
347283e2c2aSYuri Benditovich }
348283e2c2aSYuri Benditovich 
3496e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
3506e790746SPaolo Bonzini {
35117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
3526e790746SPaolo Bonzini     VirtIONetQueue *q;
3536e790746SPaolo Bonzini     int i;
3546e790746SPaolo Bonzini     uint8_t queue_status;
3556e790746SPaolo Bonzini 
3561bfa316cSGreg Kurz     virtio_net_vnet_endian_status(n, status);
3576e790746SPaolo Bonzini     virtio_net_vhost_status(n, status);
3586e790746SPaolo Bonzini 
3596e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
36038705bb5SFam Zheng         NetClientState *ncs = qemu_get_subqueue(n->nic, i);
36138705bb5SFam Zheng         bool queue_started;
3626e790746SPaolo Bonzini         q = &n->vqs[i];
3636e790746SPaolo Bonzini 
3646e790746SPaolo Bonzini         if ((!n->multiqueue && i != 0) || i >= n->curr_queues) {
3656e790746SPaolo Bonzini             queue_status = 0;
3666e790746SPaolo Bonzini         } else {
3676e790746SPaolo Bonzini             queue_status = status;
3686e790746SPaolo Bonzini         }
36938705bb5SFam Zheng         queue_started =
37038705bb5SFam Zheng             virtio_net_started(n, queue_status) && !n->vhost_started;
37138705bb5SFam Zheng 
37238705bb5SFam Zheng         if (queue_started) {
37338705bb5SFam Zheng             qemu_flush_queued_packets(ncs);
37438705bb5SFam Zheng         }
3756e790746SPaolo Bonzini 
3766e790746SPaolo Bonzini         if (!q->tx_waiting) {
3776e790746SPaolo Bonzini             continue;
3786e790746SPaolo Bonzini         }
3796e790746SPaolo Bonzini 
38038705bb5SFam Zheng         if (queue_started) {
3816e790746SPaolo Bonzini             if (q->tx_timer) {
382bc72ad67SAlex Bligh                 timer_mod(q->tx_timer,
383bc72ad67SAlex Bligh                                qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
3846e790746SPaolo Bonzini             } else {
3856e790746SPaolo Bonzini                 qemu_bh_schedule(q->tx_bh);
3866e790746SPaolo Bonzini             }
3876e790746SPaolo Bonzini         } else {
3886e790746SPaolo Bonzini             if (q->tx_timer) {
389bc72ad67SAlex Bligh                 timer_del(q->tx_timer);
3906e790746SPaolo Bonzini             } else {
3916e790746SPaolo Bonzini                 qemu_bh_cancel(q->tx_bh);
3926e790746SPaolo Bonzini             }
393283e2c2aSYuri Benditovich             if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 &&
39470e53e6eSJason Wang                 (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) &&
39570e53e6eSJason Wang                 vdev->vm_running) {
396283e2c2aSYuri Benditovich                 /* if tx is waiting we are likely have some packets in tx queue
397283e2c2aSYuri Benditovich                  * and disabled notification */
398283e2c2aSYuri Benditovich                 q->tx_waiting = 0;
399283e2c2aSYuri Benditovich                 virtio_queue_set_notification(q->tx_vq, 1);
400283e2c2aSYuri Benditovich                 virtio_net_drop_tx_queue_data(vdev, q->tx_vq);
401283e2c2aSYuri Benditovich             }
4026e790746SPaolo Bonzini         }
4036e790746SPaolo Bonzini     }
4046e790746SPaolo Bonzini }
4056e790746SPaolo Bonzini 
4066e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc)
4076e790746SPaolo Bonzini {
4086e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
40917a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
4106e790746SPaolo Bonzini     uint16_t old_status = n->status;
4116e790746SPaolo Bonzini 
4126e790746SPaolo Bonzini     if (nc->link_down)
4136e790746SPaolo Bonzini         n->status &= ~VIRTIO_NET_S_LINK_UP;
4146e790746SPaolo Bonzini     else
4156e790746SPaolo Bonzini         n->status |= VIRTIO_NET_S_LINK_UP;
4166e790746SPaolo Bonzini 
4176e790746SPaolo Bonzini     if (n->status != old_status)
41817a0ca55SKONRAD Frederic         virtio_notify_config(vdev);
4196e790746SPaolo Bonzini 
42017a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
4216e790746SPaolo Bonzini }
4226e790746SPaolo Bonzini 
423b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc)
424b1be4280SAmos Kong {
425b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
426b1be4280SAmos Kong 
427b1be4280SAmos Kong     if (nc->rxfilter_notify_enabled) {
428ddfb0baaSMarkus Armbruster         char *path = object_get_canonical_path(OBJECT(n->qdev));
42906150279SWenchao Xia         qapi_event_send_nic_rx_filter_changed(!!n->netclient_name,
4303ab72385SPeter Xu                                               n->netclient_name, path);
43196e35046SAmos Kong         g_free(path);
432b1be4280SAmos Kong 
433b1be4280SAmos Kong         /* disable event notification to avoid events flooding */
434b1be4280SAmos Kong         nc->rxfilter_notify_enabled = 0;
435b1be4280SAmos Kong     }
436b1be4280SAmos Kong }
437b1be4280SAmos Kong 
438f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n)
439f7bc8ef8SAmos Kong {
44054aa3de7SEric Blake     intList *list;
441f7bc8ef8SAmos Kong     int i, j;
442f7bc8ef8SAmos Kong 
443f7bc8ef8SAmos Kong     list = NULL;
444f7bc8ef8SAmos Kong     for (i = 0; i < MAX_VLAN >> 5; i++) {
445f7bc8ef8SAmos Kong         for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
446f7bc8ef8SAmos Kong             if (n->vlans[i] & (1U << j)) {
44754aa3de7SEric Blake                 QAPI_LIST_PREPEND(list, (i << 5) + j);
448f7bc8ef8SAmos Kong             }
449f7bc8ef8SAmos Kong         }
450f7bc8ef8SAmos Kong     }
451f7bc8ef8SAmos Kong 
452f7bc8ef8SAmos Kong     return list;
453f7bc8ef8SAmos Kong }
454f7bc8ef8SAmos Kong 
455b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
456b1be4280SAmos Kong {
457b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
458f7bc8ef8SAmos Kong     VirtIODevice *vdev = VIRTIO_DEVICE(n);
459b1be4280SAmos Kong     RxFilterInfo *info;
46054aa3de7SEric Blake     strList *str_list;
461f7bc8ef8SAmos Kong     int i;
462b1be4280SAmos Kong 
463b1be4280SAmos Kong     info = g_malloc0(sizeof(*info));
464b1be4280SAmos Kong     info->name = g_strdup(nc->name);
465b1be4280SAmos Kong     info->promiscuous = n->promisc;
466b1be4280SAmos Kong 
467b1be4280SAmos Kong     if (n->nouni) {
468b1be4280SAmos Kong         info->unicast = RX_STATE_NONE;
469b1be4280SAmos Kong     } else if (n->alluni) {
470b1be4280SAmos Kong         info->unicast = RX_STATE_ALL;
471b1be4280SAmos Kong     } else {
472b1be4280SAmos Kong         info->unicast = RX_STATE_NORMAL;
473b1be4280SAmos Kong     }
474b1be4280SAmos Kong 
475b1be4280SAmos Kong     if (n->nomulti) {
476b1be4280SAmos Kong         info->multicast = RX_STATE_NONE;
477b1be4280SAmos Kong     } else if (n->allmulti) {
478b1be4280SAmos Kong         info->multicast = RX_STATE_ALL;
479b1be4280SAmos Kong     } else {
480b1be4280SAmos Kong         info->multicast = RX_STATE_NORMAL;
481b1be4280SAmos Kong     }
482b1be4280SAmos Kong 
483b1be4280SAmos Kong     info->broadcast_allowed = n->nobcast;
484b1be4280SAmos Kong     info->multicast_overflow = n->mac_table.multi_overflow;
485b1be4280SAmos Kong     info->unicast_overflow = n->mac_table.uni_overflow;
486b1be4280SAmos Kong 
487b0575ba4SScott Feldman     info->main_mac = qemu_mac_strdup_printf(n->mac);
488b1be4280SAmos Kong 
489b1be4280SAmos Kong     str_list = NULL;
490b1be4280SAmos Kong     for (i = 0; i < n->mac_table.first_multi; i++) {
49154aa3de7SEric Blake         QAPI_LIST_PREPEND(str_list,
49254aa3de7SEric Blake                       qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN));
493b1be4280SAmos Kong     }
494b1be4280SAmos Kong     info->unicast_table = str_list;
495b1be4280SAmos Kong 
496b1be4280SAmos Kong     str_list = NULL;
497b1be4280SAmos Kong     for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
49854aa3de7SEric Blake         QAPI_LIST_PREPEND(str_list,
49954aa3de7SEric Blake                       qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN));
500b1be4280SAmos Kong     }
501b1be4280SAmos Kong     info->multicast_table = str_list;
502f7bc8ef8SAmos Kong     info->vlan_table = get_vlan_table(n);
503b1be4280SAmos Kong 
50495129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) {
505f7bc8ef8SAmos Kong         info->vlan = RX_STATE_ALL;
506f7bc8ef8SAmos Kong     } else if (!info->vlan_table) {
507f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NONE;
508f7bc8ef8SAmos Kong     } else {
509f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NORMAL;
510b1be4280SAmos Kong     }
511b1be4280SAmos Kong 
512b1be4280SAmos Kong     /* enable event notification after query */
513b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
514b1be4280SAmos Kong 
515b1be4280SAmos Kong     return info;
516b1be4280SAmos Kong }
517b1be4280SAmos Kong 
5186e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev)
5196e790746SPaolo Bonzini {
52017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
52194b52958SGreg Kurz     int i;
5226e790746SPaolo Bonzini 
5236e790746SPaolo Bonzini     /* Reset back to compatibility mode */
5246e790746SPaolo Bonzini     n->promisc = 1;
5256e790746SPaolo Bonzini     n->allmulti = 0;
5266e790746SPaolo Bonzini     n->alluni = 0;
5276e790746SPaolo Bonzini     n->nomulti = 0;
5286e790746SPaolo Bonzini     n->nouni = 0;
5296e790746SPaolo Bonzini     n->nobcast = 0;
5306e790746SPaolo Bonzini     /* multiqueue is disabled by default */
5316e790746SPaolo Bonzini     n->curr_queues = 1;
5329d8c6a25SDr. David Alan Gilbert     timer_del(n->announce_timer.tm);
5339d8c6a25SDr. David Alan Gilbert     n->announce_timer.round = 0;
534f57fcf70SJason Wang     n->status &= ~VIRTIO_NET_S_ANNOUNCE;
5356e790746SPaolo Bonzini 
5366e790746SPaolo Bonzini     /* Flush any MAC and VLAN filter table state */
5376e790746SPaolo Bonzini     n->mac_table.in_use = 0;
5386e790746SPaolo Bonzini     n->mac_table.first_multi = 0;
5396e790746SPaolo Bonzini     n->mac_table.multi_overflow = 0;
5406e790746SPaolo Bonzini     n->mac_table.uni_overflow = 0;
5416e790746SPaolo Bonzini     memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
5426e790746SPaolo Bonzini     memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
543702d66a8SMichael S. Tsirkin     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
5446e790746SPaolo Bonzini     memset(n->vlans, 0, MAX_VLAN >> 3);
54594b52958SGreg Kurz 
54694b52958SGreg Kurz     /* Flush any async TX */
54794b52958SGreg Kurz     for (i = 0;  i < n->max_queues; i++) {
54894b52958SGreg Kurz         NetClientState *nc = qemu_get_subqueue(n->nic, i);
54994b52958SGreg Kurz 
55094b52958SGreg Kurz         if (nc->peer) {
55194b52958SGreg Kurz             qemu_flush_or_purge_queued_packets(nc->peer, true);
55294b52958SGreg Kurz             assert(!virtio_net_get_subqueue(nc)->async_tx.elem);
55394b52958SGreg Kurz         }
55494b52958SGreg Kurz     }
5556e790746SPaolo Bonzini }
5566e790746SPaolo Bonzini 
5576e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n)
5586e790746SPaolo Bonzini {
5596e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
5606e790746SPaolo Bonzini     if (!nc->peer) {
5616e790746SPaolo Bonzini         return;
5626e790746SPaolo Bonzini     }
5636e790746SPaolo Bonzini 
564d6085e3aSStefan Hajnoczi     n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
5656e790746SPaolo Bonzini }
5666e790746SPaolo Bonzini 
5676e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n)
5686e790746SPaolo Bonzini {
5696e790746SPaolo Bonzini     return n->has_vnet_hdr;
5706e790746SPaolo Bonzini }
5716e790746SPaolo Bonzini 
5726e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n)
5736e790746SPaolo Bonzini {
5746e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n))
5756e790746SPaolo Bonzini         return 0;
5766e790746SPaolo Bonzini 
577d6085e3aSStefan Hajnoczi     n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
5786e790746SPaolo Bonzini 
5796e790746SPaolo Bonzini     return n->has_ufo;
5806e790746SPaolo Bonzini }
5816e790746SPaolo Bonzini 
582bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs,
583e22f0603SYuri Benditovich                                        int version_1, int hash_report)
5846e790746SPaolo Bonzini {
5856e790746SPaolo Bonzini     int i;
5866e790746SPaolo Bonzini     NetClientState *nc;
5876e790746SPaolo Bonzini 
5886e790746SPaolo Bonzini     n->mergeable_rx_bufs = mergeable_rx_bufs;
5896e790746SPaolo Bonzini 
590bb9d17f8SCornelia Huck     if (version_1) {
591e22f0603SYuri Benditovich         n->guest_hdr_len = hash_report ?
592e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_v1_hash) :
593e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_mrg_rxbuf);
594e22f0603SYuri Benditovich         n->rss_data.populate_hash = !!hash_report;
595bb9d17f8SCornelia Huck     } else {
5966e790746SPaolo Bonzini         n->guest_hdr_len = n->mergeable_rx_bufs ?
597bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr_mrg_rxbuf) :
598bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr);
599bb9d17f8SCornelia Huck     }
6006e790746SPaolo Bonzini 
6016e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
6026e790746SPaolo Bonzini         nc = qemu_get_subqueue(n->nic, i);
6036e790746SPaolo Bonzini 
6046e790746SPaolo Bonzini         if (peer_has_vnet_hdr(n) &&
605d6085e3aSStefan Hajnoczi             qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
606d6085e3aSStefan Hajnoczi             qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
6076e790746SPaolo Bonzini             n->host_hdr_len = n->guest_hdr_len;
6086e790746SPaolo Bonzini         }
6096e790746SPaolo Bonzini     }
6106e790746SPaolo Bonzini }
6116e790746SPaolo Bonzini 
6122eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n)
6132eef278bSMichael S. Tsirkin {
6142eef278bSMichael S. Tsirkin     NetClientState *peer = n->nic_conf.peers.ncs[0];
6152eef278bSMichael S. Tsirkin 
6162eef278bSMichael S. Tsirkin     /*
6172eef278bSMichael S. Tsirkin      * Backends other than vhost-user don't support max queue size.
6182eef278bSMichael S. Tsirkin      */
6192eef278bSMichael S. Tsirkin     if (!peer) {
6202eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6212eef278bSMichael S. Tsirkin     }
6222eef278bSMichael S. Tsirkin 
6232eef278bSMichael S. Tsirkin     if (peer->info->type != NET_CLIENT_DRIVER_VHOST_USER) {
6242eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6252eef278bSMichael S. Tsirkin     }
6262eef278bSMichael S. Tsirkin 
6272eef278bSMichael S. Tsirkin     return VIRTQUEUE_MAX_SIZE;
6282eef278bSMichael S. Tsirkin }
6292eef278bSMichael S. Tsirkin 
6306e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index)
6316e790746SPaolo Bonzini {
6326e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6336e790746SPaolo Bonzini 
6346e790746SPaolo Bonzini     if (!nc->peer) {
6356e790746SPaolo Bonzini         return 0;
6366e790746SPaolo Bonzini     }
6376e790746SPaolo Bonzini 
638f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6397263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 1);
6407263a0adSChangchun Ouyang     }
6417263a0adSChangchun Ouyang 
642f394b2e2SEric Blake     if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
6436e790746SPaolo Bonzini         return 0;
6446e790746SPaolo Bonzini     }
6456e790746SPaolo Bonzini 
6461074b879SJason Wang     if (n->max_queues == 1) {
6471074b879SJason Wang         return 0;
6481074b879SJason Wang     }
6491074b879SJason Wang 
6506e790746SPaolo Bonzini     return tap_enable(nc->peer);
6516e790746SPaolo Bonzini }
6526e790746SPaolo Bonzini 
6536e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index)
6546e790746SPaolo Bonzini {
6556e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6566e790746SPaolo Bonzini 
6576e790746SPaolo Bonzini     if (!nc->peer) {
6586e790746SPaolo Bonzini         return 0;
6596e790746SPaolo Bonzini     }
6606e790746SPaolo Bonzini 
661f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6627263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 0);
6637263a0adSChangchun Ouyang     }
6647263a0adSChangchun Ouyang 
665f394b2e2SEric Blake     if (nc->peer->info->type !=  NET_CLIENT_DRIVER_TAP) {
6666e790746SPaolo Bonzini         return 0;
6676e790746SPaolo Bonzini     }
6686e790746SPaolo Bonzini 
6696e790746SPaolo Bonzini     return tap_disable(nc->peer);
6706e790746SPaolo Bonzini }
6716e790746SPaolo Bonzini 
6726e790746SPaolo Bonzini static void virtio_net_set_queues(VirtIONet *n)
6736e790746SPaolo Bonzini {
6746e790746SPaolo Bonzini     int i;
675ddfa83eaSJoel Stanley     int r;
6766e790746SPaolo Bonzini 
67768b5f314SYuri Benditovich     if (n->nic->peer_deleted) {
67868b5f314SYuri Benditovich         return;
67968b5f314SYuri Benditovich     }
68068b5f314SYuri Benditovich 
6816e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
6826e790746SPaolo Bonzini         if (i < n->curr_queues) {
683ddfa83eaSJoel Stanley             r = peer_attach(n, i);
684ddfa83eaSJoel Stanley             assert(!r);
6856e790746SPaolo Bonzini         } else {
686ddfa83eaSJoel Stanley             r = peer_detach(n, i);
687ddfa83eaSJoel Stanley             assert(!r);
6886e790746SPaolo Bonzini         }
6896e790746SPaolo Bonzini     }
6906e790746SPaolo Bonzini }
6916e790746SPaolo Bonzini 
692ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
6936e790746SPaolo Bonzini 
6949d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features,
6959d5b731dSJason Wang                                         Error **errp)
6966e790746SPaolo Bonzini {
69717a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
6986e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
6996e790746SPaolo Bonzini 
700da3e8a23SShannon Zhao     /* Firstly sync all virtio-net possible supported features */
701da3e8a23SShannon Zhao     features |= n->host_features;
702da3e8a23SShannon Zhao 
7030cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7046e790746SPaolo Bonzini 
7056e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n)) {
7060cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_CSUM);
7070cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7080cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7090cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN);
7106e790746SPaolo Bonzini 
7110cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM);
7120cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4);
7130cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6);
7140cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN);
715e22f0603SYuri Benditovich 
716e22f0603SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
7176e790746SPaolo Bonzini     }
7186e790746SPaolo Bonzini 
7196e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
7200cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO);
7210cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO);
7226e790746SPaolo Bonzini     }
7236e790746SPaolo Bonzini 
724ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
7256e790746SPaolo Bonzini         return features;
7266e790746SPaolo Bonzini     }
7272974e916SYuri Benditovich 
72859079029SYuri Benditovich     virtio_clear_feature(&features, VIRTIO_NET_F_RSS);
729e22f0603SYuri Benditovich     virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
73075ebec11SMaxime Coquelin     features = vhost_net_get_features(get_vhost_net(nc->peer), features);
73175ebec11SMaxime Coquelin     vdev->backend_features = features;
73275ebec11SMaxime Coquelin 
73375ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
73475ebec11SMaxime Coquelin             (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) {
73575ebec11SMaxime Coquelin         features |= (1ULL << VIRTIO_NET_F_MTU);
73675ebec11SMaxime Coquelin     }
73775ebec11SMaxime Coquelin 
73875ebec11SMaxime Coquelin     return features;
7396e790746SPaolo Bonzini }
7406e790746SPaolo Bonzini 
741019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev)
7426e790746SPaolo Bonzini {
743019a3edbSGerd Hoffmann     uint64_t features = 0;
7446e790746SPaolo Bonzini 
7456e790746SPaolo Bonzini     /* Linux kernel 2.6.25.  It understood MAC (as everyone must),
7466e790746SPaolo Bonzini      * but also these: */
7470cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7480cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_CSUM);
7490cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7500cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7510cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN);
7526e790746SPaolo Bonzini 
7536e790746SPaolo Bonzini     return features;
7546e790746SPaolo Bonzini }
7556e790746SPaolo Bonzini 
756644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n)
757644c9858SDmitry Fleytman {
758ad37bb3bSStefan Hajnoczi     qemu_set_offload(qemu_get_queue(n->nic)->peer,
759644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
760644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
761644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
762644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
763644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
764644c9858SDmitry Fleytman }
765644c9858SDmitry Fleytman 
766644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
767644c9858SDmitry Fleytman {
768644c9858SDmitry Fleytman     static const uint64_t guest_offloads_mask =
769644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
770644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
771644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
772644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_ECN)  |
773644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_UFO);
774644c9858SDmitry Fleytman 
775644c9858SDmitry Fleytman     return guest_offloads_mask & features;
776644c9858SDmitry Fleytman }
777644c9858SDmitry Fleytman 
778644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
779644c9858SDmitry Fleytman {
780644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
781644c9858SDmitry Fleytman     return virtio_net_guest_offloads_by_features(vdev->guest_features);
782644c9858SDmitry Fleytman }
783644c9858SDmitry Fleytman 
784f5e1847bSJuan Quintela typedef struct {
785f5e1847bSJuan Quintela     VirtIONet *n;
786f5e1847bSJuan Quintela     char *id;
787f5e1847bSJuan Quintela } FailoverId;
788f5e1847bSJuan Quintela 
789f5e1847bSJuan Quintela /**
790f5e1847bSJuan Quintela  * Set the id of the failover primary device
791f5e1847bSJuan Quintela  *
792f5e1847bSJuan Quintela  * @opaque: FailoverId to setup
793f5e1847bSJuan Quintela  * @opts: opts for device we are handling
794f5e1847bSJuan Quintela  * @errp: returns an error if this function fails
795f5e1847bSJuan Quintela  */
796f5e1847bSJuan Quintela static int failover_set_primary(void *opaque, QemuOpts *opts, Error **errp)
797f5e1847bSJuan Quintela {
798f5e1847bSJuan Quintela     FailoverId *fid = opaque;
799f5e1847bSJuan Quintela     const char *standby_id = qemu_opt_get(opts, "failover_pair_id");
800f5e1847bSJuan Quintela 
801f5e1847bSJuan Quintela     if (g_strcmp0(standby_id, fid->n->netclient_name) == 0) {
802f5e1847bSJuan Quintela         fid->id = g_strdup(opts->id);
803f5e1847bSJuan Quintela         return 1;
804f5e1847bSJuan Quintela     }
805f5e1847bSJuan Quintela 
806f5e1847bSJuan Quintela     return 0;
807f5e1847bSJuan Quintela }
808f5e1847bSJuan Quintela 
809f5e1847bSJuan Quintela /**
810f5e1847bSJuan Quintela  * Find the primary device id for this failover virtio-net
811f5e1847bSJuan Quintela  *
812f5e1847bSJuan Quintela  * @n: VirtIONet device
813f5e1847bSJuan Quintela  * @errp: returns an error if this function fails
814f5e1847bSJuan Quintela  */
815f5e1847bSJuan Quintela static char *failover_find_primary_device_id(VirtIONet *n)
816f5e1847bSJuan Quintela {
817f5e1847bSJuan Quintela     Error *err = NULL;
818f5e1847bSJuan Quintela     FailoverId fid;
819f5e1847bSJuan Quintela 
8203abad4a2SJuan Quintela     fid.n = n;
821f5e1847bSJuan Quintela     if (!qemu_opts_foreach(qemu_find_opts("device"),
822f5e1847bSJuan Quintela                            failover_set_primary, &fid, &err)) {
823f5e1847bSJuan Quintela         return NULL;
824f5e1847bSJuan Quintela     }
825f5e1847bSJuan Quintela     return fid.id;
826f5e1847bSJuan Quintela }
827f5e1847bSJuan Quintela 
82885d3b931SJuan Quintela /**
82985d3b931SJuan Quintela  * Find the primary device for this failover virtio-net
83085d3b931SJuan Quintela  *
83185d3b931SJuan Quintela  * @n: VirtIONet device
83285d3b931SJuan Quintela  * @errp: returns an error if this function fails
83385d3b931SJuan Quintela  */
8340a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n)
8359711cd0dSJens Freimann {
836f5e1847bSJuan Quintela     char *id = failover_find_primary_device_id(n);
8379711cd0dSJens Freimann 
838f5e1847bSJuan Quintela     if (!id) {
8399711cd0dSJens Freimann         return NULL;
8409711cd0dSJens Freimann     }
841f5e1847bSJuan Quintela 
8423abad4a2SJuan Quintela     return qdev_find_recursive(sysbus_get_default(), id);
8439711cd0dSJens Freimann }
8449711cd0dSJens Freimann 
84521e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp)
84621e8709bSJuan Quintela {
84721e8709bSJuan Quintela     Error *err = NULL;
84821e8709bSJuan Quintela     QemuOpts *opts;
84921e8709bSJuan Quintela     char *id;
85021e8709bSJuan Quintela     DeviceState *dev = failover_find_primary_device(n);
85121e8709bSJuan Quintela 
85221e8709bSJuan Quintela     if (dev) {
85321e8709bSJuan Quintela         return;
85421e8709bSJuan Quintela     }
85521e8709bSJuan Quintela 
85621e8709bSJuan Quintela     id = failover_find_primary_device_id(n);
85721e8709bSJuan Quintela     if (!id) {
85821e8709bSJuan Quintela         return;
85921e8709bSJuan Quintela     }
86021e8709bSJuan Quintela     opts = qemu_opts_find(qemu_find_opts("device"), id);
86121e8709bSJuan Quintela     if (opts) {
86221e8709bSJuan Quintela         dev = qdev_device_add(opts, &err);
86321e8709bSJuan Quintela         if (err) {
86421e8709bSJuan Quintela             qemu_opts_del(opts);
86521e8709bSJuan Quintela         }
86621e8709bSJuan Quintela     } else {
86721e8709bSJuan Quintela         error_setg(errp, "Primary device not found");
86821e8709bSJuan Quintela         error_append_hint(errp, "Virtio-net failover will not work. Make "
86921e8709bSJuan Quintela                           "sure primary device has parameter"
87021e8709bSJuan Quintela                           " failover_pair_id=<virtio-net-id>\n");
87121e8709bSJuan Quintela     }
87221e8709bSJuan Quintela     error_propagate(errp, err);
87321e8709bSJuan Quintela }
87421e8709bSJuan Quintela 
875d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features)
8766e790746SPaolo Bonzini {
87717a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
8789711cd0dSJens Freimann     Error *err = NULL;
8796e790746SPaolo Bonzini     int i;
8806e790746SPaolo Bonzini 
88175ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
88275ebec11SMaxime Coquelin             !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) {
88375ebec11SMaxime Coquelin         features &= ~(1ULL << VIRTIO_NET_F_MTU);
88475ebec11SMaxime Coquelin     }
88575ebec11SMaxime Coquelin 
886ef546f12SCornelia Huck     virtio_net_set_multiqueue(n,
88759079029SYuri Benditovich                               virtio_has_feature(features, VIRTIO_NET_F_RSS) ||
88895129d6fSCornelia Huck                               virtio_has_feature(features, VIRTIO_NET_F_MQ));
8896e790746SPaolo Bonzini 
890ef546f12SCornelia Huck     virtio_net_set_mrg_rx_bufs(n,
89195129d6fSCornelia Huck                                virtio_has_feature(features,
892bb9d17f8SCornelia Huck                                                   VIRTIO_NET_F_MRG_RXBUF),
89395129d6fSCornelia Huck                                virtio_has_feature(features,
894e22f0603SYuri Benditovich                                                   VIRTIO_F_VERSION_1),
895e22f0603SYuri Benditovich                                virtio_has_feature(features,
896e22f0603SYuri Benditovich                                                   VIRTIO_NET_F_HASH_REPORT));
8976e790746SPaolo Bonzini 
8982974e916SYuri Benditovich     n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
8992974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4);
9002974e916SYuri Benditovich     n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9012974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6);
902e22f0603SYuri Benditovich     n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS);
9032974e916SYuri Benditovich 
9046e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
905644c9858SDmitry Fleytman         n->curr_guest_offloads =
906644c9858SDmitry Fleytman             virtio_net_guest_offloads_by_features(features);
907644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
9086e790746SPaolo Bonzini     }
9096e790746SPaolo Bonzini 
9106e790746SPaolo Bonzini     for (i = 0;  i < n->max_queues; i++) {
9116e790746SPaolo Bonzini         NetClientState *nc = qemu_get_subqueue(n->nic, i);
9126e790746SPaolo Bonzini 
913ed8b4afeSNikolay Nikolaev         if (!get_vhost_net(nc->peer)) {
9146e790746SPaolo Bonzini             continue;
9156e790746SPaolo Bonzini         }
916ed8b4afeSNikolay Nikolaev         vhost_net_ack_features(get_vhost_net(nc->peer), features);
9176e790746SPaolo Bonzini     }
9180b1eaa88SStefan Fritsch 
91995129d6fSCornelia Huck     if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) {
9200b1eaa88SStefan Fritsch         memset(n->vlans, 0, MAX_VLAN >> 3);
9210b1eaa88SStefan Fritsch     } else {
9220b1eaa88SStefan Fritsch         memset(n->vlans, 0xff, MAX_VLAN >> 3);
9230b1eaa88SStefan Fritsch     }
9249711cd0dSJens Freimann 
9259711cd0dSJens Freimann     if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) {
9269711cd0dSJens Freimann         qapi_event_send_failover_negotiated(n->netclient_name);
927e2bde83eSJuan Quintela         qatomic_set(&n->failover_primary_hidden, false);
9289711cd0dSJens Freimann         failover_add_primary(n, &err);
9299711cd0dSJens Freimann         if (err) {
9309711cd0dSJens Freimann             warn_report_err(err);
9319711cd0dSJens Freimann         }
9326e790746SPaolo Bonzini     }
93321e8709bSJuan Quintela }
9346e790746SPaolo Bonzini 
9356e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
9366e790746SPaolo Bonzini                                      struct iovec *iov, unsigned int iov_cnt)
9376e790746SPaolo Bonzini {
9386e790746SPaolo Bonzini     uint8_t on;
9396e790746SPaolo Bonzini     size_t s;
940b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
9416e790746SPaolo Bonzini 
9426e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
9436e790746SPaolo Bonzini     if (s != sizeof(on)) {
9446e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9456e790746SPaolo Bonzini     }
9466e790746SPaolo Bonzini 
9476e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
9486e790746SPaolo Bonzini         n->promisc = on;
9496e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
9506e790746SPaolo Bonzini         n->allmulti = on;
9516e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
9526e790746SPaolo Bonzini         n->alluni = on;
9536e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
9546e790746SPaolo Bonzini         n->nomulti = on;
9556e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
9566e790746SPaolo Bonzini         n->nouni = on;
9576e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
9586e790746SPaolo Bonzini         n->nobcast = on;
9596e790746SPaolo Bonzini     } else {
9606e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9616e790746SPaolo Bonzini     }
9626e790746SPaolo Bonzini 
963b1be4280SAmos Kong     rxfilter_notify(nc);
964b1be4280SAmos Kong 
9656e790746SPaolo Bonzini     return VIRTIO_NET_OK;
9666e790746SPaolo Bonzini }
9676e790746SPaolo Bonzini 
968644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
969644c9858SDmitry Fleytman                                      struct iovec *iov, unsigned int iov_cnt)
970644c9858SDmitry Fleytman {
971644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
972644c9858SDmitry Fleytman     uint64_t offloads;
973644c9858SDmitry Fleytman     size_t s;
974644c9858SDmitry Fleytman 
97595129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
976644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
977644c9858SDmitry Fleytman     }
978644c9858SDmitry Fleytman 
979644c9858SDmitry Fleytman     s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
980644c9858SDmitry Fleytman     if (s != sizeof(offloads)) {
981644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
982644c9858SDmitry Fleytman     }
983644c9858SDmitry Fleytman 
984644c9858SDmitry Fleytman     if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
985644c9858SDmitry Fleytman         uint64_t supported_offloads;
986644c9858SDmitry Fleytman 
987189ae6bbSJason Wang         offloads = virtio_ldq_p(vdev, &offloads);
988189ae6bbSJason Wang 
989644c9858SDmitry Fleytman         if (!n->has_vnet_hdr) {
990644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
991644c9858SDmitry Fleytman         }
992644c9858SDmitry Fleytman 
9932974e916SYuri Benditovich         n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
9942974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4);
9952974e916SYuri Benditovich         n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
9962974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6);
9972974e916SYuri Benditovich         virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT);
9982974e916SYuri Benditovich 
999644c9858SDmitry Fleytman         supported_offloads = virtio_net_supported_guest_offloads(n);
1000644c9858SDmitry Fleytman         if (offloads & ~supported_offloads) {
1001644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1002644c9858SDmitry Fleytman         }
1003644c9858SDmitry Fleytman 
1004644c9858SDmitry Fleytman         n->curr_guest_offloads = offloads;
1005644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
1006644c9858SDmitry Fleytman 
1007644c9858SDmitry Fleytman         return VIRTIO_NET_OK;
1008644c9858SDmitry Fleytman     } else {
1009644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1010644c9858SDmitry Fleytman     }
1011644c9858SDmitry Fleytman }
1012644c9858SDmitry Fleytman 
10136e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
10146e790746SPaolo Bonzini                                  struct iovec *iov, unsigned int iov_cnt)
10156e790746SPaolo Bonzini {
10161399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
10176e790746SPaolo Bonzini     struct virtio_net_ctrl_mac mac_data;
10186e790746SPaolo Bonzini     size_t s;
1019b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
10206e790746SPaolo Bonzini 
10216e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
10226e790746SPaolo Bonzini         if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
10236e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
10246e790746SPaolo Bonzini         }
10256e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
10266e790746SPaolo Bonzini         assert(s == sizeof(n->mac));
10276e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1028b1be4280SAmos Kong         rxfilter_notify(nc);
1029b1be4280SAmos Kong 
10306e790746SPaolo Bonzini         return VIRTIO_NET_OK;
10316e790746SPaolo Bonzini     }
10326e790746SPaolo Bonzini 
10336e790746SPaolo Bonzini     if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
10346e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
10356e790746SPaolo Bonzini     }
10366e790746SPaolo Bonzini 
1037cae2e556SAmos Kong     int in_use = 0;
1038cae2e556SAmos Kong     int first_multi = 0;
1039cae2e556SAmos Kong     uint8_t uni_overflow = 0;
1040cae2e556SAmos Kong     uint8_t multi_overflow = 0;
1041cae2e556SAmos Kong     uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
10426e790746SPaolo Bonzini 
10436e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10446e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10451399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10466e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1047b1be4280SAmos Kong         goto error;
10486e790746SPaolo Bonzini     }
10496e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10506e790746SPaolo Bonzini 
10516e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
1052b1be4280SAmos Kong         goto error;
10536e790746SPaolo Bonzini     }
10546e790746SPaolo Bonzini 
10556e790746SPaolo Bonzini     if (mac_data.entries <= MAC_TABLE_ENTRIES) {
1056cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, macs,
10576e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
10586e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1059b1be4280SAmos Kong             goto error;
10606e790746SPaolo Bonzini         }
1061cae2e556SAmos Kong         in_use += mac_data.entries;
10626e790746SPaolo Bonzini     } else {
1063cae2e556SAmos Kong         uni_overflow = 1;
10646e790746SPaolo Bonzini     }
10656e790746SPaolo Bonzini 
10666e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
10676e790746SPaolo Bonzini 
1068cae2e556SAmos Kong     first_multi = in_use;
10696e790746SPaolo Bonzini 
10706e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10716e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10721399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10736e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1074b1be4280SAmos Kong         goto error;
10756e790746SPaolo Bonzini     }
10766e790746SPaolo Bonzini 
10776e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10786e790746SPaolo Bonzini 
10796e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
1080b1be4280SAmos Kong         goto error;
10816e790746SPaolo Bonzini     }
10826e790746SPaolo Bonzini 
1083edc24385SMichael S. Tsirkin     if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
1084cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
10856e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
10866e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1087b1be4280SAmos Kong             goto error;
10886e790746SPaolo Bonzini         }
1089cae2e556SAmos Kong         in_use += mac_data.entries;
10906e790746SPaolo Bonzini     } else {
1091cae2e556SAmos Kong         multi_overflow = 1;
10926e790746SPaolo Bonzini     }
10936e790746SPaolo Bonzini 
1094cae2e556SAmos Kong     n->mac_table.in_use = in_use;
1095cae2e556SAmos Kong     n->mac_table.first_multi = first_multi;
1096cae2e556SAmos Kong     n->mac_table.uni_overflow = uni_overflow;
1097cae2e556SAmos Kong     n->mac_table.multi_overflow = multi_overflow;
1098cae2e556SAmos Kong     memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
1099cae2e556SAmos Kong     g_free(macs);
1100b1be4280SAmos Kong     rxfilter_notify(nc);
1101b1be4280SAmos Kong 
11026e790746SPaolo Bonzini     return VIRTIO_NET_OK;
1103b1be4280SAmos Kong 
1104b1be4280SAmos Kong error:
1105cae2e556SAmos Kong     g_free(macs);
1106b1be4280SAmos Kong     return VIRTIO_NET_ERR;
11076e790746SPaolo Bonzini }
11086e790746SPaolo Bonzini 
11096e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
11106e790746SPaolo Bonzini                                         struct iovec *iov, unsigned int iov_cnt)
11116e790746SPaolo Bonzini {
11121399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
11136e790746SPaolo Bonzini     uint16_t vid;
11146e790746SPaolo Bonzini     size_t s;
1115b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
11166e790746SPaolo Bonzini 
11176e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
11181399c60dSRusty Russell     vid = virtio_lduw_p(vdev, &vid);
11196e790746SPaolo Bonzini     if (s != sizeof(vid)) {
11206e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11216e790746SPaolo Bonzini     }
11226e790746SPaolo Bonzini 
11236e790746SPaolo Bonzini     if (vid >= MAX_VLAN)
11246e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11256e790746SPaolo Bonzini 
11266e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
11276e790746SPaolo Bonzini         n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
11286e790746SPaolo Bonzini     else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
11296e790746SPaolo Bonzini         n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
11306e790746SPaolo Bonzini     else
11316e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11326e790746SPaolo Bonzini 
1133b1be4280SAmos Kong     rxfilter_notify(nc);
1134b1be4280SAmos Kong 
11356e790746SPaolo Bonzini     return VIRTIO_NET_OK;
11366e790746SPaolo Bonzini }
11376e790746SPaolo Bonzini 
1138f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd,
1139f57fcf70SJason Wang                                       struct iovec *iov, unsigned int iov_cnt)
1140f57fcf70SJason Wang {
11419d8c6a25SDr. David Alan Gilbert     trace_virtio_net_handle_announce(n->announce_timer.round);
1142f57fcf70SJason Wang     if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK &&
1143f57fcf70SJason Wang         n->status & VIRTIO_NET_S_ANNOUNCE) {
1144f57fcf70SJason Wang         n->status &= ~VIRTIO_NET_S_ANNOUNCE;
11459d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
11469d8c6a25SDr. David Alan Gilbert             qemu_announce_timer_step(&n->announce_timer);
1147f57fcf70SJason Wang         }
1148f57fcf70SJason Wang         return VIRTIO_NET_OK;
1149f57fcf70SJason Wang     } else {
1150f57fcf70SJason Wang         return VIRTIO_NET_ERR;
1151f57fcf70SJason Wang     }
1152f57fcf70SJason Wang }
1153f57fcf70SJason Wang 
115459079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n)
115559079029SYuri Benditovich {
115659079029SYuri Benditovich     if (n->rss_data.enabled) {
115759079029SYuri Benditovich         trace_virtio_net_rss_disable();
115859079029SYuri Benditovich     }
115959079029SYuri Benditovich     n->rss_data.enabled = false;
116059079029SYuri Benditovich }
116159079029SYuri Benditovich 
116259079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n,
1163e22f0603SYuri Benditovich                                       struct iovec *iov,
1164e22f0603SYuri Benditovich                                       unsigned int iov_cnt,
1165e22f0603SYuri Benditovich                                       bool do_rss)
116659079029SYuri Benditovich {
116759079029SYuri Benditovich     VirtIODevice *vdev = VIRTIO_DEVICE(n);
116859079029SYuri Benditovich     struct virtio_net_rss_config cfg;
116959079029SYuri Benditovich     size_t s, offset = 0, size_get;
117059079029SYuri Benditovich     uint16_t queues, i;
117159079029SYuri Benditovich     struct {
117259079029SYuri Benditovich         uint16_t us;
117359079029SYuri Benditovich         uint8_t b;
117459079029SYuri Benditovich     } QEMU_PACKED temp;
117559079029SYuri Benditovich     const char *err_msg = "";
117659079029SYuri Benditovich     uint32_t err_value = 0;
117759079029SYuri Benditovich 
1178e22f0603SYuri Benditovich     if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) {
117959079029SYuri Benditovich         err_msg = "RSS is not negotiated";
118059079029SYuri Benditovich         goto error;
118159079029SYuri Benditovich     }
1182e22f0603SYuri Benditovich     if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) {
1183e22f0603SYuri Benditovich         err_msg = "Hash report is not negotiated";
1184e22f0603SYuri Benditovich         goto error;
1185e22f0603SYuri Benditovich     }
118659079029SYuri Benditovich     size_get = offsetof(struct virtio_net_rss_config, indirection_table);
118759079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get);
118859079029SYuri Benditovich     if (s != size_get) {
118959079029SYuri Benditovich         err_msg = "Short command buffer";
119059079029SYuri Benditovich         err_value = (uint32_t)s;
119159079029SYuri Benditovich         goto error;
119259079029SYuri Benditovich     }
119359079029SYuri Benditovich     n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types);
119459079029SYuri Benditovich     n->rss_data.indirections_len =
119559079029SYuri Benditovich         virtio_lduw_p(vdev, &cfg.indirection_table_mask);
119659079029SYuri Benditovich     n->rss_data.indirections_len++;
1197e22f0603SYuri Benditovich     if (!do_rss) {
1198e22f0603SYuri Benditovich         n->rss_data.indirections_len = 1;
1199e22f0603SYuri Benditovich     }
120059079029SYuri Benditovich     if (!is_power_of_2(n->rss_data.indirections_len)) {
120159079029SYuri Benditovich         err_msg = "Invalid size of indirection table";
120259079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
120359079029SYuri Benditovich         goto error;
120459079029SYuri Benditovich     }
120559079029SYuri Benditovich     if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) {
120659079029SYuri Benditovich         err_msg = "Too large indirection table";
120759079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
120859079029SYuri Benditovich         goto error;
120959079029SYuri Benditovich     }
1210e22f0603SYuri Benditovich     n->rss_data.default_queue = do_rss ?
1211e22f0603SYuri Benditovich         virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0;
121259079029SYuri Benditovich     if (n->rss_data.default_queue >= n->max_queues) {
121359079029SYuri Benditovich         err_msg = "Invalid default queue";
121459079029SYuri Benditovich         err_value = n->rss_data.default_queue;
121559079029SYuri Benditovich         goto error;
121659079029SYuri Benditovich     }
121759079029SYuri Benditovich     offset += size_get;
121859079029SYuri Benditovich     size_get = sizeof(uint16_t) * n->rss_data.indirections_len;
121959079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
122059079029SYuri Benditovich     n->rss_data.indirections_table = g_malloc(size_get);
122159079029SYuri Benditovich     if (!n->rss_data.indirections_table) {
122259079029SYuri Benditovich         err_msg = "Can't allocate indirections table";
122359079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
122459079029SYuri Benditovich         goto error;
122559079029SYuri Benditovich     }
122659079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset,
122759079029SYuri Benditovich                    n->rss_data.indirections_table, size_get);
122859079029SYuri Benditovich     if (s != size_get) {
122959079029SYuri Benditovich         err_msg = "Short indirection table buffer";
123059079029SYuri Benditovich         err_value = (uint32_t)s;
123159079029SYuri Benditovich         goto error;
123259079029SYuri Benditovich     }
123359079029SYuri Benditovich     for (i = 0; i < n->rss_data.indirections_len; ++i) {
123459079029SYuri Benditovich         uint16_t val = n->rss_data.indirections_table[i];
123559079029SYuri Benditovich         n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val);
123659079029SYuri Benditovich     }
123759079029SYuri Benditovich     offset += size_get;
123859079029SYuri Benditovich     size_get = sizeof(temp);
123959079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get);
124059079029SYuri Benditovich     if (s != size_get) {
124159079029SYuri Benditovich         err_msg = "Can't get queues";
124259079029SYuri Benditovich         err_value = (uint32_t)s;
124359079029SYuri Benditovich         goto error;
124459079029SYuri Benditovich     }
1245e22f0603SYuri Benditovich     queues = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queues;
124659079029SYuri Benditovich     if (queues == 0 || queues > n->max_queues) {
124759079029SYuri Benditovich         err_msg = "Invalid number of queues";
124859079029SYuri Benditovich         err_value = queues;
124959079029SYuri Benditovich         goto error;
125059079029SYuri Benditovich     }
125159079029SYuri Benditovich     if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) {
125259079029SYuri Benditovich         err_msg = "Invalid key size";
125359079029SYuri Benditovich         err_value = temp.b;
125459079029SYuri Benditovich         goto error;
125559079029SYuri Benditovich     }
125659079029SYuri Benditovich     if (!temp.b && n->rss_data.hash_types) {
125759079029SYuri Benditovich         err_msg = "No key provided";
125859079029SYuri Benditovich         err_value = 0;
125959079029SYuri Benditovich         goto error;
126059079029SYuri Benditovich     }
126159079029SYuri Benditovich     if (!temp.b && !n->rss_data.hash_types) {
126259079029SYuri Benditovich         virtio_net_disable_rss(n);
126359079029SYuri Benditovich         return queues;
126459079029SYuri Benditovich     }
126559079029SYuri Benditovich     offset += size_get;
126659079029SYuri Benditovich     size_get = temp.b;
126759079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get);
126859079029SYuri Benditovich     if (s != size_get) {
126959079029SYuri Benditovich         err_msg = "Can get key buffer";
127059079029SYuri Benditovich         err_value = (uint32_t)s;
127159079029SYuri Benditovich         goto error;
127259079029SYuri Benditovich     }
127359079029SYuri Benditovich     n->rss_data.enabled = true;
127459079029SYuri Benditovich     trace_virtio_net_rss_enable(n->rss_data.hash_types,
127559079029SYuri Benditovich                                 n->rss_data.indirections_len,
127659079029SYuri Benditovich                                 temp.b);
127759079029SYuri Benditovich     return queues;
127859079029SYuri Benditovich error:
127959079029SYuri Benditovich     trace_virtio_net_rss_error(err_msg, err_value);
128059079029SYuri Benditovich     virtio_net_disable_rss(n);
128159079029SYuri Benditovich     return 0;
128259079029SYuri Benditovich }
128359079029SYuri Benditovich 
12846e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
12856e790746SPaolo Bonzini                                 struct iovec *iov, unsigned int iov_cnt)
12866e790746SPaolo Bonzini {
128717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
12886e790746SPaolo Bonzini     uint16_t queues;
12896e790746SPaolo Bonzini 
129059079029SYuri Benditovich     virtio_net_disable_rss(n);
1291e22f0603SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) {
1292e22f0603SYuri Benditovich         queues = virtio_net_handle_rss(n, iov, iov_cnt, false);
1293e22f0603SYuri Benditovich         return queues ? VIRTIO_NET_OK : VIRTIO_NET_ERR;
1294e22f0603SYuri Benditovich     }
129559079029SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) {
1296e22f0603SYuri Benditovich         queues = virtio_net_handle_rss(n, iov, iov_cnt, true);
129759079029SYuri Benditovich     } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
129859079029SYuri Benditovich         struct virtio_net_ctrl_mq mq;
129959079029SYuri Benditovich         size_t s;
130059079029SYuri Benditovich         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) {
130159079029SYuri Benditovich             return VIRTIO_NET_ERR;
130259079029SYuri Benditovich         }
13036e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
13046e790746SPaolo Bonzini         if (s != sizeof(mq)) {
13056e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
13066e790746SPaolo Bonzini         }
130759079029SYuri Benditovich         queues = virtio_lduw_p(vdev, &mq.virtqueue_pairs);
13086e790746SPaolo Bonzini 
130959079029SYuri Benditovich     } else {
13106e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
13116e790746SPaolo Bonzini     }
13126e790746SPaolo Bonzini 
13136e790746SPaolo Bonzini     if (queues < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
13146e790746SPaolo Bonzini         queues > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
13156e790746SPaolo Bonzini         queues > n->max_queues ||
13166e790746SPaolo Bonzini         !n->multiqueue) {
13176e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
13186e790746SPaolo Bonzini     }
13196e790746SPaolo Bonzini 
13206e790746SPaolo Bonzini     n->curr_queues = queues;
13216e790746SPaolo Bonzini     /* stop the backend before changing the number of queues to avoid handling a
13226e790746SPaolo Bonzini      * disabled queue */
132317a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
13246e790746SPaolo Bonzini     virtio_net_set_queues(n);
13256e790746SPaolo Bonzini 
13266e790746SPaolo Bonzini     return VIRTIO_NET_OK;
13276e790746SPaolo Bonzini }
1328ba7eadb5SGreg Kurz 
13296e790746SPaolo Bonzini static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
13306e790746SPaolo Bonzini {
133117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
13326e790746SPaolo Bonzini     struct virtio_net_ctrl_hdr ctrl;
13336e790746SPaolo Bonzini     virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
133451b19ebeSPaolo Bonzini     VirtQueueElement *elem;
13356e790746SPaolo Bonzini     size_t s;
1336771b6ed3SJason Wang     struct iovec *iov, *iov2;
13376e790746SPaolo Bonzini     unsigned int iov_cnt;
13386e790746SPaolo Bonzini 
133951b19ebeSPaolo Bonzini     for (;;) {
134051b19ebeSPaolo Bonzini         elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
134151b19ebeSPaolo Bonzini         if (!elem) {
134251b19ebeSPaolo Bonzini             break;
134351b19ebeSPaolo Bonzini         }
134451b19ebeSPaolo Bonzini         if (iov_size(elem->in_sg, elem->in_num) < sizeof(status) ||
134551b19ebeSPaolo Bonzini             iov_size(elem->out_sg, elem->out_num) < sizeof(ctrl)) {
1346ba7eadb5SGreg Kurz             virtio_error(vdev, "virtio-net ctrl missing headers");
1347ba7eadb5SGreg Kurz             virtqueue_detach_element(vq, elem, 0);
1348ba7eadb5SGreg Kurz             g_free(elem);
1349ba7eadb5SGreg Kurz             break;
13506e790746SPaolo Bonzini         }
13516e790746SPaolo Bonzini 
135251b19ebeSPaolo Bonzini         iov_cnt = elem->out_num;
135351b19ebeSPaolo Bonzini         iov2 = iov = g_memdup(elem->out_sg, sizeof(struct iovec) * elem->out_num);
13546e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl));
13556e790746SPaolo Bonzini         iov_discard_front(&iov, &iov_cnt, sizeof(ctrl));
13566e790746SPaolo Bonzini         if (s != sizeof(ctrl)) {
13576e790746SPaolo Bonzini             status = VIRTIO_NET_ERR;
13586e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
13596e790746SPaolo Bonzini             status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt);
13606e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
13616e790746SPaolo Bonzini             status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt);
13626e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
13636e790746SPaolo Bonzini             status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt);
1364f57fcf70SJason Wang         } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) {
1365f57fcf70SJason Wang             status = virtio_net_handle_announce(n, ctrl.cmd, iov, iov_cnt);
13666e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
13676e790746SPaolo Bonzini             status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt);
1368644c9858SDmitry Fleytman         } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
1369644c9858SDmitry Fleytman             status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt);
13706e790746SPaolo Bonzini         }
13716e790746SPaolo Bonzini 
137251b19ebeSPaolo Bonzini         s = iov_from_buf(elem->in_sg, elem->in_num, 0, &status, sizeof(status));
13736e790746SPaolo Bonzini         assert(s == sizeof(status));
13746e790746SPaolo Bonzini 
137551b19ebeSPaolo Bonzini         virtqueue_push(vq, elem, sizeof(status));
13766e790746SPaolo Bonzini         virtio_notify(vdev, vq);
1377771b6ed3SJason Wang         g_free(iov2);
137851b19ebeSPaolo Bonzini         g_free(elem);
13796e790746SPaolo Bonzini     }
13806e790746SPaolo Bonzini }
13816e790746SPaolo Bonzini 
13826e790746SPaolo Bonzini /* RX */
13836e790746SPaolo Bonzini 
13846e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
13856e790746SPaolo Bonzini {
138617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
13876e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(vq));
13886e790746SPaolo Bonzini 
13896e790746SPaolo Bonzini     qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
13906e790746SPaolo Bonzini }
13916e790746SPaolo Bonzini 
1392b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc)
13936e790746SPaolo Bonzini {
13946e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
139517a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
13966e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
13976e790746SPaolo Bonzini 
139817a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
1399b8c4b67eSPhilippe Mathieu-Daudé         return false;
14006e790746SPaolo Bonzini     }
14016e790746SPaolo Bonzini 
14026e790746SPaolo Bonzini     if (nc->queue_index >= n->curr_queues) {
1403b8c4b67eSPhilippe Mathieu-Daudé         return false;
14046e790746SPaolo Bonzini     }
14056e790746SPaolo Bonzini 
14066e790746SPaolo Bonzini     if (!virtio_queue_ready(q->rx_vq) ||
140717a0ca55SKONRAD Frederic         !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
1408b8c4b67eSPhilippe Mathieu-Daudé         return false;
14096e790746SPaolo Bonzini     }
14106e790746SPaolo Bonzini 
1411b8c4b67eSPhilippe Mathieu-Daudé     return true;
14126e790746SPaolo Bonzini }
14136e790746SPaolo Bonzini 
14146e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
14156e790746SPaolo Bonzini {
14166e790746SPaolo Bonzini     VirtIONet *n = q->n;
14176e790746SPaolo Bonzini     if (virtio_queue_empty(q->rx_vq) ||
14186e790746SPaolo Bonzini         (n->mergeable_rx_bufs &&
14196e790746SPaolo Bonzini          !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
14206e790746SPaolo Bonzini         virtio_queue_set_notification(q->rx_vq, 1);
14216e790746SPaolo Bonzini 
14226e790746SPaolo Bonzini         /* To avoid a race condition where the guest has made some buffers
14236e790746SPaolo Bonzini          * available after the above check but before notification was
14246e790746SPaolo Bonzini          * enabled, check for available buffers again.
14256e790746SPaolo Bonzini          */
14266e790746SPaolo Bonzini         if (virtio_queue_empty(q->rx_vq) ||
14276e790746SPaolo Bonzini             (n->mergeable_rx_bufs &&
14286e790746SPaolo Bonzini              !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
14296e790746SPaolo Bonzini             return 0;
14306e790746SPaolo Bonzini         }
14316e790746SPaolo Bonzini     }
14326e790746SPaolo Bonzini 
14336e790746SPaolo Bonzini     virtio_queue_set_notification(q->rx_vq, 0);
14346e790746SPaolo Bonzini     return 1;
14356e790746SPaolo Bonzini }
14366e790746SPaolo Bonzini 
14371399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr)
1438032a74a1SCédric Le Goater {
14391399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->hdr_len);
14401399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->gso_size);
14411399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_start);
14421399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_offset);
1443032a74a1SCédric Le Goater }
1444032a74a1SCédric Le Goater 
14456e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
14466e790746SPaolo Bonzini  * it never finds out that the packets don't have valid checksums.  This
14476e790746SPaolo Bonzini  * causes dhclient to get upset.  Fedora's carried a patch for ages to
14486e790746SPaolo Bonzini  * fix this with Xen but it hasn't appeared in an upstream release of
14496e790746SPaolo Bonzini  * dhclient yet.
14506e790746SPaolo Bonzini  *
14516e790746SPaolo Bonzini  * To avoid breaking existing guests, we catch udp packets and add
14526e790746SPaolo Bonzini  * checksums.  This is terrible but it's better than hacking the guest
14536e790746SPaolo Bonzini  * kernels.
14546e790746SPaolo Bonzini  *
14556e790746SPaolo Bonzini  * N.B. if we introduce a zero-copy API, this operation is no longer free so
14566e790746SPaolo Bonzini  * we should provide a mechanism to disable it to avoid polluting the host
14576e790746SPaolo Bonzini  * cache.
14586e790746SPaolo Bonzini  */
14596e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
14606e790746SPaolo Bonzini                                         uint8_t *buf, size_t size)
14616e790746SPaolo Bonzini {
14626e790746SPaolo Bonzini     if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
14636e790746SPaolo Bonzini         (size > 27 && size < 1500) && /* normal sized MTU */
14646e790746SPaolo Bonzini         (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
14656e790746SPaolo Bonzini         (buf[23] == 17) && /* ip.protocol == UDP */
14666e790746SPaolo Bonzini         (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
1467*f5746335SBin Meng         net_checksum_calculate(buf, size, CSUM_UDP);
14686e790746SPaolo Bonzini         hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
14696e790746SPaolo Bonzini     }
14706e790746SPaolo Bonzini }
14716e790746SPaolo Bonzini 
14726e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
14736e790746SPaolo Bonzini                            const void *buf, size_t size)
14746e790746SPaolo Bonzini {
14756e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
14766e790746SPaolo Bonzini         /* FIXME this cast is evil */
14776e790746SPaolo Bonzini         void *wbuf = (void *)buf;
14786e790746SPaolo Bonzini         work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
14796e790746SPaolo Bonzini                                     size - n->host_hdr_len);
14801bfa316cSGreg Kurz 
14811bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
14821399c60dSRusty Russell             virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf);
14831bfa316cSGreg Kurz         }
14846e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
14856e790746SPaolo Bonzini     } else {
14866e790746SPaolo Bonzini         struct virtio_net_hdr hdr = {
14876e790746SPaolo Bonzini             .flags = 0,
14886e790746SPaolo Bonzini             .gso_type = VIRTIO_NET_HDR_GSO_NONE
14896e790746SPaolo Bonzini         };
14906e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
14916e790746SPaolo Bonzini     }
14926e790746SPaolo Bonzini }
14936e790746SPaolo Bonzini 
14946e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
14956e790746SPaolo Bonzini {
14966e790746SPaolo Bonzini     static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
14976e790746SPaolo Bonzini     static const uint8_t vlan[] = {0x81, 0x00};
14986e790746SPaolo Bonzini     uint8_t *ptr = (uint8_t *)buf;
14996e790746SPaolo Bonzini     int i;
15006e790746SPaolo Bonzini 
15016e790746SPaolo Bonzini     if (n->promisc)
15026e790746SPaolo Bonzini         return 1;
15036e790746SPaolo Bonzini 
15046e790746SPaolo Bonzini     ptr += n->host_hdr_len;
15056e790746SPaolo Bonzini 
15066e790746SPaolo Bonzini     if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
15077542d3e7SPeter Maydell         int vid = lduw_be_p(ptr + 14) & 0xfff;
15086e790746SPaolo Bonzini         if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
15096e790746SPaolo Bonzini             return 0;
15106e790746SPaolo Bonzini     }
15116e790746SPaolo Bonzini 
15126e790746SPaolo Bonzini     if (ptr[0] & 1) { // multicast
15136e790746SPaolo Bonzini         if (!memcmp(ptr, bcast, sizeof(bcast))) {
15146e790746SPaolo Bonzini             return !n->nobcast;
15156e790746SPaolo Bonzini         } else if (n->nomulti) {
15166e790746SPaolo Bonzini             return 0;
15176e790746SPaolo Bonzini         } else if (n->allmulti || n->mac_table.multi_overflow) {
15186e790746SPaolo Bonzini             return 1;
15196e790746SPaolo Bonzini         }
15206e790746SPaolo Bonzini 
15216e790746SPaolo Bonzini         for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
15226e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
15236e790746SPaolo Bonzini                 return 1;
15246e790746SPaolo Bonzini             }
15256e790746SPaolo Bonzini         }
15266e790746SPaolo Bonzini     } else { // unicast
15276e790746SPaolo Bonzini         if (n->nouni) {
15286e790746SPaolo Bonzini             return 0;
15296e790746SPaolo Bonzini         } else if (n->alluni || n->mac_table.uni_overflow) {
15306e790746SPaolo Bonzini             return 1;
15316e790746SPaolo Bonzini         } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
15326e790746SPaolo Bonzini             return 1;
15336e790746SPaolo Bonzini         }
15346e790746SPaolo Bonzini 
15356e790746SPaolo Bonzini         for (i = 0; i < n->mac_table.first_multi; i++) {
15366e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
15376e790746SPaolo Bonzini                 return 1;
15386e790746SPaolo Bonzini             }
15396e790746SPaolo Bonzini         }
15406e790746SPaolo Bonzini     }
15416e790746SPaolo Bonzini 
15426e790746SPaolo Bonzini     return 0;
15436e790746SPaolo Bonzini }
15446e790746SPaolo Bonzini 
15454474e37aSYuri Benditovich static uint8_t virtio_net_get_hash_type(bool isip4,
15464474e37aSYuri Benditovich                                         bool isip6,
15474474e37aSYuri Benditovich                                         bool isudp,
15484474e37aSYuri Benditovich                                         bool istcp,
15494474e37aSYuri Benditovich                                         uint32_t types)
15504474e37aSYuri Benditovich {
15514474e37aSYuri Benditovich     if (isip4) {
15524474e37aSYuri Benditovich         if (istcp && (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4)) {
15534474e37aSYuri Benditovich             return NetPktRssIpV4Tcp;
15544474e37aSYuri Benditovich         }
15554474e37aSYuri Benditovich         if (isudp && (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4)) {
15564474e37aSYuri Benditovich             return NetPktRssIpV4Udp;
15574474e37aSYuri Benditovich         }
15584474e37aSYuri Benditovich         if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) {
15594474e37aSYuri Benditovich             return NetPktRssIpV4;
15604474e37aSYuri Benditovich         }
15614474e37aSYuri Benditovich     } else if (isip6) {
15624474e37aSYuri Benditovich         uint32_t mask = VIRTIO_NET_RSS_HASH_TYPE_TCP_EX |
15634474e37aSYuri Benditovich                         VIRTIO_NET_RSS_HASH_TYPE_TCPv6;
15644474e37aSYuri Benditovich 
15654474e37aSYuri Benditovich         if (istcp && (types & mask)) {
15664474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) ?
15674474e37aSYuri Benditovich                 NetPktRssIpV6TcpEx : NetPktRssIpV6Tcp;
15684474e37aSYuri Benditovich         }
15694474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_UDP_EX | VIRTIO_NET_RSS_HASH_TYPE_UDPv6;
15704474e37aSYuri Benditovich         if (isudp && (types & mask)) {
15714474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) ?
15724474e37aSYuri Benditovich                 NetPktRssIpV6UdpEx : NetPktRssIpV6Udp;
15734474e37aSYuri Benditovich         }
15744474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_IP_EX | VIRTIO_NET_RSS_HASH_TYPE_IPv6;
15754474e37aSYuri Benditovich         if (types & mask) {
15764474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) ?
15774474e37aSYuri Benditovich                 NetPktRssIpV6Ex : NetPktRssIpV6;
15784474e37aSYuri Benditovich         }
15794474e37aSYuri Benditovich     }
15804474e37aSYuri Benditovich     return 0xff;
15814474e37aSYuri Benditovich }
15824474e37aSYuri Benditovich 
1583e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report,
1584e22f0603SYuri Benditovich                                    uint32_t hash)
1585e22f0603SYuri Benditovich {
1586e22f0603SYuri Benditovich     struct virtio_net_hdr_v1_hash *hdr = (void *)buf;
1587e22f0603SYuri Benditovich     hdr->hash_value = hash;
1588e22f0603SYuri Benditovich     hdr->hash_report = report;
1589e22f0603SYuri Benditovich }
1590e22f0603SYuri Benditovich 
15914474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf,
159297cd965cSPaolo Bonzini                                   size_t size)
15936e790746SPaolo Bonzini {
15946e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1595e22f0603SYuri Benditovich     unsigned int index = nc->queue_index, new_index = index;
15964474e37aSYuri Benditovich     struct NetRxPkt *pkt = n->rx_pkt;
15974474e37aSYuri Benditovich     uint8_t net_hash_type;
15984474e37aSYuri Benditovich     uint32_t hash;
15994474e37aSYuri Benditovich     bool isip4, isip6, isudp, istcp;
1600e22f0603SYuri Benditovich     static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = {
1601e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv4,
1602e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv4,
1603e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6,
1604e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6,
1605e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6_EX,
1606e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6_EX,
1607e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv4,
1608e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6,
1609e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6_EX
1610e22f0603SYuri Benditovich     };
16114474e37aSYuri Benditovich 
16124474e37aSYuri Benditovich     net_rx_pkt_set_protocols(pkt, buf + n->host_hdr_len,
16134474e37aSYuri Benditovich                              size - n->host_hdr_len);
16144474e37aSYuri Benditovich     net_rx_pkt_get_protocols(pkt, &isip4, &isip6, &isudp, &istcp);
16154474e37aSYuri Benditovich     if (isip4 && (net_rx_pkt_get_ip4_info(pkt)->fragment)) {
16164474e37aSYuri Benditovich         istcp = isudp = false;
16174474e37aSYuri Benditovich     }
16184474e37aSYuri Benditovich     if (isip6 && (net_rx_pkt_get_ip6_info(pkt)->fragment)) {
16194474e37aSYuri Benditovich         istcp = isudp = false;
16204474e37aSYuri Benditovich     }
16214474e37aSYuri Benditovich     net_hash_type = virtio_net_get_hash_type(isip4, isip6, isudp, istcp,
16224474e37aSYuri Benditovich                                              n->rss_data.hash_types);
16234474e37aSYuri Benditovich     if (net_hash_type > NetPktRssIpV6UdpEx) {
1624e22f0603SYuri Benditovich         if (n->rss_data.populate_hash) {
1625e22f0603SYuri Benditovich             virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0);
1626e22f0603SYuri Benditovich         }
1627e22f0603SYuri Benditovich         return n->rss_data.redirect ? n->rss_data.default_queue : -1;
16284474e37aSYuri Benditovich     }
16294474e37aSYuri Benditovich 
16304474e37aSYuri Benditovich     hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key);
1631e22f0603SYuri Benditovich 
1632e22f0603SYuri Benditovich     if (n->rss_data.populate_hash) {
1633e22f0603SYuri Benditovich         virtio_set_packet_hash(buf, reports[net_hash_type], hash);
1634e22f0603SYuri Benditovich     }
1635e22f0603SYuri Benditovich 
1636e22f0603SYuri Benditovich     if (n->rss_data.redirect) {
16374474e37aSYuri Benditovich         new_index = hash & (n->rss_data.indirections_len - 1);
16384474e37aSYuri Benditovich         new_index = n->rss_data.indirections_table[new_index];
16394474e37aSYuri Benditovich     }
1640e22f0603SYuri Benditovich 
1641e22f0603SYuri Benditovich     return (index == new_index) ? -1 : new_index;
16424474e37aSYuri Benditovich }
16434474e37aSYuri Benditovich 
16444474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf,
16454474e37aSYuri Benditovich                                       size_t size, bool no_rss)
16464474e37aSYuri Benditovich {
16474474e37aSYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
16486e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
164917a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
16506e790746SPaolo Bonzini     struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
16516e790746SPaolo Bonzini     struct virtio_net_hdr_mrg_rxbuf mhdr;
16526e790746SPaolo Bonzini     unsigned mhdr_cnt = 0;
16536e790746SPaolo Bonzini     size_t offset, i, guest_offset;
16546e790746SPaolo Bonzini 
16556e790746SPaolo Bonzini     if (!virtio_net_can_receive(nc)) {
16566e790746SPaolo Bonzini         return -1;
16576e790746SPaolo Bonzini     }
16586e790746SPaolo Bonzini 
16594474e37aSYuri Benditovich     if (!no_rss && n->rss_data.enabled) {
16604474e37aSYuri Benditovich         int index = virtio_net_process_rss(nc, buf, size);
16614474e37aSYuri Benditovich         if (index >= 0) {
16624474e37aSYuri Benditovich             NetClientState *nc2 = qemu_get_subqueue(n->nic, index);
16634474e37aSYuri Benditovich             return virtio_net_receive_rcu(nc2, buf, size, true);
16644474e37aSYuri Benditovich         }
16654474e37aSYuri Benditovich     }
16664474e37aSYuri Benditovich 
16676e790746SPaolo Bonzini     /* hdr_len refers to the header we supply to the guest */
16686e790746SPaolo Bonzini     if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
16696e790746SPaolo Bonzini         return 0;
16706e790746SPaolo Bonzini     }
16716e790746SPaolo Bonzini 
16726e790746SPaolo Bonzini     if (!receive_filter(n, buf, size))
16736e790746SPaolo Bonzini         return size;
16746e790746SPaolo Bonzini 
16756e790746SPaolo Bonzini     offset = i = 0;
16766e790746SPaolo Bonzini 
16776e790746SPaolo Bonzini     while (offset < size) {
167851b19ebeSPaolo Bonzini         VirtQueueElement *elem;
16796e790746SPaolo Bonzini         int len, total;
168051b19ebeSPaolo Bonzini         const struct iovec *sg;
16816e790746SPaolo Bonzini 
16826e790746SPaolo Bonzini         total = 0;
16836e790746SPaolo Bonzini 
168451b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement));
168551b19ebeSPaolo Bonzini         if (!elem) {
1686ba10b9c0SGreg Kurz             if (i) {
1687ba10b9c0SGreg Kurz                 virtio_error(vdev, "virtio-net unexpected empty queue: "
16886e790746SPaolo Bonzini                              "i %zd mergeable %d offset %zd, size %zd, "
1689019a3edbSGerd Hoffmann                              "guest hdr len %zd, host hdr len %zd "
1690019a3edbSGerd Hoffmann                              "guest features 0x%" PRIx64,
16916e790746SPaolo Bonzini                              i, n->mergeable_rx_bufs, offset, size,
1692019a3edbSGerd Hoffmann                              n->guest_hdr_len, n->host_hdr_len,
1693019a3edbSGerd Hoffmann                              vdev->guest_features);
1694ba10b9c0SGreg Kurz             }
1695ba10b9c0SGreg Kurz             return -1;
16966e790746SPaolo Bonzini         }
16976e790746SPaolo Bonzini 
169851b19ebeSPaolo Bonzini         if (elem->in_num < 1) {
1699ba10b9c0SGreg Kurz             virtio_error(vdev,
1700ba10b9c0SGreg Kurz                          "virtio-net receive queue contains no in buffers");
1701ba10b9c0SGreg Kurz             virtqueue_detach_element(q->rx_vq, elem, 0);
1702ba10b9c0SGreg Kurz             g_free(elem);
1703ba10b9c0SGreg Kurz             return -1;
17046e790746SPaolo Bonzini         }
17056e790746SPaolo Bonzini 
170651b19ebeSPaolo Bonzini         sg = elem->in_sg;
17076e790746SPaolo Bonzini         if (i == 0) {
17086e790746SPaolo Bonzini             assert(offset == 0);
17096e790746SPaolo Bonzini             if (n->mergeable_rx_bufs) {
17106e790746SPaolo Bonzini                 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
171151b19ebeSPaolo Bonzini                                     sg, elem->in_num,
17126e790746SPaolo Bonzini                                     offsetof(typeof(mhdr), num_buffers),
17136e790746SPaolo Bonzini                                     sizeof(mhdr.num_buffers));
17146e790746SPaolo Bonzini             }
17156e790746SPaolo Bonzini 
171651b19ebeSPaolo Bonzini             receive_header(n, sg, elem->in_num, buf, size);
1717e22f0603SYuri Benditovich             if (n->rss_data.populate_hash) {
1718e22f0603SYuri Benditovich                 offset = sizeof(mhdr);
1719e22f0603SYuri Benditovich                 iov_from_buf(sg, elem->in_num, offset,
1720e22f0603SYuri Benditovich                              buf + offset, n->host_hdr_len - sizeof(mhdr));
1721e22f0603SYuri Benditovich             }
17226e790746SPaolo Bonzini             offset = n->host_hdr_len;
17236e790746SPaolo Bonzini             total += n->guest_hdr_len;
17246e790746SPaolo Bonzini             guest_offset = n->guest_hdr_len;
17256e790746SPaolo Bonzini         } else {
17266e790746SPaolo Bonzini             guest_offset = 0;
17276e790746SPaolo Bonzini         }
17286e790746SPaolo Bonzini 
17296e790746SPaolo Bonzini         /* copy in packet.  ugh */
173051b19ebeSPaolo Bonzini         len = iov_from_buf(sg, elem->in_num, guest_offset,
17316e790746SPaolo Bonzini                            buf + offset, size - offset);
17326e790746SPaolo Bonzini         total += len;
17336e790746SPaolo Bonzini         offset += len;
17346e790746SPaolo Bonzini         /* If buffers can't be merged, at this point we
17356e790746SPaolo Bonzini          * must have consumed the complete packet.
17366e790746SPaolo Bonzini          * Otherwise, drop it. */
17376e790746SPaolo Bonzini         if (!n->mergeable_rx_bufs && offset < size) {
173827e57efeSLadi Prosek             virtqueue_unpop(q->rx_vq, elem, total);
173951b19ebeSPaolo Bonzini             g_free(elem);
17406e790746SPaolo Bonzini             return size;
17416e790746SPaolo Bonzini         }
17426e790746SPaolo Bonzini 
17436e790746SPaolo Bonzini         /* signal other side */
174451b19ebeSPaolo Bonzini         virtqueue_fill(q->rx_vq, elem, total, i++);
174551b19ebeSPaolo Bonzini         g_free(elem);
17466e790746SPaolo Bonzini     }
17476e790746SPaolo Bonzini 
17486e790746SPaolo Bonzini     if (mhdr_cnt) {
17491399c60dSRusty Russell         virtio_stw_p(vdev, &mhdr.num_buffers, i);
17506e790746SPaolo Bonzini         iov_from_buf(mhdr_sg, mhdr_cnt,
17516e790746SPaolo Bonzini                      0,
17526e790746SPaolo Bonzini                      &mhdr.num_buffers, sizeof mhdr.num_buffers);
17536e790746SPaolo Bonzini     }
17546e790746SPaolo Bonzini 
17556e790746SPaolo Bonzini     virtqueue_flush(q->rx_vq, i);
175617a0ca55SKONRAD Frederic     virtio_notify(vdev, q->rx_vq);
17576e790746SPaolo Bonzini 
17586e790746SPaolo Bonzini     return size;
17596e790746SPaolo Bonzini }
17606e790746SPaolo Bonzini 
17612974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf,
176297cd965cSPaolo Bonzini                                   size_t size)
176397cd965cSPaolo Bonzini {
1764068ddfa9SDr. David Alan Gilbert     RCU_READ_LOCK_GUARD();
176597cd965cSPaolo Bonzini 
17664474e37aSYuri Benditovich     return virtio_net_receive_rcu(nc, buf, size, false);
176797cd965cSPaolo Bonzini }
176897cd965cSPaolo Bonzini 
17692974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain,
17702974e916SYuri Benditovich                                          const uint8_t *buf,
17712974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
17722974e916SYuri Benditovich {
17732974e916SYuri Benditovich     uint16_t ip_hdrlen;
17742974e916SYuri Benditovich     struct ip_header *ip;
17752974e916SYuri Benditovich 
17762974e916SYuri Benditovich     ip = (struct ip_header *)(buf + chain->n->guest_hdr_len
17772974e916SYuri Benditovich                               + sizeof(struct eth_header));
17782974e916SYuri Benditovich     unit->ip = (void *)ip;
17792974e916SYuri Benditovich     ip_hdrlen = (ip->ip_ver_len & 0xF) << 2;
17802974e916SYuri Benditovich     unit->ip_plen = &ip->ip_len;
17812974e916SYuri Benditovich     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen);
17822974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
17832974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen;
17842974e916SYuri Benditovich }
17852974e916SYuri Benditovich 
17862974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain,
17872974e916SYuri Benditovich                                          const uint8_t *buf,
17882974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
17892974e916SYuri Benditovich {
17902974e916SYuri Benditovich     struct ip6_header *ip6;
17912974e916SYuri Benditovich 
17922974e916SYuri Benditovich     ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len
17932974e916SYuri Benditovich                                  + sizeof(struct eth_header));
17942974e916SYuri Benditovich     unit->ip = ip6;
17952974e916SYuri Benditovich     unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
179678ee6bd0SPhilippe Mathieu-Daudé     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip)
17972974e916SYuri Benditovich                                         + sizeof(struct ip6_header));
17982974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
17992974e916SYuri Benditovich 
18002974e916SYuri Benditovich     /* There is a difference between payload lenght in ipv4 and v6,
18012974e916SYuri Benditovich        ip header is excluded in ipv6 */
18022974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen;
18032974e916SYuri Benditovich }
18042974e916SYuri Benditovich 
18052974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain,
18062974e916SYuri Benditovich                                        VirtioNetRscSeg *seg)
18072974e916SYuri Benditovich {
18082974e916SYuri Benditovich     int ret;
1809dd3d85e8SYuri Benditovich     struct virtio_net_hdr_v1 *h;
18102974e916SYuri Benditovich 
1811dd3d85e8SYuri Benditovich     h = (struct virtio_net_hdr_v1 *)seg->buf;
18122974e916SYuri Benditovich     h->flags = 0;
18132974e916SYuri Benditovich     h->gso_type = VIRTIO_NET_HDR_GSO_NONE;
18142974e916SYuri Benditovich 
18152974e916SYuri Benditovich     if (seg->is_coalesced) {
1816dd3d85e8SYuri Benditovich         h->rsc.segments = seg->packets;
1817dd3d85e8SYuri Benditovich         h->rsc.dup_acks = seg->dup_ack;
18182974e916SYuri Benditovich         h->flags = VIRTIO_NET_HDR_F_RSC_INFO;
18192974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
18202974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
18212974e916SYuri Benditovich         } else {
18222974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
18232974e916SYuri Benditovich         }
18242974e916SYuri Benditovich     }
18252974e916SYuri Benditovich 
18262974e916SYuri Benditovich     ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size);
18272974e916SYuri Benditovich     QTAILQ_REMOVE(&chain->buffers, seg, next);
18282974e916SYuri Benditovich     g_free(seg->buf);
18292974e916SYuri Benditovich     g_free(seg);
18302974e916SYuri Benditovich 
18312974e916SYuri Benditovich     return ret;
18322974e916SYuri Benditovich }
18332974e916SYuri Benditovich 
18342974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq)
18352974e916SYuri Benditovich {
18362974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn;
18372974e916SYuri Benditovich     VirtioNetRscChain *chain = (VirtioNetRscChain *)opq;
18382974e916SYuri Benditovich 
18392974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) {
18402974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
18412974e916SYuri Benditovich             chain->stat.purge_failed++;
18422974e916SYuri Benditovich             continue;
18432974e916SYuri Benditovich         }
18442974e916SYuri Benditovich     }
18452974e916SYuri Benditovich 
18462974e916SYuri Benditovich     chain->stat.timer++;
18472974e916SYuri Benditovich     if (!QTAILQ_EMPTY(&chain->buffers)) {
18482974e916SYuri Benditovich         timer_mod(chain->drain_timer,
18492974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
18502974e916SYuri Benditovich     }
18512974e916SYuri Benditovich }
18522974e916SYuri Benditovich 
18532974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n)
18542974e916SYuri Benditovich {
18552974e916SYuri Benditovich     VirtioNetRscChain *chain, *rn_chain;
18562974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn_seg;
18572974e916SYuri Benditovich 
18582974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) {
18592974e916SYuri Benditovich         QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) {
18602974e916SYuri Benditovich             QTAILQ_REMOVE(&chain->buffers, seg, next);
18612974e916SYuri Benditovich             g_free(seg->buf);
18622974e916SYuri Benditovich             g_free(seg);
18632974e916SYuri Benditovich         }
18642974e916SYuri Benditovich 
18652974e916SYuri Benditovich         timer_free(chain->drain_timer);
18662974e916SYuri Benditovich         QTAILQ_REMOVE(&n->rsc_chains, chain, next);
18672974e916SYuri Benditovich         g_free(chain);
18682974e916SYuri Benditovich     }
18692974e916SYuri Benditovich }
18702974e916SYuri Benditovich 
18712974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain,
18722974e916SYuri Benditovich                                      NetClientState *nc,
18732974e916SYuri Benditovich                                      const uint8_t *buf, size_t size)
18742974e916SYuri Benditovich {
18752974e916SYuri Benditovich     uint16_t hdr_len;
18762974e916SYuri Benditovich     VirtioNetRscSeg *seg;
18772974e916SYuri Benditovich 
18782974e916SYuri Benditovich     hdr_len = chain->n->guest_hdr_len;
18792974e916SYuri Benditovich     seg = g_malloc(sizeof(VirtioNetRscSeg));
18802974e916SYuri Benditovich     seg->buf = g_malloc(hdr_len + sizeof(struct eth_header)
18812974e916SYuri Benditovich         + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD);
18822974e916SYuri Benditovich     memcpy(seg->buf, buf, size);
18832974e916SYuri Benditovich     seg->size = size;
18842974e916SYuri Benditovich     seg->packets = 1;
18852974e916SYuri Benditovich     seg->dup_ack = 0;
18862974e916SYuri Benditovich     seg->is_coalesced = 0;
18872974e916SYuri Benditovich     seg->nc = nc;
18882974e916SYuri Benditovich 
18892974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&chain->buffers, seg, next);
18902974e916SYuri Benditovich     chain->stat.cache++;
18912974e916SYuri Benditovich 
18922974e916SYuri Benditovich     switch (chain->proto) {
18932974e916SYuri Benditovich     case ETH_P_IP:
18942974e916SYuri Benditovich         virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit);
18952974e916SYuri Benditovich         break;
18962974e916SYuri Benditovich     case ETH_P_IPV6:
18972974e916SYuri Benditovich         virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit);
18982974e916SYuri Benditovich         break;
18992974e916SYuri Benditovich     default:
19002974e916SYuri Benditovich         g_assert_not_reached();
19012974e916SYuri Benditovich     }
19022974e916SYuri Benditovich }
19032974e916SYuri Benditovich 
19042974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain,
19052974e916SYuri Benditovich                                          VirtioNetRscSeg *seg,
19062974e916SYuri Benditovich                                          const uint8_t *buf,
19072974e916SYuri Benditovich                                          struct tcp_header *n_tcp,
19082974e916SYuri Benditovich                                          struct tcp_header *o_tcp)
19092974e916SYuri Benditovich {
19102974e916SYuri Benditovich     uint32_t nack, oack;
19112974e916SYuri Benditovich     uint16_t nwin, owin;
19122974e916SYuri Benditovich 
19132974e916SYuri Benditovich     nack = htonl(n_tcp->th_ack);
19142974e916SYuri Benditovich     nwin = htons(n_tcp->th_win);
19152974e916SYuri Benditovich     oack = htonl(o_tcp->th_ack);
19162974e916SYuri Benditovich     owin = htons(o_tcp->th_win);
19172974e916SYuri Benditovich 
19182974e916SYuri Benditovich     if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) {
19192974e916SYuri Benditovich         chain->stat.ack_out_of_win++;
19202974e916SYuri Benditovich         return RSC_FINAL;
19212974e916SYuri Benditovich     } else if (nack == oack) {
19222974e916SYuri Benditovich         /* duplicated ack or window probe */
19232974e916SYuri Benditovich         if (nwin == owin) {
19242974e916SYuri Benditovich             /* duplicated ack, add dup ack count due to whql test up to 1 */
19252974e916SYuri Benditovich             chain->stat.dup_ack++;
19262974e916SYuri Benditovich             return RSC_FINAL;
19272974e916SYuri Benditovich         } else {
19282974e916SYuri Benditovich             /* Coalesce window update */
19292974e916SYuri Benditovich             o_tcp->th_win = n_tcp->th_win;
19302974e916SYuri Benditovich             chain->stat.win_update++;
19312974e916SYuri Benditovich             return RSC_COALESCE;
19322974e916SYuri Benditovich         }
19332974e916SYuri Benditovich     } else {
19342974e916SYuri Benditovich         /* pure ack, go to 'C', finalize*/
19352974e916SYuri Benditovich         chain->stat.pure_ack++;
19362974e916SYuri Benditovich         return RSC_FINAL;
19372974e916SYuri Benditovich     }
19382974e916SYuri Benditovich }
19392974e916SYuri Benditovich 
19402974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain,
19412974e916SYuri Benditovich                                             VirtioNetRscSeg *seg,
19422974e916SYuri Benditovich                                             const uint8_t *buf,
19432974e916SYuri Benditovich                                             VirtioNetRscUnit *n_unit)
19442974e916SYuri Benditovich {
19452974e916SYuri Benditovich     void *data;
19462974e916SYuri Benditovich     uint16_t o_ip_len;
19472974e916SYuri Benditovich     uint32_t nseq, oseq;
19482974e916SYuri Benditovich     VirtioNetRscUnit *o_unit;
19492974e916SYuri Benditovich 
19502974e916SYuri Benditovich     o_unit = &seg->unit;
19512974e916SYuri Benditovich     o_ip_len = htons(*o_unit->ip_plen);
19522974e916SYuri Benditovich     nseq = htonl(n_unit->tcp->th_seq);
19532974e916SYuri Benditovich     oseq = htonl(o_unit->tcp->th_seq);
19542974e916SYuri Benditovich 
19552974e916SYuri Benditovich     /* out of order or retransmitted. */
19562974e916SYuri Benditovich     if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) {
19572974e916SYuri Benditovich         chain->stat.data_out_of_win++;
19582974e916SYuri Benditovich         return RSC_FINAL;
19592974e916SYuri Benditovich     }
19602974e916SYuri Benditovich 
19612974e916SYuri Benditovich     data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen;
19622974e916SYuri Benditovich     if (nseq == oseq) {
19632974e916SYuri Benditovich         if ((o_unit->payload == 0) && n_unit->payload) {
19642974e916SYuri Benditovich             /* From no payload to payload, normal case, not a dup ack or etc */
19652974e916SYuri Benditovich             chain->stat.data_after_pure_ack++;
19662974e916SYuri Benditovich             goto coalesce;
19672974e916SYuri Benditovich         } else {
19682974e916SYuri Benditovich             return virtio_net_rsc_handle_ack(chain, seg, buf,
19692974e916SYuri Benditovich                                              n_unit->tcp, o_unit->tcp);
19702974e916SYuri Benditovich         }
19712974e916SYuri Benditovich     } else if ((nseq - oseq) != o_unit->payload) {
19722974e916SYuri Benditovich         /* Not a consistent packet, out of order */
19732974e916SYuri Benditovich         chain->stat.data_out_of_order++;
19742974e916SYuri Benditovich         return RSC_FINAL;
19752974e916SYuri Benditovich     } else {
19762974e916SYuri Benditovich coalesce:
19772974e916SYuri Benditovich         if ((o_ip_len + n_unit->payload) > chain->max_payload) {
19782974e916SYuri Benditovich             chain->stat.over_size++;
19792974e916SYuri Benditovich             return RSC_FINAL;
19802974e916SYuri Benditovich         }
19812974e916SYuri Benditovich 
19822974e916SYuri Benditovich         /* Here comes the right data, the payload length in v4/v6 is different,
19832974e916SYuri Benditovich            so use the field value to update and record the new data len */
19842974e916SYuri Benditovich         o_unit->payload += n_unit->payload; /* update new data len */
19852974e916SYuri Benditovich 
19862974e916SYuri Benditovich         /* update field in ip header */
19872974e916SYuri Benditovich         *o_unit->ip_plen = htons(o_ip_len + n_unit->payload);
19882974e916SYuri Benditovich 
19892974e916SYuri Benditovich         /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced
19902974e916SYuri Benditovich            for windows guest, while this may change the behavior for linux
19912974e916SYuri Benditovich            guest (only if it uses RSC feature). */
19922974e916SYuri Benditovich         o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags;
19932974e916SYuri Benditovich 
19942974e916SYuri Benditovich         o_unit->tcp->th_ack = n_unit->tcp->th_ack;
19952974e916SYuri Benditovich         o_unit->tcp->th_win = n_unit->tcp->th_win;
19962974e916SYuri Benditovich 
19972974e916SYuri Benditovich         memmove(seg->buf + seg->size, data, n_unit->payload);
19982974e916SYuri Benditovich         seg->size += n_unit->payload;
19992974e916SYuri Benditovich         seg->packets++;
20002974e916SYuri Benditovich         chain->stat.coalesced++;
20012974e916SYuri Benditovich         return RSC_COALESCE;
20022974e916SYuri Benditovich     }
20032974e916SYuri Benditovich }
20042974e916SYuri Benditovich 
20052974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain,
20062974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
20072974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
20082974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
20092974e916SYuri Benditovich {
20102974e916SYuri Benditovich     struct ip_header *ip1, *ip2;
20112974e916SYuri Benditovich 
20122974e916SYuri Benditovich     ip1 = (struct ip_header *)(unit->ip);
20132974e916SYuri Benditovich     ip2 = (struct ip_header *)(seg->unit.ip);
20142974e916SYuri Benditovich     if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst)
20152974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
20162974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
20172974e916SYuri Benditovich         chain->stat.no_match++;
20182974e916SYuri Benditovich         return RSC_NO_MATCH;
20192974e916SYuri Benditovich     }
20202974e916SYuri Benditovich 
20212974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
20222974e916SYuri Benditovich }
20232974e916SYuri Benditovich 
20242974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain,
20252974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
20262974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
20272974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
20282974e916SYuri Benditovich {
20292974e916SYuri Benditovich     struct ip6_header *ip1, *ip2;
20302974e916SYuri Benditovich 
20312974e916SYuri Benditovich     ip1 = (struct ip6_header *)(unit->ip);
20322974e916SYuri Benditovich     ip2 = (struct ip6_header *)(seg->unit.ip);
20332974e916SYuri Benditovich     if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address))
20342974e916SYuri Benditovich         || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address))
20352974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
20362974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
20372974e916SYuri Benditovich             chain->stat.no_match++;
20382974e916SYuri Benditovich             return RSC_NO_MATCH;
20392974e916SYuri Benditovich     }
20402974e916SYuri Benditovich 
20412974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
20422974e916SYuri Benditovich }
20432974e916SYuri Benditovich 
20442974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain
20452974e916SYuri Benditovich  * to prevent out of order */
20462974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain,
20472974e916SYuri Benditovich                                          struct tcp_header *tcp)
20482974e916SYuri Benditovich {
20492974e916SYuri Benditovich     uint16_t tcp_hdr;
20502974e916SYuri Benditovich     uint16_t tcp_flag;
20512974e916SYuri Benditovich 
20522974e916SYuri Benditovich     tcp_flag = htons(tcp->th_offset_flags);
20532974e916SYuri Benditovich     tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10;
20542974e916SYuri Benditovich     tcp_flag &= VIRTIO_NET_TCP_FLAG;
20552974e916SYuri Benditovich     if (tcp_flag & TH_SYN) {
20562974e916SYuri Benditovich         chain->stat.tcp_syn++;
20572974e916SYuri Benditovich         return RSC_BYPASS;
20582974e916SYuri Benditovich     }
20592974e916SYuri Benditovich 
20602974e916SYuri Benditovich     if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) {
20612974e916SYuri Benditovich         chain->stat.tcp_ctrl_drain++;
20622974e916SYuri Benditovich         return RSC_FINAL;
20632974e916SYuri Benditovich     }
20642974e916SYuri Benditovich 
20652974e916SYuri Benditovich     if (tcp_hdr > sizeof(struct tcp_header)) {
20662974e916SYuri Benditovich         chain->stat.tcp_all_opt++;
20672974e916SYuri Benditovich         return RSC_FINAL;
20682974e916SYuri Benditovich     }
20692974e916SYuri Benditovich 
20702974e916SYuri Benditovich     return RSC_CANDIDATE;
20712974e916SYuri Benditovich }
20722974e916SYuri Benditovich 
20732974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain,
20742974e916SYuri Benditovich                                          NetClientState *nc,
20752974e916SYuri Benditovich                                          const uint8_t *buf, size_t size,
20762974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
20772974e916SYuri Benditovich {
20782974e916SYuri Benditovich     int ret;
20792974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
20802974e916SYuri Benditovich 
20812974e916SYuri Benditovich     if (QTAILQ_EMPTY(&chain->buffers)) {
20822974e916SYuri Benditovich         chain->stat.empty_cache++;
20832974e916SYuri Benditovich         virtio_net_rsc_cache_buf(chain, nc, buf, size);
20842974e916SYuri Benditovich         timer_mod(chain->drain_timer,
20852974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
20862974e916SYuri Benditovich         return size;
20872974e916SYuri Benditovich     }
20882974e916SYuri Benditovich 
20892974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
20902974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
20912974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit);
20922974e916SYuri Benditovich         } else {
20932974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit);
20942974e916SYuri Benditovich         }
20952974e916SYuri Benditovich 
20962974e916SYuri Benditovich         if (ret == RSC_FINAL) {
20972974e916SYuri Benditovich             if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
20982974e916SYuri Benditovich                 /* Send failed */
20992974e916SYuri Benditovich                 chain->stat.final_failed++;
21002974e916SYuri Benditovich                 return 0;
21012974e916SYuri Benditovich             }
21022974e916SYuri Benditovich 
21032974e916SYuri Benditovich             /* Send current packet */
21042974e916SYuri Benditovich             return virtio_net_do_receive(nc, buf, size);
21052974e916SYuri Benditovich         } else if (ret == RSC_NO_MATCH) {
21062974e916SYuri Benditovich             continue;
21072974e916SYuri Benditovich         } else {
21082974e916SYuri Benditovich             /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */
21092974e916SYuri Benditovich             seg->is_coalesced = 1;
21102974e916SYuri Benditovich             return size;
21112974e916SYuri Benditovich         }
21122974e916SYuri Benditovich     }
21132974e916SYuri Benditovich 
21142974e916SYuri Benditovich     chain->stat.no_match_cache++;
21152974e916SYuri Benditovich     virtio_net_rsc_cache_buf(chain, nc, buf, size);
21162974e916SYuri Benditovich     return size;
21172974e916SYuri Benditovich }
21182974e916SYuri Benditovich 
21192974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */
21202974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain,
21212974e916SYuri Benditovich                                         NetClientState *nc,
21222974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
21232974e916SYuri Benditovich                                         uint16_t ip_start, uint16_t ip_size,
21242974e916SYuri Benditovich                                         uint16_t tcp_port)
21252974e916SYuri Benditovich {
21262974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
21272974e916SYuri Benditovich     uint32_t ppair1, ppair2;
21282974e916SYuri Benditovich 
21292974e916SYuri Benditovich     ppair1 = *(uint32_t *)(buf + tcp_port);
21302974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
21312974e916SYuri Benditovich         ppair2 = *(uint32_t *)(seg->buf + tcp_port);
21322974e916SYuri Benditovich         if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size)
21332974e916SYuri Benditovich             || (ppair1 != ppair2)) {
21342974e916SYuri Benditovich             continue;
21352974e916SYuri Benditovich         }
21362974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
21372974e916SYuri Benditovich             chain->stat.drain_failed++;
21382974e916SYuri Benditovich         }
21392974e916SYuri Benditovich 
21402974e916SYuri Benditovich         break;
21412974e916SYuri Benditovich     }
21422974e916SYuri Benditovich 
21432974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
21442974e916SYuri Benditovich }
21452974e916SYuri Benditovich 
21462974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain,
21472974e916SYuri Benditovich                                             struct ip_header *ip,
21482974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
21492974e916SYuri Benditovich {
21502974e916SYuri Benditovich     uint16_t ip_len;
21512974e916SYuri Benditovich 
21522974e916SYuri Benditovich     /* Not an ipv4 packet */
21532974e916SYuri Benditovich     if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) {
21542974e916SYuri Benditovich         chain->stat.ip_option++;
21552974e916SYuri Benditovich         return RSC_BYPASS;
21562974e916SYuri Benditovich     }
21572974e916SYuri Benditovich 
21582974e916SYuri Benditovich     /* Don't handle packets with ip option */
21592974e916SYuri Benditovich     if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) {
21602974e916SYuri Benditovich         chain->stat.ip_option++;
21612974e916SYuri Benditovich         return RSC_BYPASS;
21622974e916SYuri Benditovich     }
21632974e916SYuri Benditovich 
21642974e916SYuri Benditovich     if (ip->ip_p != IPPROTO_TCP) {
21652974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
21662974e916SYuri Benditovich         return RSC_BYPASS;
21672974e916SYuri Benditovich     }
21682974e916SYuri Benditovich 
21692974e916SYuri Benditovich     /* Don't handle packets with ip fragment */
21702974e916SYuri Benditovich     if (!(htons(ip->ip_off) & IP_DF)) {
21712974e916SYuri Benditovich         chain->stat.ip_frag++;
21722974e916SYuri Benditovich         return RSC_BYPASS;
21732974e916SYuri Benditovich     }
21742974e916SYuri Benditovich 
21752974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
21762974e916SYuri Benditovich     if (IPTOS_ECN(ip->ip_tos)) {
21772974e916SYuri Benditovich         chain->stat.ip_ecn++;
21782974e916SYuri Benditovich         return RSC_BYPASS;
21792974e916SYuri Benditovich     }
21802974e916SYuri Benditovich 
21812974e916SYuri Benditovich     ip_len = htons(ip->ip_len);
21822974e916SYuri Benditovich     if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header))
21832974e916SYuri Benditovich         || ip_len > (size - chain->n->guest_hdr_len -
21842974e916SYuri Benditovich                      sizeof(struct eth_header))) {
21852974e916SYuri Benditovich         chain->stat.ip_hacked++;
21862974e916SYuri Benditovich         return RSC_BYPASS;
21872974e916SYuri Benditovich     }
21882974e916SYuri Benditovich 
21892974e916SYuri Benditovich     return RSC_CANDIDATE;
21902974e916SYuri Benditovich }
21912974e916SYuri Benditovich 
21922974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain,
21932974e916SYuri Benditovich                                       NetClientState *nc,
21942974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
21952974e916SYuri Benditovich {
21962974e916SYuri Benditovich     int32_t ret;
21972974e916SYuri Benditovich     uint16_t hdr_len;
21982974e916SYuri Benditovich     VirtioNetRscUnit unit;
21992974e916SYuri Benditovich 
22002974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
22012974e916SYuri Benditovich 
22022974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)
22032974e916SYuri Benditovich         + sizeof(struct tcp_header))) {
22042974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
22052974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22062974e916SYuri Benditovich     }
22072974e916SYuri Benditovich 
22082974e916SYuri Benditovich     virtio_net_rsc_extract_unit4(chain, buf, &unit);
22092974e916SYuri Benditovich     if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size)
22102974e916SYuri Benditovich         != RSC_CANDIDATE) {
22112974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22122974e916SYuri Benditovich     }
22132974e916SYuri Benditovich 
22142974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
22152974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
22162974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22172974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
22182974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
22192974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 12),
22202974e916SYuri Benditovich                 VIRTIO_NET_IP4_ADDR_SIZE,
22212974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header));
22222974e916SYuri Benditovich     }
22232974e916SYuri Benditovich 
22242974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
22252974e916SYuri Benditovich }
22262974e916SYuri Benditovich 
22272974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain,
22282974e916SYuri Benditovich                                             struct ip6_header *ip6,
22292974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
22302974e916SYuri Benditovich {
22312974e916SYuri Benditovich     uint16_t ip_len;
22322974e916SYuri Benditovich 
22332974e916SYuri Benditovich     if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4)
22342974e916SYuri Benditovich         != IP_HEADER_VERSION_6) {
22352974e916SYuri Benditovich         return RSC_BYPASS;
22362974e916SYuri Benditovich     }
22372974e916SYuri Benditovich 
22382974e916SYuri Benditovich     /* Both option and protocol is checked in this */
22392974e916SYuri Benditovich     if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) {
22402974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
22412974e916SYuri Benditovich         return RSC_BYPASS;
22422974e916SYuri Benditovich     }
22432974e916SYuri Benditovich 
22442974e916SYuri Benditovich     ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
22452974e916SYuri Benditovich     if (ip_len < sizeof(struct tcp_header) ||
22462974e916SYuri Benditovich         ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header)
22472974e916SYuri Benditovich                   - sizeof(struct ip6_header))) {
22482974e916SYuri Benditovich         chain->stat.ip_hacked++;
22492974e916SYuri Benditovich         return RSC_BYPASS;
22502974e916SYuri Benditovich     }
22512974e916SYuri Benditovich 
22522974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
22532974e916SYuri Benditovich     if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) {
22542974e916SYuri Benditovich         chain->stat.ip_ecn++;
22552974e916SYuri Benditovich         return RSC_BYPASS;
22562974e916SYuri Benditovich     }
22572974e916SYuri Benditovich 
22582974e916SYuri Benditovich     return RSC_CANDIDATE;
22592974e916SYuri Benditovich }
22602974e916SYuri Benditovich 
22612974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc,
22622974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
22632974e916SYuri Benditovich {
22642974e916SYuri Benditovich     int32_t ret;
22652974e916SYuri Benditovich     uint16_t hdr_len;
22662974e916SYuri Benditovich     VirtioNetRscChain *chain;
22672974e916SYuri Benditovich     VirtioNetRscUnit unit;
22682974e916SYuri Benditovich 
22692974e916SYuri Benditovich     chain = (VirtioNetRscChain *)opq;
22702974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
22712974e916SYuri Benditovich 
22722974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header)
22732974e916SYuri Benditovich         + sizeof(tcp_header))) {
22742974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22752974e916SYuri Benditovich     }
22762974e916SYuri Benditovich 
22772974e916SYuri Benditovich     virtio_net_rsc_extract_unit6(chain, buf, &unit);
22782974e916SYuri Benditovich     if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain,
22792974e916SYuri Benditovich                                                  unit.ip, buf, size)) {
22802974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22812974e916SYuri Benditovich     }
22822974e916SYuri Benditovich 
22832974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
22842974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
22852974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22862974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
22872974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
22882974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 8),
22892974e916SYuri Benditovich                 VIRTIO_NET_IP6_ADDR_SIZE,
22902974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header)
22912974e916SYuri Benditovich                 + sizeof(struct ip6_header));
22922974e916SYuri Benditovich     }
22932974e916SYuri Benditovich 
22942974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
22952974e916SYuri Benditovich }
22962974e916SYuri Benditovich 
22972974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n,
22982974e916SYuri Benditovich                                                       NetClientState *nc,
22992974e916SYuri Benditovich                                                       uint16_t proto)
23002974e916SYuri Benditovich {
23012974e916SYuri Benditovich     VirtioNetRscChain *chain;
23022974e916SYuri Benditovich 
23032974e916SYuri Benditovich     if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) {
23042974e916SYuri Benditovich         return NULL;
23052974e916SYuri Benditovich     }
23062974e916SYuri Benditovich 
23072974e916SYuri Benditovich     QTAILQ_FOREACH(chain, &n->rsc_chains, next) {
23082974e916SYuri Benditovich         if (chain->proto == proto) {
23092974e916SYuri Benditovich             return chain;
23102974e916SYuri Benditovich         }
23112974e916SYuri Benditovich     }
23122974e916SYuri Benditovich 
23132974e916SYuri Benditovich     chain = g_malloc(sizeof(*chain));
23142974e916SYuri Benditovich     chain->n = n;
23152974e916SYuri Benditovich     chain->proto = proto;
23162974e916SYuri Benditovich     if (proto == (uint16_t)ETH_P_IP) {
23172974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD;
23182974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
23192974e916SYuri Benditovich     } else {
23202974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD;
23212974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
23222974e916SYuri Benditovich     }
23232974e916SYuri Benditovich     chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST,
23242974e916SYuri Benditovich                                       virtio_net_rsc_purge, chain);
23252974e916SYuri Benditovich     memset(&chain->stat, 0, sizeof(chain->stat));
23262974e916SYuri Benditovich 
23272974e916SYuri Benditovich     QTAILQ_INIT(&chain->buffers);
23282974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next);
23292974e916SYuri Benditovich 
23302974e916SYuri Benditovich     return chain;
23312974e916SYuri Benditovich }
23322974e916SYuri Benditovich 
23332974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc,
23342974e916SYuri Benditovich                                       const uint8_t *buf,
23352974e916SYuri Benditovich                                       size_t size)
23362974e916SYuri Benditovich {
23372974e916SYuri Benditovich     uint16_t proto;
23382974e916SYuri Benditovich     VirtioNetRscChain *chain;
23392974e916SYuri Benditovich     struct eth_header *eth;
23402974e916SYuri Benditovich     VirtIONet *n;
23412974e916SYuri Benditovich 
23422974e916SYuri Benditovich     n = qemu_get_nic_opaque(nc);
23432974e916SYuri Benditovich     if (size < (n->host_hdr_len + sizeof(struct eth_header))) {
23442974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23452974e916SYuri Benditovich     }
23462974e916SYuri Benditovich 
23472974e916SYuri Benditovich     eth = (struct eth_header *)(buf + n->guest_hdr_len);
23482974e916SYuri Benditovich     proto = htons(eth->h_proto);
23492974e916SYuri Benditovich 
23502974e916SYuri Benditovich     chain = virtio_net_rsc_lookup_chain(n, nc, proto);
23512974e916SYuri Benditovich     if (chain) {
23522974e916SYuri Benditovich         chain->stat.received++;
23532974e916SYuri Benditovich         if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) {
23542974e916SYuri Benditovich             return virtio_net_rsc_receive4(chain, nc, buf, size);
23552974e916SYuri Benditovich         } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) {
23562974e916SYuri Benditovich             return virtio_net_rsc_receive6(chain, nc, buf, size);
23572974e916SYuri Benditovich         }
23582974e916SYuri Benditovich     }
23592974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
23602974e916SYuri Benditovich }
23612974e916SYuri Benditovich 
23622974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf,
23632974e916SYuri Benditovich                                   size_t size)
23642974e916SYuri Benditovich {
23652974e916SYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
23662974e916SYuri Benditovich     if ((n->rsc4_enabled || n->rsc6_enabled)) {
23672974e916SYuri Benditovich         return virtio_net_rsc_receive(nc, buf, size);
23682974e916SYuri Benditovich     } else {
23692974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23702974e916SYuri Benditovich     }
23712974e916SYuri Benditovich }
23722974e916SYuri Benditovich 
23736e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
23746e790746SPaolo Bonzini 
23756e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
23766e790746SPaolo Bonzini {
23776e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
23786e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
237917a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
23806e790746SPaolo Bonzini 
238151b19ebeSPaolo Bonzini     virtqueue_push(q->tx_vq, q->async_tx.elem, 0);
238217a0ca55SKONRAD Frederic     virtio_notify(vdev, q->tx_vq);
23836e790746SPaolo Bonzini 
238451b19ebeSPaolo Bonzini     g_free(q->async_tx.elem);
238551b19ebeSPaolo Bonzini     q->async_tx.elem = NULL;
23866e790746SPaolo Bonzini 
23876e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
23886e790746SPaolo Bonzini     virtio_net_flush_tx(q);
23896e790746SPaolo Bonzini }
23906e790746SPaolo Bonzini 
23916e790746SPaolo Bonzini /* TX */
23926e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
23936e790746SPaolo Bonzini {
23946e790746SPaolo Bonzini     VirtIONet *n = q->n;
239517a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
239651b19ebeSPaolo Bonzini     VirtQueueElement *elem;
23976e790746SPaolo Bonzini     int32_t num_packets = 0;
23986e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
239917a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
24006e790746SPaolo Bonzini         return num_packets;
24016e790746SPaolo Bonzini     }
24026e790746SPaolo Bonzini 
240351b19ebeSPaolo Bonzini     if (q->async_tx.elem) {
24046e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
24056e790746SPaolo Bonzini         return num_packets;
24066e790746SPaolo Bonzini     }
24076e790746SPaolo Bonzini 
240851b19ebeSPaolo Bonzini     for (;;) {
2409bd89dd98SJason Wang         ssize_t ret;
241051b19ebeSPaolo Bonzini         unsigned int out_num;
241151b19ebeSPaolo Bonzini         struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg;
2412feb93f36SJason Wang         struct virtio_net_hdr_mrg_rxbuf mhdr;
24136e790746SPaolo Bonzini 
241451b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement));
241551b19ebeSPaolo Bonzini         if (!elem) {
241651b19ebeSPaolo Bonzini             break;
241751b19ebeSPaolo Bonzini         }
241851b19ebeSPaolo Bonzini 
241951b19ebeSPaolo Bonzini         out_num = elem->out_num;
242051b19ebeSPaolo Bonzini         out_sg = elem->out_sg;
24216e790746SPaolo Bonzini         if (out_num < 1) {
2422fa5e56c2SGreg Kurz             virtio_error(vdev, "virtio-net header not in first element");
2423fa5e56c2SGreg Kurz             virtqueue_detach_element(q->tx_vq, elem, 0);
2424fa5e56c2SGreg Kurz             g_free(elem);
2425fa5e56c2SGreg Kurz             return -EINVAL;
24266e790746SPaolo Bonzini         }
24276e790746SPaolo Bonzini 
2428032a74a1SCédric Le Goater         if (n->has_vnet_hdr) {
2429feb93f36SJason Wang             if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) <
2430feb93f36SJason Wang                 n->guest_hdr_len) {
2431fa5e56c2SGreg Kurz                 virtio_error(vdev, "virtio-net header incorrect");
2432fa5e56c2SGreg Kurz                 virtqueue_detach_element(q->tx_vq, elem, 0);
2433fa5e56c2SGreg Kurz                 g_free(elem);
2434fa5e56c2SGreg Kurz                 return -EINVAL;
2435032a74a1SCédric Le Goater             }
24361bfa316cSGreg Kurz             if (n->needs_vnet_hdr_swap) {
2437feb93f36SJason Wang                 virtio_net_hdr_swap(vdev, (void *) &mhdr);
2438feb93f36SJason Wang                 sg2[0].iov_base = &mhdr;
2439feb93f36SJason Wang                 sg2[0].iov_len = n->guest_hdr_len;
2440feb93f36SJason Wang                 out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1,
2441feb93f36SJason Wang                                    out_sg, out_num,
2442feb93f36SJason Wang                                    n->guest_hdr_len, -1);
2443feb93f36SJason Wang                 if (out_num == VIRTQUEUE_MAX_SIZE) {
2444feb93f36SJason Wang                     goto drop;
2445032a74a1SCédric Le Goater                 }
2446feb93f36SJason Wang                 out_num += 1;
2447feb93f36SJason Wang                 out_sg = sg2;
2448feb93f36SJason Wang             }
2449feb93f36SJason Wang         }
24506e790746SPaolo Bonzini         /*
24516e790746SPaolo Bonzini          * If host wants to see the guest header as is, we can
24526e790746SPaolo Bonzini          * pass it on unchanged. Otherwise, copy just the parts
24536e790746SPaolo Bonzini          * that host is interested in.
24546e790746SPaolo Bonzini          */
24556e790746SPaolo Bonzini         assert(n->host_hdr_len <= n->guest_hdr_len);
24566e790746SPaolo Bonzini         if (n->host_hdr_len != n->guest_hdr_len) {
24576e790746SPaolo Bonzini             unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
24586e790746SPaolo Bonzini                                        out_sg, out_num,
24596e790746SPaolo Bonzini                                        0, n->host_hdr_len);
24606e790746SPaolo Bonzini             sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
24616e790746SPaolo Bonzini                              out_sg, out_num,
24626e790746SPaolo Bonzini                              n->guest_hdr_len, -1);
24636e790746SPaolo Bonzini             out_num = sg_num;
24646e790746SPaolo Bonzini             out_sg = sg;
24656e790746SPaolo Bonzini         }
24666e790746SPaolo Bonzini 
24676e790746SPaolo Bonzini         ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
24686e790746SPaolo Bonzini                                       out_sg, out_num, virtio_net_tx_complete);
24696e790746SPaolo Bonzini         if (ret == 0) {
24706e790746SPaolo Bonzini             virtio_queue_set_notification(q->tx_vq, 0);
24716e790746SPaolo Bonzini             q->async_tx.elem = elem;
24726e790746SPaolo Bonzini             return -EBUSY;
24736e790746SPaolo Bonzini         }
24746e790746SPaolo Bonzini 
2475feb93f36SJason Wang drop:
247651b19ebeSPaolo Bonzini         virtqueue_push(q->tx_vq, elem, 0);
247717a0ca55SKONRAD Frederic         virtio_notify(vdev, q->tx_vq);
247851b19ebeSPaolo Bonzini         g_free(elem);
24796e790746SPaolo Bonzini 
24806e790746SPaolo Bonzini         if (++num_packets >= n->tx_burst) {
24816e790746SPaolo Bonzini             break;
24826e790746SPaolo Bonzini         }
24836e790746SPaolo Bonzini     }
24846e790746SPaolo Bonzini     return num_packets;
24856e790746SPaolo Bonzini }
24866e790746SPaolo Bonzini 
24876e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
24886e790746SPaolo Bonzini {
248917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
24906e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
24916e790746SPaolo Bonzini 
2492283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2493283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2494283e2c2aSYuri Benditovich         return;
2495283e2c2aSYuri Benditovich     }
2496283e2c2aSYuri Benditovich 
24976e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
249817a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
24996e790746SPaolo Bonzini         q->tx_waiting = 1;
25006e790746SPaolo Bonzini         return;
25016e790746SPaolo Bonzini     }
25026e790746SPaolo Bonzini 
25036e790746SPaolo Bonzini     if (q->tx_waiting) {
25046e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 1);
2505bc72ad67SAlex Bligh         timer_del(q->tx_timer);
25066e790746SPaolo Bonzini         q->tx_waiting = 0;
2507fa5e56c2SGreg Kurz         if (virtio_net_flush_tx(q) == -EINVAL) {
2508fa5e56c2SGreg Kurz             return;
2509fa5e56c2SGreg Kurz         }
25106e790746SPaolo Bonzini     } else {
2511bc72ad67SAlex Bligh         timer_mod(q->tx_timer,
2512bc72ad67SAlex Bligh                        qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
25136e790746SPaolo Bonzini         q->tx_waiting = 1;
25146e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 0);
25156e790746SPaolo Bonzini     }
25166e790746SPaolo Bonzini }
25176e790746SPaolo Bonzini 
25186e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
25196e790746SPaolo Bonzini {
252017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
25216e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
25226e790746SPaolo Bonzini 
2523283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2524283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2525283e2c2aSYuri Benditovich         return;
2526283e2c2aSYuri Benditovich     }
2527283e2c2aSYuri Benditovich 
25286e790746SPaolo Bonzini     if (unlikely(q->tx_waiting)) {
25296e790746SPaolo Bonzini         return;
25306e790746SPaolo Bonzini     }
25316e790746SPaolo Bonzini     q->tx_waiting = 1;
25326e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
253317a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
25346e790746SPaolo Bonzini         return;
25356e790746SPaolo Bonzini     }
25366e790746SPaolo Bonzini     virtio_queue_set_notification(vq, 0);
25376e790746SPaolo Bonzini     qemu_bh_schedule(q->tx_bh);
25386e790746SPaolo Bonzini }
25396e790746SPaolo Bonzini 
25406e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque)
25416e790746SPaolo Bonzini {
25426e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
25436e790746SPaolo Bonzini     VirtIONet *n = q->n;
254417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2545e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2546e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2547e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2548e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2549e8bcf842SMichael S. Tsirkin         return;
2550e8bcf842SMichael S. Tsirkin     }
25516e790746SPaolo Bonzini 
25526e790746SPaolo Bonzini     q->tx_waiting = 0;
25536e790746SPaolo Bonzini 
25546e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
255517a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
25566e790746SPaolo Bonzini         return;
255717a0ca55SKONRAD Frederic     }
25586e790746SPaolo Bonzini 
25596e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
25606e790746SPaolo Bonzini     virtio_net_flush_tx(q);
25616e790746SPaolo Bonzini }
25626e790746SPaolo Bonzini 
25636e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque)
25646e790746SPaolo Bonzini {
25656e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
25666e790746SPaolo Bonzini     VirtIONet *n = q->n;
256717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
25686e790746SPaolo Bonzini     int32_t ret;
25696e790746SPaolo Bonzini 
2570e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2571e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2572e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2573e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2574e8bcf842SMichael S. Tsirkin         return;
2575e8bcf842SMichael S. Tsirkin     }
25766e790746SPaolo Bonzini 
25776e790746SPaolo Bonzini     q->tx_waiting = 0;
25786e790746SPaolo Bonzini 
25796e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
258017a0ca55SKONRAD Frederic     if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
25816e790746SPaolo Bonzini         return;
258217a0ca55SKONRAD Frederic     }
25836e790746SPaolo Bonzini 
25846e790746SPaolo Bonzini     ret = virtio_net_flush_tx(q);
2585fa5e56c2SGreg Kurz     if (ret == -EBUSY || ret == -EINVAL) {
2586fa5e56c2SGreg Kurz         return; /* Notification re-enable handled by tx_complete or device
2587fa5e56c2SGreg Kurz                  * broken */
25886e790746SPaolo Bonzini     }
25896e790746SPaolo Bonzini 
25906e790746SPaolo Bonzini     /* If we flush a full burst of packets, assume there are
25916e790746SPaolo Bonzini      * more coming and immediately reschedule */
25926e790746SPaolo Bonzini     if (ret >= n->tx_burst) {
25936e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
25946e790746SPaolo Bonzini         q->tx_waiting = 1;
25956e790746SPaolo Bonzini         return;
25966e790746SPaolo Bonzini     }
25976e790746SPaolo Bonzini 
25986e790746SPaolo Bonzini     /* If less than a full burst, re-enable notification and flush
25996e790746SPaolo Bonzini      * anything that may have come in while we weren't looking.  If
26006e790746SPaolo Bonzini      * we find something, assume the guest is still active and reschedule */
26016e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2602fa5e56c2SGreg Kurz     ret = virtio_net_flush_tx(q);
2603fa5e56c2SGreg Kurz     if (ret == -EINVAL) {
2604fa5e56c2SGreg Kurz         return;
2605fa5e56c2SGreg Kurz     } else if (ret > 0) {
26066e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
26076e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
26086e790746SPaolo Bonzini         q->tx_waiting = 1;
26096e790746SPaolo Bonzini     }
26106e790746SPaolo Bonzini }
26116e790746SPaolo Bonzini 
2612f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index)
2613f9d6dbf0SWen Congyang {
2614f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2615f9d6dbf0SWen Congyang 
26161c0fbfa3SMichael S. Tsirkin     n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size,
26171c0fbfa3SMichael S. Tsirkin                                            virtio_net_handle_rx);
26189b02e161SWei Wang 
2619f9d6dbf0SWen Congyang     if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
2620f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
26219b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
26229b02e161SWei Wang                              virtio_net_handle_tx_timer);
2623f9d6dbf0SWen Congyang         n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
2624f9d6dbf0SWen Congyang                                               virtio_net_tx_timer,
2625f9d6dbf0SWen Congyang                                               &n->vqs[index]);
2626f9d6dbf0SWen Congyang     } else {
2627f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
26289b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
26299b02e161SWei Wang                              virtio_net_handle_tx_bh);
2630f9d6dbf0SWen Congyang         n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]);
2631f9d6dbf0SWen Congyang     }
2632f9d6dbf0SWen Congyang 
2633f9d6dbf0SWen Congyang     n->vqs[index].tx_waiting = 0;
2634f9d6dbf0SWen Congyang     n->vqs[index].n = n;
2635f9d6dbf0SWen Congyang }
2636f9d6dbf0SWen Congyang 
2637f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index)
2638f9d6dbf0SWen Congyang {
2639f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2640f9d6dbf0SWen Congyang     VirtIONetQueue *q = &n->vqs[index];
2641f9d6dbf0SWen Congyang     NetClientState *nc = qemu_get_subqueue(n->nic, index);
2642f9d6dbf0SWen Congyang 
2643f9d6dbf0SWen Congyang     qemu_purge_queued_packets(nc);
2644f9d6dbf0SWen Congyang 
2645f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2);
2646f9d6dbf0SWen Congyang     if (q->tx_timer) {
2647f9d6dbf0SWen Congyang         timer_free(q->tx_timer);
2648f989c30cSYunjian Wang         q->tx_timer = NULL;
2649f9d6dbf0SWen Congyang     } else {
2650f9d6dbf0SWen Congyang         qemu_bh_delete(q->tx_bh);
2651f989c30cSYunjian Wang         q->tx_bh = NULL;
2652f9d6dbf0SWen Congyang     }
2653f989c30cSYunjian Wang     q->tx_waiting = 0;
2654f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2 + 1);
2655f9d6dbf0SWen Congyang }
2656f9d6dbf0SWen Congyang 
2657f9d6dbf0SWen Congyang static void virtio_net_change_num_queues(VirtIONet *n, int new_max_queues)
2658f9d6dbf0SWen Congyang {
2659f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2660f9d6dbf0SWen Congyang     int old_num_queues = virtio_get_num_queues(vdev);
2661f9d6dbf0SWen Congyang     int new_num_queues = new_max_queues * 2 + 1;
2662f9d6dbf0SWen Congyang     int i;
2663f9d6dbf0SWen Congyang 
2664f9d6dbf0SWen Congyang     assert(old_num_queues >= 3);
2665f9d6dbf0SWen Congyang     assert(old_num_queues % 2 == 1);
2666f9d6dbf0SWen Congyang 
2667f9d6dbf0SWen Congyang     if (old_num_queues == new_num_queues) {
2668f9d6dbf0SWen Congyang         return;
2669f9d6dbf0SWen Congyang     }
2670f9d6dbf0SWen Congyang 
2671f9d6dbf0SWen Congyang     /*
2672f9d6dbf0SWen Congyang      * We always need to remove and add ctrl vq if
2673f9d6dbf0SWen Congyang      * old_num_queues != new_num_queues. Remove ctrl_vq first,
267420f86a75SYuval Shaia      * and then we only enter one of the following two loops.
2675f9d6dbf0SWen Congyang      */
2676f9d6dbf0SWen Congyang     virtio_del_queue(vdev, old_num_queues - 1);
2677f9d6dbf0SWen Congyang 
2678f9d6dbf0SWen Congyang     for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) {
2679f9d6dbf0SWen Congyang         /* new_num_queues < old_num_queues */
2680f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i / 2);
2681f9d6dbf0SWen Congyang     }
2682f9d6dbf0SWen Congyang 
2683f9d6dbf0SWen Congyang     for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) {
2684f9d6dbf0SWen Congyang         /* new_num_queues > old_num_queues */
2685f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i / 2);
2686f9d6dbf0SWen Congyang     }
2687f9d6dbf0SWen Congyang 
2688f9d6dbf0SWen Congyang     /* add ctrl_vq last */
2689f9d6dbf0SWen Congyang     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
2690f9d6dbf0SWen Congyang }
2691f9d6dbf0SWen Congyang 
2692ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
26936e790746SPaolo Bonzini {
2694f9d6dbf0SWen Congyang     int max = multiqueue ? n->max_queues : 1;
2695f9d6dbf0SWen Congyang 
26966e790746SPaolo Bonzini     n->multiqueue = multiqueue;
2697f9d6dbf0SWen Congyang     virtio_net_change_num_queues(n, max);
26986e790746SPaolo Bonzini 
26996e790746SPaolo Bonzini     virtio_net_set_queues(n);
27006e790746SPaolo Bonzini }
27016e790746SPaolo Bonzini 
2702982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id)
2703037dab2fSGreg Kurz {
2704982b78c5SDr. David Alan Gilbert     VirtIONet *n = opaque;
2705982b78c5SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2706037dab2fSGreg Kurz     int i, link_down;
2707037dab2fSGreg Kurz 
27089d8c6a25SDr. David Alan Gilbert     trace_virtio_net_post_load_device();
2709982b78c5SDr. David Alan Gilbert     virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs,
271095129d6fSCornelia Huck                                virtio_vdev_has_feature(vdev,
2711e22f0603SYuri Benditovich                                                        VIRTIO_F_VERSION_1),
2712e22f0603SYuri Benditovich                                virtio_vdev_has_feature(vdev,
2713e22f0603SYuri Benditovich                                                        VIRTIO_NET_F_HASH_REPORT));
27146e790746SPaolo Bonzini 
27156e790746SPaolo Bonzini     /* MAC_TABLE_ENTRIES may be different from the saved image */
2716982b78c5SDr. David Alan Gilbert     if (n->mac_table.in_use > MAC_TABLE_ENTRIES) {
27176e790746SPaolo Bonzini         n->mac_table.in_use = 0;
27186e790746SPaolo Bonzini     }
27196e790746SPaolo Bonzini 
2720982b78c5SDr. David Alan Gilbert     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
27216c666823SMichael S. Tsirkin         n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
27226c666823SMichael S. Tsirkin     }
27236c666823SMichael S. Tsirkin 
27247788c3f2SMikhail Sennikovsky     /*
27257788c3f2SMikhail Sennikovsky      * curr_guest_offloads will be later overwritten by the
27267788c3f2SMikhail Sennikovsky      * virtio_set_features_nocheck call done from the virtio_load.
27277788c3f2SMikhail Sennikovsky      * Here we make sure it is preserved and restored accordingly
27287788c3f2SMikhail Sennikovsky      * in the virtio_net_post_load_virtio callback.
27297788c3f2SMikhail Sennikovsky      */
27307788c3f2SMikhail Sennikovsky     n->saved_guest_offloads = n->curr_guest_offloads;
27316c666823SMichael S. Tsirkin 
27326e790746SPaolo Bonzini     virtio_net_set_queues(n);
27336e790746SPaolo Bonzini 
27346e790746SPaolo Bonzini     /* Find the first multicast entry in the saved MAC filter */
27356e790746SPaolo Bonzini     for (i = 0; i < n->mac_table.in_use; i++) {
27366e790746SPaolo Bonzini         if (n->mac_table.macs[i * ETH_ALEN] & 1) {
27376e790746SPaolo Bonzini             break;
27386e790746SPaolo Bonzini         }
27396e790746SPaolo Bonzini     }
27406e790746SPaolo Bonzini     n->mac_table.first_multi = i;
27416e790746SPaolo Bonzini 
27426e790746SPaolo Bonzini     /* nc.link_down can't be migrated, so infer link_down according
27436e790746SPaolo Bonzini      * to link status bit in n->status */
27446e790746SPaolo Bonzini     link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
27456e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
27466e790746SPaolo Bonzini         qemu_get_subqueue(n->nic, i)->link_down = link_down;
27476e790746SPaolo Bonzini     }
27486e790746SPaolo Bonzini 
27496c666823SMichael S. Tsirkin     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
27506c666823SMichael S. Tsirkin         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
27519d8c6a25SDr. David Alan Gilbert         qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
27529d8c6a25SDr. David Alan Gilbert                                   QEMU_CLOCK_VIRTUAL,
27539d8c6a25SDr. David Alan Gilbert                                   virtio_net_announce_timer, n);
27549d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
27559d8c6a25SDr. David Alan Gilbert             timer_mod(n->announce_timer.tm,
27569d8c6a25SDr. David Alan Gilbert                       qemu_clock_get_ms(n->announce_timer.type));
27579d8c6a25SDr. David Alan Gilbert         } else {
2758944458b6SDr. David Alan Gilbert             qemu_announce_timer_del(&n->announce_timer, false);
27599d8c6a25SDr. David Alan Gilbert         }
27606c666823SMichael S. Tsirkin     }
27616c666823SMichael S. Tsirkin 
2762e41b7114SYuri Benditovich     if (n->rss_data.enabled) {
2763e41b7114SYuri Benditovich         trace_virtio_net_rss_enable(n->rss_data.hash_types,
2764e41b7114SYuri Benditovich                                     n->rss_data.indirections_len,
2765e41b7114SYuri Benditovich                                     sizeof(n->rss_data.key));
2766e41b7114SYuri Benditovich     } else {
2767e41b7114SYuri Benditovich         trace_virtio_net_rss_disable();
2768e41b7114SYuri Benditovich     }
27696e790746SPaolo Bonzini     return 0;
27706e790746SPaolo Bonzini }
27716e790746SPaolo Bonzini 
27727788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev)
27737788c3f2SMikhail Sennikovsky {
27747788c3f2SMikhail Sennikovsky     VirtIONet *n = VIRTIO_NET(vdev);
27757788c3f2SMikhail Sennikovsky     /*
27767788c3f2SMikhail Sennikovsky      * The actual needed state is now in saved_guest_offloads,
27777788c3f2SMikhail Sennikovsky      * see virtio_net_post_load_device for detail.
27787788c3f2SMikhail Sennikovsky      * Restore it back and apply the desired offloads.
27797788c3f2SMikhail Sennikovsky      */
27807788c3f2SMikhail Sennikovsky     n->curr_guest_offloads = n->saved_guest_offloads;
27817788c3f2SMikhail Sennikovsky     if (peer_has_vnet_hdr(n)) {
27827788c3f2SMikhail Sennikovsky         virtio_net_apply_guest_offloads(n);
27837788c3f2SMikhail Sennikovsky     }
27847788c3f2SMikhail Sennikovsky 
27857788c3f2SMikhail Sennikovsky     return 0;
27867788c3f2SMikhail Sennikovsky }
27877788c3f2SMikhail Sennikovsky 
2788982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */
2789982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = {
2790982b78c5SDr. David Alan Gilbert     .name = "virtio-net-queue-tx_waiting",
2791982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
2792982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(tx_waiting, VirtIONetQueue),
2793982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2794982b78c5SDr. David Alan Gilbert    },
2795982b78c5SDr. David Alan Gilbert };
2796982b78c5SDr. David Alan Gilbert 
2797982b78c5SDr. David Alan Gilbert static bool max_queues_gt_1(void *opaque, int version_id)
2798982b78c5SDr. David Alan Gilbert {
2799982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->max_queues > 1;
2800982b78c5SDr. David Alan Gilbert }
2801982b78c5SDr. David Alan Gilbert 
2802982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id)
2803982b78c5SDr. David Alan Gilbert {
2804982b78c5SDr. David Alan Gilbert     return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque),
2805982b78c5SDr. David Alan Gilbert                                    VIRTIO_NET_F_CTRL_GUEST_OFFLOADS);
2806982b78c5SDr. David Alan Gilbert }
2807982b78c5SDr. David Alan Gilbert 
2808982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id)
2809982b78c5SDr. David Alan Gilbert {
2810982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES;
2811982b78c5SDr. David Alan Gilbert }
2812982b78c5SDr. David Alan Gilbert 
2813982b78c5SDr. David Alan Gilbert static bool mac_table_doesnt_fit(void *opaque, int version_id)
2814982b78c5SDr. David Alan Gilbert {
2815982b78c5SDr. David Alan Gilbert     return !mac_table_fits(opaque, version_id);
2816982b78c5SDr. David Alan Gilbert }
2817982b78c5SDr. David Alan Gilbert 
2818982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods
2819982b78c5SDr. David Alan Gilbert  * although only some fields are used by each.
2820982b78c5SDr. David Alan Gilbert  */
2821982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp {
2822982b78c5SDr. David Alan Gilbert     VirtIONet      *parent;
2823982b78c5SDr. David Alan Gilbert     VirtIONetQueue *vqs_1;
2824982b78c5SDr. David Alan Gilbert     uint16_t        curr_queues_1;
2825982b78c5SDr. David Alan Gilbert     uint8_t         has_ufo;
2826982b78c5SDr. David Alan Gilbert     uint32_t        has_vnet_hdr;
2827982b78c5SDr. David Alan Gilbert };
2828982b78c5SDr. David Alan Gilbert 
2829982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than
2830982b78c5SDr. David Alan Gilbert  * the 1st entry in the queues and only if there's more than one
2831982b78c5SDr. David Alan Gilbert  * entry.  We use the tmp mechanism to calculate a temporary
2832982b78c5SDr. David Alan Gilbert  * pointer and count and also validate the count.
2833982b78c5SDr. David Alan Gilbert  */
2834982b78c5SDr. David Alan Gilbert 
283544b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque)
2836982b78c5SDr. David Alan Gilbert {
2837982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2838982b78c5SDr. David Alan Gilbert 
2839982b78c5SDr. David Alan Gilbert     tmp->vqs_1 = tmp->parent->vqs + 1;
2840982b78c5SDr. David Alan Gilbert     tmp->curr_queues_1 = tmp->parent->curr_queues - 1;
2841982b78c5SDr. David Alan Gilbert     if (tmp->parent->curr_queues == 0) {
2842982b78c5SDr. David Alan Gilbert         tmp->curr_queues_1 = 0;
2843982b78c5SDr. David Alan Gilbert     }
284444b1ff31SDr. David Alan Gilbert 
284544b1ff31SDr. David Alan Gilbert     return 0;
2846982b78c5SDr. David Alan Gilbert }
2847982b78c5SDr. David Alan Gilbert 
2848982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque)
2849982b78c5SDr. David Alan Gilbert {
2850982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2851982b78c5SDr. David Alan Gilbert 
2852982b78c5SDr. David Alan Gilbert     /* Reuse the pointer setup from save */
2853982b78c5SDr. David Alan Gilbert     virtio_net_tx_waiting_pre_save(opaque);
2854982b78c5SDr. David Alan Gilbert 
2855982b78c5SDr. David Alan Gilbert     if (tmp->parent->curr_queues > tmp->parent->max_queues) {
2856982b78c5SDr. David Alan Gilbert         error_report("virtio-net: curr_queues %x > max_queues %x",
2857982b78c5SDr. David Alan Gilbert             tmp->parent->curr_queues, tmp->parent->max_queues);
2858982b78c5SDr. David Alan Gilbert 
2859982b78c5SDr. David Alan Gilbert         return -EINVAL;
2860982b78c5SDr. David Alan Gilbert     }
2861982b78c5SDr. David Alan Gilbert 
2862982b78c5SDr. David Alan Gilbert     return 0; /* all good */
2863982b78c5SDr. David Alan Gilbert }
2864982b78c5SDr. David Alan Gilbert 
2865982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = {
2866982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-tx_waiting",
2867982b78c5SDr. David Alan Gilbert     .pre_load  = virtio_net_tx_waiting_pre_load,
2868982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_tx_waiting_pre_save,
2869982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2870982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp,
2871982b78c5SDr. David Alan Gilbert                                      curr_queues_1,
2872982b78c5SDr. David Alan Gilbert                                      vmstate_virtio_net_queue_tx_waiting,
2873982b78c5SDr. David Alan Gilbert                                      struct VirtIONetQueue),
2874982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2875982b78c5SDr. David Alan Gilbert     },
2876982b78c5SDr. David Alan Gilbert };
2877982b78c5SDr. David Alan Gilbert 
2878982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the
2879982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
2880982b78c5SDr. David Alan Gilbert  */
2881982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id)
2882982b78c5SDr. David Alan Gilbert {
2883982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2884982b78c5SDr. David Alan Gilbert 
2885982b78c5SDr. David Alan Gilbert     if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) {
2886982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires TUN_F_UFO support");
2887982b78c5SDr. David Alan Gilbert         return -EINVAL;
2888982b78c5SDr. David Alan Gilbert     }
2889982b78c5SDr. David Alan Gilbert 
2890982b78c5SDr. David Alan Gilbert     return 0;
2891982b78c5SDr. David Alan Gilbert }
2892982b78c5SDr. David Alan Gilbert 
289344b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque)
2894982b78c5SDr. David Alan Gilbert {
2895982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2896982b78c5SDr. David Alan Gilbert 
2897982b78c5SDr. David Alan Gilbert     tmp->has_ufo = tmp->parent->has_ufo;
289844b1ff31SDr. David Alan Gilbert 
289944b1ff31SDr. David Alan Gilbert     return 0;
2900982b78c5SDr. David Alan Gilbert }
2901982b78c5SDr. David Alan Gilbert 
2902982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = {
2903982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-ufo",
2904982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_ufo_post_load,
2905982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_ufo_pre_save,
2906982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2907982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp),
2908982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2909982b78c5SDr. David Alan Gilbert     },
2910982b78c5SDr. David Alan Gilbert };
2911982b78c5SDr. David Alan Gilbert 
2912982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the
2913982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
2914982b78c5SDr. David Alan Gilbert  */
2915982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id)
2916982b78c5SDr. David Alan Gilbert {
2917982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2918982b78c5SDr. David Alan Gilbert 
2919982b78c5SDr. David Alan Gilbert     if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) {
2920982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires vnet_hdr=on");
2921982b78c5SDr. David Alan Gilbert         return -EINVAL;
2922982b78c5SDr. David Alan Gilbert     }
2923982b78c5SDr. David Alan Gilbert 
2924982b78c5SDr. David Alan Gilbert     return 0;
2925982b78c5SDr. David Alan Gilbert }
2926982b78c5SDr. David Alan Gilbert 
292744b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque)
2928982b78c5SDr. David Alan Gilbert {
2929982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2930982b78c5SDr. David Alan Gilbert 
2931982b78c5SDr. David Alan Gilbert     tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr;
293244b1ff31SDr. David Alan Gilbert 
293344b1ff31SDr. David Alan Gilbert     return 0;
2934982b78c5SDr. David Alan Gilbert }
2935982b78c5SDr. David Alan Gilbert 
2936982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = {
2937982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-vnet",
2938982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_vnet_post_load,
2939982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_vnet_pre_save,
2940982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2941982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp),
2942982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2943982b78c5SDr. David Alan Gilbert     },
2944982b78c5SDr. David Alan Gilbert };
2945982b78c5SDr. David Alan Gilbert 
2946e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque)
2947e41b7114SYuri Benditovich {
2948e41b7114SYuri Benditovich     return VIRTIO_NET(opaque)->rss_data.enabled;
2949e41b7114SYuri Benditovich }
2950e41b7114SYuri Benditovich 
2951e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = {
2952e41b7114SYuri Benditovich     .name      = "virtio-net-device/rss",
2953e41b7114SYuri Benditovich     .version_id = 1,
2954e41b7114SYuri Benditovich     .minimum_version_id = 1,
2955e41b7114SYuri Benditovich     .needed = virtio_net_rss_needed,
2956e41b7114SYuri Benditovich     .fields = (VMStateField[]) {
2957e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.enabled, VirtIONet),
2958e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.redirect, VirtIONet),
2959e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.populate_hash, VirtIONet),
2960e41b7114SYuri Benditovich         VMSTATE_UINT32(rss_data.hash_types, VirtIONet),
2961e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.indirections_len, VirtIONet),
2962e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.default_queue, VirtIONet),
2963e41b7114SYuri Benditovich         VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet,
2964e41b7114SYuri Benditovich                             VIRTIO_NET_RSS_MAX_KEY_SIZE),
2965e41b7114SYuri Benditovich         VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet,
2966e41b7114SYuri Benditovich                                     rss_data.indirections_len, 0,
2967e41b7114SYuri Benditovich                                     vmstate_info_uint16, uint16_t),
2968e41b7114SYuri Benditovich         VMSTATE_END_OF_LIST()
2969e41b7114SYuri Benditovich     },
2970e41b7114SYuri Benditovich };
2971e41b7114SYuri Benditovich 
2972982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = {
2973982b78c5SDr. David Alan Gilbert     .name = "virtio-net-device",
2974982b78c5SDr. David Alan Gilbert     .version_id = VIRTIO_NET_VM_VERSION,
2975982b78c5SDr. David Alan Gilbert     .minimum_version_id = VIRTIO_NET_VM_VERSION,
2976982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_post_load_device,
2977982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
2978982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN),
2979982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_POINTER(vqs, VirtIONet,
2980982b78c5SDr. David Alan Gilbert                                vmstate_virtio_net_queue_tx_waiting,
2981982b78c5SDr. David Alan Gilbert                                VirtIONetQueue),
2982982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet),
2983982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16(status, VirtIONet),
2984982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(promisc, VirtIONet),
2985982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(allmulti, VirtIONet),
2986982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mac_table.in_use, VirtIONet),
2987982b78c5SDr. David Alan Gilbert 
2988982b78c5SDr. David Alan Gilbert         /* Guarded pair: If it fits we load it, else we throw it away
2989982b78c5SDr. David Alan Gilbert          * - can happen if source has a larger MAC table.; post-load
2990982b78c5SDr. David Alan Gilbert          *  sets flags in this case.
2991982b78c5SDr. David Alan Gilbert          */
2992982b78c5SDr. David Alan Gilbert         VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet,
2993982b78c5SDr. David Alan Gilbert                                 0, mac_table_fits, mac_table.in_use,
2994982b78c5SDr. David Alan Gilbert                                  ETH_ALEN),
2995982b78c5SDr. David Alan Gilbert         VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0,
2996982b78c5SDr. David Alan Gilbert                                      mac_table.in_use, ETH_ALEN),
2997982b78c5SDr. David Alan Gilbert 
2998982b78c5SDr. David Alan Gilbert         /* Note: This is an array of uint32's that's always been saved as a
2999982b78c5SDr. David Alan Gilbert          * buffer; hold onto your endiannesses; it's actually used as a bitmap
3000982b78c5SDr. David Alan Gilbert          * but based on the uint.
3001982b78c5SDr. David Alan Gilbert          */
3002982b78c5SDr. David Alan Gilbert         VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3),
3003982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3004982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_vnet),
3005982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet),
3006982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet),
3007982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(alluni, VirtIONet),
3008982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nomulti, VirtIONet),
3009982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nouni, VirtIONet),
3010982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nobcast, VirtIONet),
3011982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3012982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_ufo),
3013982b78c5SDr. David Alan Gilbert         VMSTATE_SINGLE_TEST(max_queues, VirtIONet, max_queues_gt_1, 0,
3014982b78c5SDr. David Alan Gilbert                             vmstate_info_uint16_equal, uint16_t),
3015982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16_TEST(curr_queues, VirtIONet, max_queues_gt_1),
3016982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3017982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_tx_waiting),
3018982b78c5SDr. David Alan Gilbert         VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet,
3019982b78c5SDr. David Alan Gilbert                             has_ctrl_guest_offloads),
3020982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3021982b78c5SDr. David Alan Gilbert    },
3022e41b7114SYuri Benditovich     .subsections = (const VMStateDescription * []) {
3023e41b7114SYuri Benditovich         &vmstate_virtio_net_rss,
3024e41b7114SYuri Benditovich         NULL
3025e41b7114SYuri Benditovich     }
3026982b78c5SDr. David Alan Gilbert };
3027982b78c5SDr. David Alan Gilbert 
30286e790746SPaolo Bonzini static NetClientInfo net_virtio_info = {
3029f394b2e2SEric Blake     .type = NET_CLIENT_DRIVER_NIC,
30306e790746SPaolo Bonzini     .size = sizeof(NICState),
30316e790746SPaolo Bonzini     .can_receive = virtio_net_can_receive,
30326e790746SPaolo Bonzini     .receive = virtio_net_receive,
30336e790746SPaolo Bonzini     .link_status_changed = virtio_net_set_link_status,
3034b1be4280SAmos Kong     .query_rx_filter = virtio_net_query_rxfilter,
3035b2c929f0SDr. David Alan Gilbert     .announce = virtio_net_announce,
30366e790746SPaolo Bonzini };
30376e790746SPaolo Bonzini 
30386e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
30396e790746SPaolo Bonzini {
304017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
30416e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
30426e790746SPaolo Bonzini     assert(n->vhost_started);
3043ed8b4afeSNikolay Nikolaev     return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx);
30446e790746SPaolo Bonzini }
30456e790746SPaolo Bonzini 
30466e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
30476e790746SPaolo Bonzini                                            bool mask)
30486e790746SPaolo Bonzini {
304917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
30506e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
30516e790746SPaolo Bonzini     assert(n->vhost_started);
3052ed8b4afeSNikolay Nikolaev     vhost_net_virtqueue_mask(get_vhost_net(nc->peer),
30536e790746SPaolo Bonzini                              vdev, idx, mask);
30546e790746SPaolo Bonzini }
30556e790746SPaolo Bonzini 
3056019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features)
30576e790746SPaolo Bonzini {
30580cd09c3aSCornelia Huck     virtio_add_feature(&host_features, VIRTIO_NET_F_MAC);
3059a93e599dSMaxime Coquelin 
3060ba550851SStefano Garzarella     n->config_size = virtio_feature_get_config_size(feature_sizes,
3061ba550851SStefano Garzarella                                                     host_features);
306217ec5a86SKONRAD Frederic }
30636e790746SPaolo Bonzini 
30648a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
30658a253ec2SKONRAD Frederic                                    const char *type)
30668a253ec2SKONRAD Frederic {
30678a253ec2SKONRAD Frederic     /*
30688a253ec2SKONRAD Frederic      * The name can be NULL, the netclient name will be type.x.
30698a253ec2SKONRAD Frederic      */
30708a253ec2SKONRAD Frederic     assert(type != NULL);
30718a253ec2SKONRAD Frederic 
30728a253ec2SKONRAD Frederic     g_free(n->netclient_name);
30738a253ec2SKONRAD Frederic     g_free(n->netclient_type);
30748a253ec2SKONRAD Frederic     n->netclient_name = g_strdup(name);
30758a253ec2SKONRAD Frederic     n->netclient_type = g_strdup(type);
30768a253ec2SKONRAD Frederic }
30778a253ec2SKONRAD Frederic 
30780e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev)
30799711cd0dSJens Freimann {
30809711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
30819711cd0dSJens Freimann     PCIDevice *pci_dev;
30829711cd0dSJens Freimann     Error *err = NULL;
30839711cd0dSJens Freimann 
30840e9a65c5SJuan Quintela     hotplug_ctrl = qdev_get_hotplug_handler(dev);
30859711cd0dSJens Freimann     if (hotplug_ctrl) {
30860e9a65c5SJuan Quintela         pci_dev = PCI_DEVICE(dev);
30879711cd0dSJens Freimann         pci_dev->partially_hotplugged = true;
30880e9a65c5SJuan Quintela         hotplug_handler_unplug_request(hotplug_ctrl, dev, &err);
30899711cd0dSJens Freimann         if (err) {
30909711cd0dSJens Freimann             error_report_err(err);
30919711cd0dSJens Freimann             return false;
30929711cd0dSJens Freimann         }
30939711cd0dSJens Freimann     } else {
30949711cd0dSJens Freimann         return false;
30959711cd0dSJens Freimann     }
30969711cd0dSJens Freimann     return true;
30979711cd0dSJens Freimann }
30989711cd0dSJens Freimann 
30990e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev,
31000e9a65c5SJuan Quintela                                     Error **errp)
31019711cd0dSJens Freimann {
31025a0948d3SMarkus Armbruster     Error *err = NULL;
31039711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
31040e9a65c5SJuan Quintela     PCIDevice *pdev = PCI_DEVICE(dev);
310578274682SJuan Quintela     BusState *primary_bus;
31069711cd0dSJens Freimann 
31079711cd0dSJens Freimann     if (!pdev->partially_hotplugged) {
31089711cd0dSJens Freimann         return true;
31099711cd0dSJens Freimann     }
31100e9a65c5SJuan Quintela     primary_bus = dev->parent_bus;
311178274682SJuan Quintela     if (!primary_bus) {
3112150ab54aSJens Freimann         error_setg(errp, "virtio_net: couldn't find primary bus");
31135a0948d3SMarkus Armbruster         return false;
31149711cd0dSJens Freimann     }
31150e9a65c5SJuan Quintela     qdev_set_parent_bus(dev, primary_bus, &error_abort);
3116e2bde83eSJuan Quintela     qatomic_set(&n->failover_primary_hidden, false);
31170e9a65c5SJuan Quintela     hotplug_ctrl = qdev_get_hotplug_handler(dev);
31189711cd0dSJens Freimann     if (hotplug_ctrl) {
31190e9a65c5SJuan Quintela         hotplug_handler_pre_plug(hotplug_ctrl, dev, &err);
31205a0948d3SMarkus Armbruster         if (err) {
31215a0948d3SMarkus Armbruster             goto out;
31225a0948d3SMarkus Armbruster         }
31230e9a65c5SJuan Quintela         hotplug_handler_plug(hotplug_ctrl, dev, &err);
31249711cd0dSJens Freimann     }
3125150ab54aSJens Freimann 
3126150ab54aSJens Freimann out:
31275a0948d3SMarkus Armbruster     error_propagate(errp, err);
31285a0948d3SMarkus Armbruster     return !err;
31299711cd0dSJens Freimann }
31309711cd0dSJens Freimann 
313107a5d816SJuan Quintela static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationState *s)
31329711cd0dSJens Freimann {
31339711cd0dSJens Freimann     bool should_be_hidden;
31349711cd0dSJens Freimann     Error *err = NULL;
313507a5d816SJuan Quintela     DeviceState *dev = failover_find_primary_device(n);
313607a5d816SJuan Quintela 
313707a5d816SJuan Quintela     if (!dev) {
313807a5d816SJuan Quintela         return;
313907a5d816SJuan Quintela     }
31409711cd0dSJens Freimann 
3141e2bde83eSJuan Quintela     should_be_hidden = qatomic_read(&n->failover_primary_hidden);
31429711cd0dSJens Freimann 
31434dbac1aeSMarkus Armbruster     if (migration_in_setup(s) && !should_be_hidden) {
314407a5d816SJuan Quintela         if (failover_unplug_primary(n, dev)) {
314507a5d816SJuan Quintela             vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev);
314607a5d816SJuan Quintela             qapi_event_send_unplug_primary(dev->id);
3147e2bde83eSJuan Quintela             qatomic_set(&n->failover_primary_hidden, true);
31489711cd0dSJens Freimann         } else {
31499711cd0dSJens Freimann             warn_report("couldn't unplug primary device");
31509711cd0dSJens Freimann         }
31519711cd0dSJens Freimann     } else if (migration_has_failed(s)) {
3152150ab54aSJens Freimann         /* We already unplugged the device let's plug it back */
315307a5d816SJuan Quintela         if (!failover_replug_primary(n, dev, &err)) {
31549711cd0dSJens Freimann             if (err) {
31559711cd0dSJens Freimann                 error_report_err(err);
31569711cd0dSJens Freimann             }
31579711cd0dSJens Freimann         }
31589711cd0dSJens Freimann     }
31599711cd0dSJens Freimann }
31609711cd0dSJens Freimann 
31619711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data)
31629711cd0dSJens Freimann {
31639711cd0dSJens Freimann     MigrationState *s = data;
31649711cd0dSJens Freimann     VirtIONet *n = container_of(notifier, VirtIONet, migration_state);
31659711cd0dSJens Freimann     virtio_net_handle_migration_primary(n, s);
31669711cd0dSJens Freimann }
31679711cd0dSJens Freimann 
3168b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener,
31699711cd0dSJens Freimann                                          QemuOpts *device_opts)
31709711cd0dSJens Freimann {
31719711cd0dSJens Freimann     VirtIONet *n = container_of(listener, VirtIONet, primary_listener);
31724f0303aeSJuan Quintela     const char *standby_id;
31739711cd0dSJens Freimann 
31744d0e59acSJens Freimann     if (!device_opts) {
317589631fedSJuan Quintela         return false;
31764d0e59acSJens Freimann     }
31774f0303aeSJuan Quintela     standby_id = qemu_opt_get(device_opts, "failover_pair_id");
317889631fedSJuan Quintela     if (g_strcmp0(standby_id, n->netclient_name) != 0) {
317989631fedSJuan Quintela         return false;
31809711cd0dSJens Freimann     }
31819711cd0dSJens Freimann 
3182e2bde83eSJuan Quintela     /* failover_primary_hidden is set during feature negotiation */
31833abad4a2SJuan Quintela     return qatomic_read(&n->failover_primary_hidden);
31849711cd0dSJens Freimann }
31859711cd0dSJens Freimann 
3186e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp)
318717ec5a86SKONRAD Frederic {
3188e6f746b3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3189284a32f0SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3190284a32f0SAndreas Färber     NetClientState *nc;
31911773d9eeSKONRAD Frederic     int i;
319217ec5a86SKONRAD Frederic 
3193a93e599dSMaxime Coquelin     if (n->net_conf.mtu) {
3194127833eeSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_MTU);
3195a93e599dSMaxime Coquelin     }
3196a93e599dSMaxime Coquelin 
31979473939eSJason Baron     if (n->net_conf.duplex_str) {
31989473939eSJason Baron         if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) {
31999473939eSJason Baron             n->net_conf.duplex = DUPLEX_HALF;
32009473939eSJason Baron         } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) {
32019473939eSJason Baron             n->net_conf.duplex = DUPLEX_FULL;
32029473939eSJason Baron         } else {
32039473939eSJason Baron             error_setg(errp, "'duplex' must be 'half' or 'full'");
3204843c4cfcSMarkus Armbruster             return;
32059473939eSJason Baron         }
32069473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
32079473939eSJason Baron     } else {
32089473939eSJason Baron         n->net_conf.duplex = DUPLEX_UNKNOWN;
32099473939eSJason Baron     }
32109473939eSJason Baron 
32119473939eSJason Baron     if (n->net_conf.speed < SPEED_UNKNOWN) {
32129473939eSJason Baron         error_setg(errp, "'speed' must be between 0 and INT_MAX");
3213843c4cfcSMarkus Armbruster         return;
3214843c4cfcSMarkus Armbruster     }
3215843c4cfcSMarkus Armbruster     if (n->net_conf.speed >= 0) {
32169473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
32179473939eSJason Baron     }
32189473939eSJason Baron 
32199711cd0dSJens Freimann     if (n->failover) {
3220b91ad981SJuan Quintela         n->primary_listener.hide_device = failover_hide_primary_device;
3221e2bde83eSJuan Quintela         qatomic_set(&n->failover_primary_hidden, true);
32229711cd0dSJens Freimann         device_listener_register(&n->primary_listener);
32239711cd0dSJens Freimann         n->migration_state.notify = virtio_net_migration_state_notifier;
32249711cd0dSJens Freimann         add_migration_state_change_notifier(&n->migration_state);
32259711cd0dSJens Freimann         n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY);
32269711cd0dSJens Freimann     }
32279711cd0dSJens Freimann 
3228da3e8a23SShannon Zhao     virtio_net_set_config_size(n, n->host_features);
3229284a32f0SAndreas Färber     virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size);
323017ec5a86SKONRAD Frederic 
32311c0fbfa3SMichael S. Tsirkin     /*
32321c0fbfa3SMichael S. Tsirkin      * We set a lower limit on RX queue size to what it always was.
32331c0fbfa3SMichael S. Tsirkin      * Guests that want a smaller ring can always resize it without
32341c0fbfa3SMichael S. Tsirkin      * help from us (using virtio 1 and up).
32351c0fbfa3SMichael S. Tsirkin      */
32361c0fbfa3SMichael S. Tsirkin     if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE ||
32371c0fbfa3SMichael S. Tsirkin         n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE ||
32385f997fd1SMichal Privoznik         !is_power_of_2(n->net_conf.rx_queue_size)) {
32391c0fbfa3SMichael S. Tsirkin         error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), "
32401c0fbfa3SMichael S. Tsirkin                    "must be a power of 2 between %d and %d.",
32411c0fbfa3SMichael S. Tsirkin                    n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE,
32421c0fbfa3SMichael S. Tsirkin                    VIRTQUEUE_MAX_SIZE);
32431c0fbfa3SMichael S. Tsirkin         virtio_cleanup(vdev);
32441c0fbfa3SMichael S. Tsirkin         return;
32451c0fbfa3SMichael S. Tsirkin     }
32461c0fbfa3SMichael S. Tsirkin 
32479b02e161SWei Wang     if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE ||
32489b02e161SWei Wang         n->net_conf.tx_queue_size > VIRTQUEUE_MAX_SIZE ||
32499b02e161SWei Wang         !is_power_of_2(n->net_conf.tx_queue_size)) {
32509b02e161SWei Wang         error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), "
32519b02e161SWei Wang                    "must be a power of 2 between %d and %d",
32529b02e161SWei Wang                    n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE,
32539b02e161SWei Wang                    VIRTQUEUE_MAX_SIZE);
32549b02e161SWei Wang         virtio_cleanup(vdev);
32559b02e161SWei Wang         return;
32569b02e161SWei Wang     }
32579b02e161SWei Wang 
3258575a1c0eSJiri Pirko     n->max_queues = MAX(n->nic_conf.peers.queues, 1);
325987b3bd1cSJason Wang     if (n->max_queues * 2 + 1 > VIRTIO_QUEUE_MAX) {
32607e0e736eSJason Wang         error_setg(errp, "Invalid number of queues (= %" PRIu32 "), "
3261631b22eaSStefan Weil                    "must be a positive integer less than %d.",
326287b3bd1cSJason Wang                    n->max_queues, (VIRTIO_QUEUE_MAX - 1) / 2);
32637e0e736eSJason Wang         virtio_cleanup(vdev);
32647e0e736eSJason Wang         return;
32657e0e736eSJason Wang     }
32666e790746SPaolo Bonzini     n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queues);
32676e790746SPaolo Bonzini     n->curr_queues = 1;
32681773d9eeSKONRAD Frederic     n->tx_timeout = n->net_conf.txtimer;
32696e790746SPaolo Bonzini 
32701773d9eeSKONRAD Frederic     if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
32711773d9eeSKONRAD Frederic                        && strcmp(n->net_conf.tx, "bh")) {
32720765691eSMarkus Armbruster         warn_report("virtio-net: "
32736e790746SPaolo Bonzini                     "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
32741773d9eeSKONRAD Frederic                     n->net_conf.tx);
32750765691eSMarkus Armbruster         error_printf("Defaulting to \"bh\"");
32766e790746SPaolo Bonzini     }
32776e790746SPaolo Bonzini 
32782eef278bSMichael S. Tsirkin     n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n),
32792eef278bSMichael S. Tsirkin                                     n->net_conf.tx_queue_size);
32809b02e161SWei Wang 
3281da51a335SJason Wang     for (i = 0; i < n->max_queues; i++) {
3282f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i);
3283da51a335SJason Wang     }
3284da51a335SJason Wang 
328517a0ca55SKONRAD Frederic     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
32861773d9eeSKONRAD Frederic     qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
32871773d9eeSKONRAD Frederic     memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
32886e790746SPaolo Bonzini     n->status = VIRTIO_NET_S_LINK_UP;
32899d8c6a25SDr. David Alan Gilbert     qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
32909d8c6a25SDr. David Alan Gilbert                               QEMU_CLOCK_VIRTUAL,
3291f57fcf70SJason Wang                               virtio_net_announce_timer, n);
3292b2c929f0SDr. David Alan Gilbert     n->announce_timer.round = 0;
32936e790746SPaolo Bonzini 
32948a253ec2SKONRAD Frederic     if (n->netclient_type) {
32958a253ec2SKONRAD Frederic         /*
32968a253ec2SKONRAD Frederic          * Happen when virtio_net_set_netclient_name has been called.
32978a253ec2SKONRAD Frederic          */
32988a253ec2SKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
32998a253ec2SKONRAD Frederic                               n->netclient_type, n->netclient_name, n);
33008a253ec2SKONRAD Frederic     } else {
33011773d9eeSKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
3302284a32f0SAndreas Färber                               object_get_typename(OBJECT(dev)), dev->id, n);
33038a253ec2SKONRAD Frederic     }
33048a253ec2SKONRAD Frederic 
33056e790746SPaolo Bonzini     peer_test_vnet_hdr(n);
33066e790746SPaolo Bonzini     if (peer_has_vnet_hdr(n)) {
33076e790746SPaolo Bonzini         for (i = 0; i < n->max_queues; i++) {
3308d6085e3aSStefan Hajnoczi             qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
33096e790746SPaolo Bonzini         }
33106e790746SPaolo Bonzini         n->host_hdr_len = sizeof(struct virtio_net_hdr);
33116e790746SPaolo Bonzini     } else {
33126e790746SPaolo Bonzini         n->host_hdr_len = 0;
33136e790746SPaolo Bonzini     }
33146e790746SPaolo Bonzini 
33151773d9eeSKONRAD Frederic     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
33166e790746SPaolo Bonzini 
33176e790746SPaolo Bonzini     n->vqs[0].tx_waiting = 0;
33181773d9eeSKONRAD Frederic     n->tx_burst = n->net_conf.txburst;
3319e22f0603SYuri Benditovich     virtio_net_set_mrg_rx_bufs(n, 0, 0, 0);
33206e790746SPaolo Bonzini     n->promisc = 1; /* for compatibility */
33216e790746SPaolo Bonzini 
33226e790746SPaolo Bonzini     n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
33236e790746SPaolo Bonzini 
33246e790746SPaolo Bonzini     n->vlans = g_malloc0(MAX_VLAN >> 3);
33256e790746SPaolo Bonzini 
3326b1be4280SAmos Kong     nc = qemu_get_queue(n->nic);
3327b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
3328b1be4280SAmos Kong 
3329e87936eaSCindy Lu    if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
3330e87936eaSCindy Lu         struct virtio_net_config netcfg = {};
3331e87936eaSCindy Lu         memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN);
3332e87936eaSCindy Lu         vhost_net_set_config(get_vhost_net(nc->peer),
3333e87936eaSCindy Lu             (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_MASTER);
3334e87936eaSCindy Lu     }
33352974e916SYuri Benditovich     QTAILQ_INIT(&n->rsc_chains);
3336284a32f0SAndreas Färber     n->qdev = dev;
33374474e37aSYuri Benditovich 
33384474e37aSYuri Benditovich     net_rx_pkt_init(&n->rx_pkt, false);
333917ec5a86SKONRAD Frederic }
334017ec5a86SKONRAD Frederic 
3341b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev)
334217ec5a86SKONRAD Frederic {
3343306ec6c3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3344306ec6c3SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3345f9d6dbf0SWen Congyang     int i, max_queues;
334617ec5a86SKONRAD Frederic 
334717ec5a86SKONRAD Frederic     /* This will stop vhost backend if appropriate. */
334817ec5a86SKONRAD Frederic     virtio_net_set_status(vdev, 0);
334917ec5a86SKONRAD Frederic 
33508a253ec2SKONRAD Frederic     g_free(n->netclient_name);
33518a253ec2SKONRAD Frederic     n->netclient_name = NULL;
33528a253ec2SKONRAD Frederic     g_free(n->netclient_type);
33538a253ec2SKONRAD Frederic     n->netclient_type = NULL;
33548a253ec2SKONRAD Frederic 
335517ec5a86SKONRAD Frederic     g_free(n->mac_table.macs);
335617ec5a86SKONRAD Frederic     g_free(n->vlans);
335717ec5a86SKONRAD Frederic 
33589711cd0dSJens Freimann     if (n->failover) {
335965018100SJuan Quintela         device_listener_unregister(&n->primary_listener);
33609711cd0dSJens Freimann     }
33619711cd0dSJens Freimann 
3362f9d6dbf0SWen Congyang     max_queues = n->multiqueue ? n->max_queues : 1;
3363f9d6dbf0SWen Congyang     for (i = 0; i < max_queues; i++) {
3364f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i);
336517ec5a86SKONRAD Frederic     }
3366d945d9f1SYuri Benditovich     /* delete also control vq */
3367d945d9f1SYuri Benditovich     virtio_del_queue(vdev, max_queues * 2);
3368944458b6SDr. David Alan Gilbert     qemu_announce_timer_del(&n->announce_timer, false);
336917ec5a86SKONRAD Frederic     g_free(n->vqs);
337017ec5a86SKONRAD Frederic     qemu_del_nic(n->nic);
33712974e916SYuri Benditovich     virtio_net_rsc_cleanup(n);
337259079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
33734474e37aSYuri Benditovich     net_rx_pkt_uninit(n->rx_pkt);
33746a1a8cc7SKONRAD Frederic     virtio_cleanup(vdev);
337517ec5a86SKONRAD Frederic }
337617ec5a86SKONRAD Frederic 
337717ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj)
337817ec5a86SKONRAD Frederic {
337917ec5a86SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(obj);
338017ec5a86SKONRAD Frederic 
338117ec5a86SKONRAD Frederic     /*
338217ec5a86SKONRAD Frederic      * The default config_size is sizeof(struct virtio_net_config).
338317ec5a86SKONRAD Frederic      * Can be overriden with virtio_net_set_config_size.
338417ec5a86SKONRAD Frederic      */
338517ec5a86SKONRAD Frederic     n->config_size = sizeof(struct virtio_net_config);
3386aa4197c3SGonglei     device_add_bootindex_property(obj, &n->nic_conf.bootindex,
3387aa4197c3SGonglei                                   "bootindex", "/ethernet-phy@0",
338840c2281cSMarkus Armbruster                                   DEVICE(n));
338917ec5a86SKONRAD Frederic }
339017ec5a86SKONRAD Frederic 
339144b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque)
33924d45dcfbSHalil Pasic {
33934d45dcfbSHalil Pasic     VirtIONet *n = opaque;
33944d45dcfbSHalil Pasic 
33954d45dcfbSHalil Pasic     /* At this point, backend must be stopped, otherwise
33964d45dcfbSHalil Pasic      * it might keep writing to memory. */
33974d45dcfbSHalil Pasic     assert(!n->vhost_started);
339844b1ff31SDr. David Alan Gilbert 
339944b1ff31SDr. David Alan Gilbert     return 0;
34004d45dcfbSHalil Pasic }
34014d45dcfbSHalil Pasic 
34029711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque)
34039711cd0dSJens Freimann {
34049711cd0dSJens Freimann     DeviceState *dev = opaque;
340521e8709bSJuan Quintela     DeviceState *primary;
34069711cd0dSJens Freimann     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
34079711cd0dSJens Freimann     VirtIONet *n = VIRTIO_NET(vdev);
34089711cd0dSJens Freimann 
3409284f42a5SJens Freimann     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) {
3410284f42a5SJens Freimann         return false;
3411284f42a5SJens Freimann     }
341221e8709bSJuan Quintela     primary = failover_find_primary_device(n);
341321e8709bSJuan Quintela     return primary ? primary->pending_deleted_event : false;
34149711cd0dSJens Freimann }
34159711cd0dSJens Freimann 
34169711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque)
34179711cd0dSJens Freimann {
34189711cd0dSJens Freimann     DeviceState *dev = opaque;
34199711cd0dSJens Freimann     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
34209711cd0dSJens Freimann 
34219711cd0dSJens Freimann     return vdc->primary_unplug_pending(dev);
34229711cd0dSJens Freimann }
34239711cd0dSJens Freimann 
34244d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = {
34254d45dcfbSHalil Pasic     .name = "virtio-net",
34264d45dcfbSHalil Pasic     .minimum_version_id = VIRTIO_NET_VM_VERSION,
34274d45dcfbSHalil Pasic     .version_id = VIRTIO_NET_VM_VERSION,
34284d45dcfbSHalil Pasic     .fields = (VMStateField[]) {
34294d45dcfbSHalil Pasic         VMSTATE_VIRTIO_DEVICE,
34304d45dcfbSHalil Pasic         VMSTATE_END_OF_LIST()
34314d45dcfbSHalil Pasic     },
34324d45dcfbSHalil Pasic     .pre_save = virtio_net_pre_save,
34339711cd0dSJens Freimann     .dev_unplug_pending = dev_unplug_pending,
34344d45dcfbSHalil Pasic };
3435290c2428SDr. David Alan Gilbert 
343617ec5a86SKONRAD Frederic static Property virtio_net_properties[] = {
3437127833eeSJason Baron     DEFINE_PROP_BIT64("csum", VirtIONet, host_features,
3438127833eeSJason Baron                     VIRTIO_NET_F_CSUM, true),
3439127833eeSJason Baron     DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features,
344087108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_CSUM, true),
3441127833eeSJason Baron     DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true),
3442127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features,
344387108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO4, true),
3444127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features,
344587108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO6, true),
3446127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features,
344787108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ECN, true),
3448127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features,
344987108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_UFO, true),
3450127833eeSJason Baron     DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features,
345187108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ANNOUNCE, true),
3452127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features,
345387108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO4, true),
3454127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features,
345587108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO6, true),
3456127833eeSJason Baron     DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features,
345787108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_ECN, true),
3458127833eeSJason Baron     DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features,
345987108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_UFO, true),
3460127833eeSJason Baron     DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features,
346187108bb2SShannon Zhao                     VIRTIO_NET_F_MRG_RXBUF, true),
3462127833eeSJason Baron     DEFINE_PROP_BIT64("status", VirtIONet, host_features,
346387108bb2SShannon Zhao                     VIRTIO_NET_F_STATUS, true),
3464127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features,
346587108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VQ, true),
3466127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features,
346787108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX, true),
3468127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features,
346987108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VLAN, true),
3470127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features,
347187108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX_EXTRA, true),
3472127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features,
347387108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_MAC_ADDR, true),
3474127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features,
347587108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true),
3476127833eeSJason Baron     DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false),
347759079029SYuri Benditovich     DEFINE_PROP_BIT64("rss", VirtIONet, host_features,
347859079029SYuri Benditovich                     VIRTIO_NET_F_RSS, false),
3479e22f0603SYuri Benditovich     DEFINE_PROP_BIT64("hash", VirtIONet, host_features,
3480e22f0603SYuri Benditovich                     VIRTIO_NET_F_HASH_REPORT, false),
34812974e916SYuri Benditovich     DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features,
34822974e916SYuri Benditovich                     VIRTIO_NET_F_RSC_EXT, false),
34832974e916SYuri Benditovich     DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout,
34842974e916SYuri Benditovich                        VIRTIO_NET_RSC_DEFAULT_INTERVAL),
348517ec5a86SKONRAD Frederic     DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
348617ec5a86SKONRAD Frederic     DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
348717ec5a86SKONRAD Frederic                        TX_TIMER_INTERVAL),
348817ec5a86SKONRAD Frederic     DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
348917ec5a86SKONRAD Frederic     DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
34901c0fbfa3SMichael S. Tsirkin     DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size,
34911c0fbfa3SMichael S. Tsirkin                        VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE),
34929b02e161SWei Wang     DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size,
34939b02e161SWei Wang                        VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE),
3494a93e599dSMaxime Coquelin     DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0),
349575ebec11SMaxime Coquelin     DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend,
349675ebec11SMaxime Coquelin                      true),
34979473939eSJason Baron     DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN),
34989473939eSJason Baron     DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str),
34999711cd0dSJens Freimann     DEFINE_PROP_BOOL("failover", VirtIONet, failover, false),
350017ec5a86SKONRAD Frederic     DEFINE_PROP_END_OF_LIST(),
350117ec5a86SKONRAD Frederic };
350217ec5a86SKONRAD Frederic 
350317ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data)
350417ec5a86SKONRAD Frederic {
350517ec5a86SKONRAD Frederic     DeviceClass *dc = DEVICE_CLASS(klass);
350617ec5a86SKONRAD Frederic     VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
3507e6f746b3SAndreas Färber 
35084f67d30bSMarc-André Lureau     device_class_set_props(dc, virtio_net_properties);
3509290c2428SDr. David Alan Gilbert     dc->vmsd = &vmstate_virtio_net;
3510125ee0edSMarcel Apfelbaum     set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
3511e6f746b3SAndreas Färber     vdc->realize = virtio_net_device_realize;
3512306ec6c3SAndreas Färber     vdc->unrealize = virtio_net_device_unrealize;
351317ec5a86SKONRAD Frederic     vdc->get_config = virtio_net_get_config;
351417ec5a86SKONRAD Frederic     vdc->set_config = virtio_net_set_config;
351517ec5a86SKONRAD Frederic     vdc->get_features = virtio_net_get_features;
351617ec5a86SKONRAD Frederic     vdc->set_features = virtio_net_set_features;
351717ec5a86SKONRAD Frederic     vdc->bad_features = virtio_net_bad_features;
351817ec5a86SKONRAD Frederic     vdc->reset = virtio_net_reset;
351917ec5a86SKONRAD Frederic     vdc->set_status = virtio_net_set_status;
352017ec5a86SKONRAD Frederic     vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
352117ec5a86SKONRAD Frederic     vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
35222a083ffdSMichael S. Tsirkin     vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO);
35237788c3f2SMikhail Sennikovsky     vdc->post_load = virtio_net_post_load_virtio;
3524982b78c5SDr. David Alan Gilbert     vdc->vmsd = &vmstate_virtio_net_device;
35259711cd0dSJens Freimann     vdc->primary_unplug_pending = primary_unplug_pending;
352617ec5a86SKONRAD Frederic }
352717ec5a86SKONRAD Frederic 
352817ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = {
352917ec5a86SKONRAD Frederic     .name = TYPE_VIRTIO_NET,
353017ec5a86SKONRAD Frederic     .parent = TYPE_VIRTIO_DEVICE,
353117ec5a86SKONRAD Frederic     .instance_size = sizeof(VirtIONet),
353217ec5a86SKONRAD Frederic     .instance_init = virtio_net_instance_init,
353317ec5a86SKONRAD Frederic     .class_init = virtio_net_class_init,
353417ec5a86SKONRAD Frederic };
353517ec5a86SKONRAD Frederic 
353617ec5a86SKONRAD Frederic static void virtio_register_types(void)
353717ec5a86SKONRAD Frederic {
353817ec5a86SKONRAD Frederic     type_register_static(&virtio_net_info);
353917ec5a86SKONRAD Frederic }
354017ec5a86SKONRAD Frederic 
354117ec5a86SKONRAD Frederic type_init(virtio_register_types)
3542