xref: /openbmc/qemu/hw/net/virtio-net.c (revision e87936ea299d8204e496b5ff19ffdca46c21610e)
16e790746SPaolo Bonzini /*
26e790746SPaolo Bonzini  * Virtio Network Device
36e790746SPaolo Bonzini  *
46e790746SPaolo Bonzini  * Copyright IBM, Corp. 2007
56e790746SPaolo Bonzini  *
66e790746SPaolo Bonzini  * Authors:
76e790746SPaolo Bonzini  *  Anthony Liguori   <aliguori@us.ibm.com>
86e790746SPaolo Bonzini  *
96e790746SPaolo Bonzini  * This work is licensed under the terms of the GNU GPL, version 2.  See
106e790746SPaolo Bonzini  * the COPYING file in the top-level directory.
116e790746SPaolo Bonzini  *
126e790746SPaolo Bonzini  */
136e790746SPaolo Bonzini 
149b8bfe21SPeter Maydell #include "qemu/osdep.h"
159711cd0dSJens Freimann #include "qemu/atomic.h"
166e790746SPaolo Bonzini #include "qemu/iov.h"
17db725815SMarkus Armbruster #include "qemu/main-loop.h"
180b8fa32fSMarkus Armbruster #include "qemu/module.h"
196e790746SPaolo Bonzini #include "hw/virtio/virtio.h"
206e790746SPaolo Bonzini #include "net/net.h"
216e790746SPaolo Bonzini #include "net/checksum.h"
226e790746SPaolo Bonzini #include "net/tap.h"
236e790746SPaolo Bonzini #include "qemu/error-report.h"
246e790746SPaolo Bonzini #include "qemu/timer.h"
259711cd0dSJens Freimann #include "qemu/option.h"
269711cd0dSJens Freimann #include "qemu/option_int.h"
279711cd0dSJens Freimann #include "qemu/config-file.h"
289711cd0dSJens Freimann #include "qapi/qmp/qdict.h"
296e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h"
306e790746SPaolo Bonzini #include "net/vhost_net.h"
319d8c6a25SDr. David Alan Gilbert #include "net/announce.h"
3217ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h"
33e688df6bSMarkus Armbruster #include "qapi/error.h"
349af23989SMarkus Armbruster #include "qapi/qapi-events-net.h"
35a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h"
369711cd0dSJens Freimann #include "qapi/qapi-types-migration.h"
379711cd0dSJens Freimann #include "qapi/qapi-events-migration.h"
381399c60dSRusty Russell #include "hw/virtio/virtio-access.h"
39f8d806c9SJuan Quintela #include "migration/misc.h"
409473939eSJason Baron #include "standard-headers/linux/ethtool.h"
412f780b6aSMarkus Armbruster #include "sysemu/sysemu.h"
429d8c6a25SDr. David Alan Gilbert #include "trace.h"
439711cd0dSJens Freimann #include "monitor/qdev.h"
449711cd0dSJens Freimann #include "hw/pci/pci.h"
454474e37aSYuri Benditovich #include "net_rx_pkt.h"
46108a6481SCindy Lu #include "hw/virtio/vhost.h"
476e790746SPaolo Bonzini 
486e790746SPaolo Bonzini #define VIRTIO_NET_VM_VERSION    11
496e790746SPaolo Bonzini 
506e790746SPaolo Bonzini #define MAC_TABLE_ENTRIES    64
516e790746SPaolo Bonzini #define MAX_VLAN    (1 << 12)   /* Per 802.1Q definition */
526e790746SPaolo Bonzini 
531c0fbfa3SMichael S. Tsirkin /* previously fixed value */
541c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256
559b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256
569b02e161SWei Wang 
571c0fbfa3SMichael S. Tsirkin /* for now, only allow larger queues; with virtio-1, guest can downsize */
581c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
599b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE
601c0fbfa3SMichael S. Tsirkin 
612974e916SYuri Benditovich #define VIRTIO_NET_IP4_ADDR_SIZE   8        /* ipv4 saddr + daddr */
622974e916SYuri Benditovich 
632974e916SYuri Benditovich #define VIRTIO_NET_TCP_FLAG         0x3F
642974e916SYuri Benditovich #define VIRTIO_NET_TCP_HDR_LENGTH   0xF000
652974e916SYuri Benditovich 
662974e916SYuri Benditovich /* IPv4 max payload, 16 bits in the header */
672974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header))
682974e916SYuri Benditovich #define VIRTIO_NET_MAX_TCP_PAYLOAD 65535
692974e916SYuri Benditovich 
702974e916SYuri Benditovich /* header length value in ip header without option */
712974e916SYuri Benditovich #define VIRTIO_NET_IP4_HEADER_LENGTH 5
722974e916SYuri Benditovich 
732974e916SYuri Benditovich #define VIRTIO_NET_IP6_ADDR_SIZE   32      /* ipv6 saddr + daddr */
742974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD
752974e916SYuri Benditovich 
/*
 * Purge timer interval for coalesced packets.  This value affects performance
 * a lot and should be tuned carefully: '300000' (300us) is the recommended
 * value to pass the WHQL test, while '50000' can gain 2x netperf throughput
 * with tso/gso/gro 'off'.
 */
802974e916SYuri Benditovich #define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000
812974e916SYuri Benditovich 
8259079029SYuri Benditovich #define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \
8359079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \
8459079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \
8559079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \
8659079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \
8759079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \
8859079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \
8959079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \
9059079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_UDP_EX)
9159079029SYuri Benditovich 
926e790746SPaolo Bonzini static VirtIOFeature feature_sizes[] = {
93127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MAC,
945d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mac)},
95127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_STATUS,
965d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, status)},
97127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MQ,
985d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
99127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MTU,
1005d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mtu)},
1019473939eSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX,
1025d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, duplex)},
103e22f0603SYuri Benditovich     {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT),
10459079029SYuri Benditovich      .end = endof(struct virtio_net_config, supported_hash_types)},
1056e790746SPaolo Bonzini     {}
1066e790746SPaolo Bonzini };
1076e790746SPaolo Bonzini 
1086e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
1096e790746SPaolo Bonzini {
1106e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1116e790746SPaolo Bonzini 
1126e790746SPaolo Bonzini     return &n->vqs[nc->queue_index];
1136e790746SPaolo Bonzini }
1146e790746SPaolo Bonzini 
/*
 * Convert a virtqueue index into a queue index by halving it
 * (integer division, truncating toward zero).
 */
static int vq2q(int queue_index)
{
    const int divisor = 2;

    return queue_index / divisor;
}
1196e790746SPaolo Bonzini 
1206e790746SPaolo Bonzini /* TODO
1216e790746SPaolo Bonzini  * - we could suppress RX interrupt if we were so inclined.
1226e790746SPaolo Bonzini  */
1236e790746SPaolo Bonzini 
1246e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
1256e790746SPaolo Bonzini {
12617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1276e790746SPaolo Bonzini     struct virtio_net_config netcfg;
128c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
1296e790746SPaolo Bonzini 
130108a6481SCindy Lu     int ret = 0;
131108a6481SCindy Lu     memset(&netcfg, 0 , sizeof(struct virtio_net_config));
1321399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.status, n->status);
1331399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queues);
134a93e599dSMaxime Coquelin     virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu);
1356e790746SPaolo Bonzini     memcpy(netcfg.mac, n->mac, ETH_ALEN);
1369473939eSJason Baron     virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed);
1379473939eSJason Baron     netcfg.duplex = n->net_conf.duplex;
13859079029SYuri Benditovich     netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE;
13959079029SYuri Benditovich     virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length,
140e22f0603SYuri Benditovich                  virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ?
141e22f0603SYuri Benditovich                  VIRTIO_NET_RSS_MAX_TABLE_LEN : 1);
14259079029SYuri Benditovich     virtio_stl_p(vdev, &netcfg.supported_hash_types,
14359079029SYuri Benditovich                  VIRTIO_NET_RSS_SUPPORTED_HASHES);
1446e790746SPaolo Bonzini     memcpy(config, &netcfg, n->config_size);
145108a6481SCindy Lu 
146c546ecf2SJason Wang     /*
147c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
148c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
149c546ecf2SJason Wang      */
150c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
151108a6481SCindy Lu         ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg,
152108a6481SCindy Lu                                    n->config_size);
153108a6481SCindy Lu         if (ret != -1) {
154108a6481SCindy Lu             memcpy(config, &netcfg, n->config_size);
155108a6481SCindy Lu         }
156108a6481SCindy Lu     }
1576e790746SPaolo Bonzini }
1586e790746SPaolo Bonzini 
1596e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
1606e790746SPaolo Bonzini {
16117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1626e790746SPaolo Bonzini     struct virtio_net_config netcfg = {};
163c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
1646e790746SPaolo Bonzini 
1656e790746SPaolo Bonzini     memcpy(&netcfg, config, n->config_size);
1666e790746SPaolo Bonzini 
16795129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) &&
16895129d6fSCornelia Huck         !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) &&
1696e790746SPaolo Bonzini         memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
1706e790746SPaolo Bonzini         memcpy(n->mac, netcfg.mac, ETH_ALEN);
1716e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1726e790746SPaolo Bonzini     }
173108a6481SCindy Lu 
174c546ecf2SJason Wang     /*
175c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
176c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
177c546ecf2SJason Wang      */
178c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
179c546ecf2SJason Wang         vhost_net_set_config(get_vhost_net(nc->peer),
180c546ecf2SJason Wang                              (uint8_t *)&netcfg, 0, n->config_size,
181108a6481SCindy Lu                              VHOST_SET_CONFIG_TYPE_MASTER);
182108a6481SCindy Lu       }
1836e790746SPaolo Bonzini }
1846e790746SPaolo Bonzini 
1856e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status)
1866e790746SPaolo Bonzini {
18717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1886e790746SPaolo Bonzini     return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
18917a0ca55SKONRAD Frederic         (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
1906e790746SPaolo Bonzini }
1916e790746SPaolo Bonzini 
192b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net)
193b2c929f0SDr. David Alan Gilbert {
194b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(net);
195b2c929f0SDr. David Alan Gilbert     trace_virtio_net_announce_notify();
196b2c929f0SDr. David Alan Gilbert 
197b2c929f0SDr. David Alan Gilbert     net->status |= VIRTIO_NET_S_ANNOUNCE;
198b2c929f0SDr. David Alan Gilbert     virtio_notify_config(vdev);
199b2c929f0SDr. David Alan Gilbert }
200b2c929f0SDr. David Alan Gilbert 
201f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque)
202f57fcf70SJason Wang {
203f57fcf70SJason Wang     VirtIONet *n = opaque;
2049d8c6a25SDr. David Alan Gilbert     trace_virtio_net_announce_timer(n->announce_timer.round);
205f57fcf70SJason Wang 
2069d8c6a25SDr. David Alan Gilbert     n->announce_timer.round--;
207b2c929f0SDr. David Alan Gilbert     virtio_net_announce_notify(n);
208b2c929f0SDr. David Alan Gilbert }
209b2c929f0SDr. David Alan Gilbert 
210b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc)
211b2c929f0SDr. David Alan Gilbert {
212b2c929f0SDr. David Alan Gilbert     VirtIONet *n = qemu_get_nic_opaque(nc);
213b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
214b2c929f0SDr. David Alan Gilbert 
215b2c929f0SDr. David Alan Gilbert     /*
216b2c929f0SDr. David Alan Gilbert      * Make sure the virtio migration announcement timer isn't running
217b2c929f0SDr. David Alan Gilbert      * If it is, let it trigger announcement so that we do not cause
218b2c929f0SDr. David Alan Gilbert      * confusion.
219b2c929f0SDr. David Alan Gilbert      */
220b2c929f0SDr. David Alan Gilbert     if (n->announce_timer.round) {
221b2c929f0SDr. David Alan Gilbert         return;
222b2c929f0SDr. David Alan Gilbert     }
223b2c929f0SDr. David Alan Gilbert 
224b2c929f0SDr. David Alan Gilbert     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
225b2c929f0SDr. David Alan Gilbert         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
226b2c929f0SDr. David Alan Gilbert             virtio_net_announce_notify(n);
227b2c929f0SDr. David Alan Gilbert     }
228f57fcf70SJason Wang }
229f57fcf70SJason Wang 
2306e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
2316e790746SPaolo Bonzini {
23217a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2336e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
2346e790746SPaolo Bonzini     int queues = n->multiqueue ? n->max_queues : 1;
2356e790746SPaolo Bonzini 
236ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
2376e790746SPaolo Bonzini         return;
2386e790746SPaolo Bonzini     }
2396e790746SPaolo Bonzini 
2408c1ac475SRadim Krčmář     if ((virtio_net_started(n, status) && !nc->peer->link_down) ==
2418c1ac475SRadim Krčmář         !!n->vhost_started) {
2426e790746SPaolo Bonzini         return;
2436e790746SPaolo Bonzini     }
2446e790746SPaolo Bonzini     if (!n->vhost_started) {
245086abc1cSMichael S. Tsirkin         int r, i;
246086abc1cSMichael S. Tsirkin 
2471bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
2481bfa316cSGreg Kurz             error_report("backend does not support %s vnet headers; "
2491bfa316cSGreg Kurz                          "falling back on userspace virtio",
2501bfa316cSGreg Kurz                          virtio_is_big_endian(vdev) ? "BE" : "LE");
2511bfa316cSGreg Kurz             return;
2521bfa316cSGreg Kurz         }
2531bfa316cSGreg Kurz 
254086abc1cSMichael S. Tsirkin         /* Any packets outstanding? Purge them to avoid touching rings
255086abc1cSMichael S. Tsirkin          * when vhost is running.
256086abc1cSMichael S. Tsirkin          */
257086abc1cSMichael S. Tsirkin         for (i = 0;  i < queues; i++) {
258086abc1cSMichael S. Tsirkin             NetClientState *qnc = qemu_get_subqueue(n->nic, i);
259086abc1cSMichael S. Tsirkin 
260086abc1cSMichael S. Tsirkin             /* Purge both directions: TX and RX. */
261086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->peer->incoming_queue, qnc);
262086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->incoming_queue, qnc->peer);
263086abc1cSMichael S. Tsirkin         }
264086abc1cSMichael S. Tsirkin 
265a93e599dSMaxime Coquelin         if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) {
266a93e599dSMaxime Coquelin             r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu);
267a93e599dSMaxime Coquelin             if (r < 0) {
268a93e599dSMaxime Coquelin                 error_report("%uBytes MTU not supported by the backend",
269a93e599dSMaxime Coquelin                              n->net_conf.mtu);
270a93e599dSMaxime Coquelin 
271a93e599dSMaxime Coquelin                 return;
272a93e599dSMaxime Coquelin             }
273a93e599dSMaxime Coquelin         }
274a93e599dSMaxime Coquelin 
2756e790746SPaolo Bonzini         n->vhost_started = 1;
27617a0ca55SKONRAD Frederic         r = vhost_net_start(vdev, n->nic->ncs, queues);
2776e790746SPaolo Bonzini         if (r < 0) {
2786e790746SPaolo Bonzini             error_report("unable to start vhost net: %d: "
2796e790746SPaolo Bonzini                          "falling back on userspace virtio", -r);
2806e790746SPaolo Bonzini             n->vhost_started = 0;
2816e790746SPaolo Bonzini         }
2826e790746SPaolo Bonzini     } else {
28317a0ca55SKONRAD Frederic         vhost_net_stop(vdev, n->nic->ncs, queues);
2846e790746SPaolo Bonzini         n->vhost_started = 0;
2856e790746SPaolo Bonzini     }
2866e790746SPaolo Bonzini }
2876e790746SPaolo Bonzini 
2881bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev,
2891bfa316cSGreg Kurz                                           NetClientState *peer,
2901bfa316cSGreg Kurz                                           bool enable)
2911bfa316cSGreg Kurz {
2921bfa316cSGreg Kurz     if (virtio_is_big_endian(vdev)) {
2931bfa316cSGreg Kurz         return qemu_set_vnet_be(peer, enable);
2941bfa316cSGreg Kurz     } else {
2951bfa316cSGreg Kurz         return qemu_set_vnet_le(peer, enable);
2961bfa316cSGreg Kurz     }
2971bfa316cSGreg Kurz }
2981bfa316cSGreg Kurz 
2991bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs,
3001bfa316cSGreg Kurz                                        int queues, bool enable)
3011bfa316cSGreg Kurz {
3021bfa316cSGreg Kurz     int i;
3031bfa316cSGreg Kurz 
3041bfa316cSGreg Kurz     for (i = 0; i < queues; i++) {
3051bfa316cSGreg Kurz         if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 &&
3061bfa316cSGreg Kurz             enable) {
3071bfa316cSGreg Kurz             while (--i >= 0) {
3081bfa316cSGreg Kurz                 virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false);
3091bfa316cSGreg Kurz             }
3101bfa316cSGreg Kurz 
3111bfa316cSGreg Kurz             return true;
3121bfa316cSGreg Kurz         }
3131bfa316cSGreg Kurz     }
3141bfa316cSGreg Kurz 
3151bfa316cSGreg Kurz     return false;
3161bfa316cSGreg Kurz }
3171bfa316cSGreg Kurz 
3181bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status)
3191bfa316cSGreg Kurz {
3201bfa316cSGreg Kurz     VirtIODevice *vdev = VIRTIO_DEVICE(n);
3211bfa316cSGreg Kurz     int queues = n->multiqueue ? n->max_queues : 1;
3221bfa316cSGreg Kurz 
3231bfa316cSGreg Kurz     if (virtio_net_started(n, status)) {
3241bfa316cSGreg Kurz         /* Before using the device, we tell the network backend about the
3251bfa316cSGreg Kurz          * endianness to use when parsing vnet headers. If the backend
3261bfa316cSGreg Kurz          * can't do it, we fallback onto fixing the headers in the core
3271bfa316cSGreg Kurz          * virtio-net code.
3281bfa316cSGreg Kurz          */
3291bfa316cSGreg Kurz         n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs,
3301bfa316cSGreg Kurz                                                             queues, true);
3311bfa316cSGreg Kurz     } else if (virtio_net_started(n, vdev->status)) {
3321bfa316cSGreg Kurz         /* After using the device, we need to reset the network backend to
3331bfa316cSGreg Kurz          * the default (guest native endianness), otherwise the guest may
3341bfa316cSGreg Kurz          * lose network connectivity if it is rebooted into a different
3351bfa316cSGreg Kurz          * endianness.
3361bfa316cSGreg Kurz          */
3371bfa316cSGreg Kurz         virtio_net_set_vnet_endian(vdev, n->nic->ncs, queues, false);
3381bfa316cSGreg Kurz     }
3391bfa316cSGreg Kurz }
3401bfa316cSGreg Kurz 
341283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq)
342283e2c2aSYuri Benditovich {
343283e2c2aSYuri Benditovich     unsigned int dropped = virtqueue_drop_all(vq);
344283e2c2aSYuri Benditovich     if (dropped) {
345283e2c2aSYuri Benditovich         virtio_notify(vdev, vq);
346283e2c2aSYuri Benditovich     }
347283e2c2aSYuri Benditovich }
348283e2c2aSYuri Benditovich 
3496e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
3506e790746SPaolo Bonzini {
35117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
3526e790746SPaolo Bonzini     VirtIONetQueue *q;
3536e790746SPaolo Bonzini     int i;
3546e790746SPaolo Bonzini     uint8_t queue_status;
3556e790746SPaolo Bonzini 
3561bfa316cSGreg Kurz     virtio_net_vnet_endian_status(n, status);
3576e790746SPaolo Bonzini     virtio_net_vhost_status(n, status);
3586e790746SPaolo Bonzini 
3596e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
36038705bb5SFam Zheng         NetClientState *ncs = qemu_get_subqueue(n->nic, i);
36138705bb5SFam Zheng         bool queue_started;
3626e790746SPaolo Bonzini         q = &n->vqs[i];
3636e790746SPaolo Bonzini 
3646e790746SPaolo Bonzini         if ((!n->multiqueue && i != 0) || i >= n->curr_queues) {
3656e790746SPaolo Bonzini             queue_status = 0;
3666e790746SPaolo Bonzini         } else {
3676e790746SPaolo Bonzini             queue_status = status;
3686e790746SPaolo Bonzini         }
36938705bb5SFam Zheng         queue_started =
37038705bb5SFam Zheng             virtio_net_started(n, queue_status) && !n->vhost_started;
37138705bb5SFam Zheng 
37238705bb5SFam Zheng         if (queue_started) {
37338705bb5SFam Zheng             qemu_flush_queued_packets(ncs);
37438705bb5SFam Zheng         }
3756e790746SPaolo Bonzini 
3766e790746SPaolo Bonzini         if (!q->tx_waiting) {
3776e790746SPaolo Bonzini             continue;
3786e790746SPaolo Bonzini         }
3796e790746SPaolo Bonzini 
38038705bb5SFam Zheng         if (queue_started) {
3816e790746SPaolo Bonzini             if (q->tx_timer) {
382bc72ad67SAlex Bligh                 timer_mod(q->tx_timer,
383bc72ad67SAlex Bligh                                qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
3846e790746SPaolo Bonzini             } else {
3856e790746SPaolo Bonzini                 qemu_bh_schedule(q->tx_bh);
3866e790746SPaolo Bonzini             }
3876e790746SPaolo Bonzini         } else {
3886e790746SPaolo Bonzini             if (q->tx_timer) {
389bc72ad67SAlex Bligh                 timer_del(q->tx_timer);
3906e790746SPaolo Bonzini             } else {
3916e790746SPaolo Bonzini                 qemu_bh_cancel(q->tx_bh);
3926e790746SPaolo Bonzini             }
393283e2c2aSYuri Benditovich             if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 &&
39470e53e6eSJason Wang                 (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) &&
39570e53e6eSJason Wang                 vdev->vm_running) {
396283e2c2aSYuri Benditovich                 /* if tx is waiting we are likely have some packets in tx queue
397283e2c2aSYuri Benditovich                  * and disabled notification */
398283e2c2aSYuri Benditovich                 q->tx_waiting = 0;
399283e2c2aSYuri Benditovich                 virtio_queue_set_notification(q->tx_vq, 1);
400283e2c2aSYuri Benditovich                 virtio_net_drop_tx_queue_data(vdev, q->tx_vq);
401283e2c2aSYuri Benditovich             }
4026e790746SPaolo Bonzini         }
4036e790746SPaolo Bonzini     }
4046e790746SPaolo Bonzini }
4056e790746SPaolo Bonzini 
4066e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc)
4076e790746SPaolo Bonzini {
4086e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
40917a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
4106e790746SPaolo Bonzini     uint16_t old_status = n->status;
4116e790746SPaolo Bonzini 
4126e790746SPaolo Bonzini     if (nc->link_down)
4136e790746SPaolo Bonzini         n->status &= ~VIRTIO_NET_S_LINK_UP;
4146e790746SPaolo Bonzini     else
4156e790746SPaolo Bonzini         n->status |= VIRTIO_NET_S_LINK_UP;
4166e790746SPaolo Bonzini 
4176e790746SPaolo Bonzini     if (n->status != old_status)
41817a0ca55SKONRAD Frederic         virtio_notify_config(vdev);
4196e790746SPaolo Bonzini 
42017a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
4216e790746SPaolo Bonzini }
4226e790746SPaolo Bonzini 
423b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc)
424b1be4280SAmos Kong {
425b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
426b1be4280SAmos Kong 
427b1be4280SAmos Kong     if (nc->rxfilter_notify_enabled) {
428ddfb0baaSMarkus Armbruster         char *path = object_get_canonical_path(OBJECT(n->qdev));
42906150279SWenchao Xia         qapi_event_send_nic_rx_filter_changed(!!n->netclient_name,
4303ab72385SPeter Xu                                               n->netclient_name, path);
43196e35046SAmos Kong         g_free(path);
432b1be4280SAmos Kong 
433b1be4280SAmos Kong         /* disable event notification to avoid events flooding */
434b1be4280SAmos Kong         nc->rxfilter_notify_enabled = 0;
435b1be4280SAmos Kong     }
436b1be4280SAmos Kong }
437b1be4280SAmos Kong 
438f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n)
439f7bc8ef8SAmos Kong {
440f7bc8ef8SAmos Kong     intList *list, *entry;
441f7bc8ef8SAmos Kong     int i, j;
442f7bc8ef8SAmos Kong 
443f7bc8ef8SAmos Kong     list = NULL;
444f7bc8ef8SAmos Kong     for (i = 0; i < MAX_VLAN >> 5; i++) {
445f7bc8ef8SAmos Kong         for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
446f7bc8ef8SAmos Kong             if (n->vlans[i] & (1U << j)) {
447f7bc8ef8SAmos Kong                 entry = g_malloc0(sizeof(*entry));
448f7bc8ef8SAmos Kong                 entry->value = (i << 5) + j;
449f7bc8ef8SAmos Kong                 entry->next = list;
450f7bc8ef8SAmos Kong                 list = entry;
451f7bc8ef8SAmos Kong             }
452f7bc8ef8SAmos Kong         }
453f7bc8ef8SAmos Kong     }
454f7bc8ef8SAmos Kong 
455f7bc8ef8SAmos Kong     return list;
456f7bc8ef8SAmos Kong }
457f7bc8ef8SAmos Kong 
458b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
459b1be4280SAmos Kong {
460b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
461f7bc8ef8SAmos Kong     VirtIODevice *vdev = VIRTIO_DEVICE(n);
462b1be4280SAmos Kong     RxFilterInfo *info;
463b1be4280SAmos Kong     strList *str_list, *entry;
464f7bc8ef8SAmos Kong     int i;
465b1be4280SAmos Kong 
466b1be4280SAmos Kong     info = g_malloc0(sizeof(*info));
467b1be4280SAmos Kong     info->name = g_strdup(nc->name);
468b1be4280SAmos Kong     info->promiscuous = n->promisc;
469b1be4280SAmos Kong 
470b1be4280SAmos Kong     if (n->nouni) {
471b1be4280SAmos Kong         info->unicast = RX_STATE_NONE;
472b1be4280SAmos Kong     } else if (n->alluni) {
473b1be4280SAmos Kong         info->unicast = RX_STATE_ALL;
474b1be4280SAmos Kong     } else {
475b1be4280SAmos Kong         info->unicast = RX_STATE_NORMAL;
476b1be4280SAmos Kong     }
477b1be4280SAmos Kong 
478b1be4280SAmos Kong     if (n->nomulti) {
479b1be4280SAmos Kong         info->multicast = RX_STATE_NONE;
480b1be4280SAmos Kong     } else if (n->allmulti) {
481b1be4280SAmos Kong         info->multicast = RX_STATE_ALL;
482b1be4280SAmos Kong     } else {
483b1be4280SAmos Kong         info->multicast = RX_STATE_NORMAL;
484b1be4280SAmos Kong     }
485b1be4280SAmos Kong 
486b1be4280SAmos Kong     info->broadcast_allowed = n->nobcast;
487b1be4280SAmos Kong     info->multicast_overflow = n->mac_table.multi_overflow;
488b1be4280SAmos Kong     info->unicast_overflow = n->mac_table.uni_overflow;
489b1be4280SAmos Kong 
490b0575ba4SScott Feldman     info->main_mac = qemu_mac_strdup_printf(n->mac);
491b1be4280SAmos Kong 
492b1be4280SAmos Kong     str_list = NULL;
493b1be4280SAmos Kong     for (i = 0; i < n->mac_table.first_multi; i++) {
494b1be4280SAmos Kong         entry = g_malloc0(sizeof(*entry));
495b0575ba4SScott Feldman         entry->value = qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
496b1be4280SAmos Kong         entry->next = str_list;
497b1be4280SAmos Kong         str_list = entry;
498b1be4280SAmos Kong     }
499b1be4280SAmos Kong     info->unicast_table = str_list;
500b1be4280SAmos Kong 
501b1be4280SAmos Kong     str_list = NULL;
502b1be4280SAmos Kong     for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
503b1be4280SAmos Kong         entry = g_malloc0(sizeof(*entry));
504b0575ba4SScott Feldman         entry->value = qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
505b1be4280SAmos Kong         entry->next = str_list;
506b1be4280SAmos Kong         str_list = entry;
507b1be4280SAmos Kong     }
508b1be4280SAmos Kong     info->multicast_table = str_list;
509f7bc8ef8SAmos Kong     info->vlan_table = get_vlan_table(n);
510b1be4280SAmos Kong 
51195129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) {
512f7bc8ef8SAmos Kong         info->vlan = RX_STATE_ALL;
513f7bc8ef8SAmos Kong     } else if (!info->vlan_table) {
514f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NONE;
515f7bc8ef8SAmos Kong     } else {
516f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NORMAL;
517b1be4280SAmos Kong     }
518b1be4280SAmos Kong 
519b1be4280SAmos Kong     /* enable event notification after query */
520b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
521b1be4280SAmos Kong 
522b1be4280SAmos Kong     return info;
523b1be4280SAmos Kong }
524b1be4280SAmos Kong 
5256e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev)
5266e790746SPaolo Bonzini {
52717a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
52894b52958SGreg Kurz     int i;
5296e790746SPaolo Bonzini 
5306e790746SPaolo Bonzini     /* Reset back to compatibility mode */
5316e790746SPaolo Bonzini     n->promisc = 1;
5326e790746SPaolo Bonzini     n->allmulti = 0;
5336e790746SPaolo Bonzini     n->alluni = 0;
5346e790746SPaolo Bonzini     n->nomulti = 0;
5356e790746SPaolo Bonzini     n->nouni = 0;
5366e790746SPaolo Bonzini     n->nobcast = 0;
5376e790746SPaolo Bonzini     /* multiqueue is disabled by default */
5386e790746SPaolo Bonzini     n->curr_queues = 1;
5399d8c6a25SDr. David Alan Gilbert     timer_del(n->announce_timer.tm);
5409d8c6a25SDr. David Alan Gilbert     n->announce_timer.round = 0;
541f57fcf70SJason Wang     n->status &= ~VIRTIO_NET_S_ANNOUNCE;
5426e790746SPaolo Bonzini 
5436e790746SPaolo Bonzini     /* Flush any MAC and VLAN filter table state */
5446e790746SPaolo Bonzini     n->mac_table.in_use = 0;
5456e790746SPaolo Bonzini     n->mac_table.first_multi = 0;
5466e790746SPaolo Bonzini     n->mac_table.multi_overflow = 0;
5476e790746SPaolo Bonzini     n->mac_table.uni_overflow = 0;
5486e790746SPaolo Bonzini     memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
5496e790746SPaolo Bonzini     memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
550702d66a8SMichael S. Tsirkin     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
5516e790746SPaolo Bonzini     memset(n->vlans, 0, MAX_VLAN >> 3);
55294b52958SGreg Kurz 
55394b52958SGreg Kurz     /* Flush any async TX */
55494b52958SGreg Kurz     for (i = 0;  i < n->max_queues; i++) {
55594b52958SGreg Kurz         NetClientState *nc = qemu_get_subqueue(n->nic, i);
55694b52958SGreg Kurz 
55794b52958SGreg Kurz         if (nc->peer) {
55894b52958SGreg Kurz             qemu_flush_or_purge_queued_packets(nc->peer, true);
55994b52958SGreg Kurz             assert(!virtio_net_get_subqueue(nc)->async_tx.elem);
56094b52958SGreg Kurz         }
56194b52958SGreg Kurz     }
5626e790746SPaolo Bonzini }
5636e790746SPaolo Bonzini 
5646e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n)
5656e790746SPaolo Bonzini {
5666e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
5676e790746SPaolo Bonzini     if (!nc->peer) {
5686e790746SPaolo Bonzini         return;
5696e790746SPaolo Bonzini     }
5706e790746SPaolo Bonzini 
571d6085e3aSStefan Hajnoczi     n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
5726e790746SPaolo Bonzini }
5736e790746SPaolo Bonzini 
5746e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n)
5756e790746SPaolo Bonzini {
5766e790746SPaolo Bonzini     return n->has_vnet_hdr;
5776e790746SPaolo Bonzini }
5786e790746SPaolo Bonzini 
5796e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n)
5806e790746SPaolo Bonzini {
5816e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n))
5826e790746SPaolo Bonzini         return 0;
5836e790746SPaolo Bonzini 
584d6085e3aSStefan Hajnoczi     n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
5856e790746SPaolo Bonzini 
5866e790746SPaolo Bonzini     return n->has_ufo;
5876e790746SPaolo Bonzini }
5886e790746SPaolo Bonzini 
589bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs,
590e22f0603SYuri Benditovich                                        int version_1, int hash_report)
5916e790746SPaolo Bonzini {
5926e790746SPaolo Bonzini     int i;
5936e790746SPaolo Bonzini     NetClientState *nc;
5946e790746SPaolo Bonzini 
5956e790746SPaolo Bonzini     n->mergeable_rx_bufs = mergeable_rx_bufs;
5966e790746SPaolo Bonzini 
597bb9d17f8SCornelia Huck     if (version_1) {
598e22f0603SYuri Benditovich         n->guest_hdr_len = hash_report ?
599e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_v1_hash) :
600e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_mrg_rxbuf);
601e22f0603SYuri Benditovich         n->rss_data.populate_hash = !!hash_report;
602bb9d17f8SCornelia Huck     } else {
6036e790746SPaolo Bonzini         n->guest_hdr_len = n->mergeable_rx_bufs ?
604bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr_mrg_rxbuf) :
605bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr);
606bb9d17f8SCornelia Huck     }
6076e790746SPaolo Bonzini 
6086e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
6096e790746SPaolo Bonzini         nc = qemu_get_subqueue(n->nic, i);
6106e790746SPaolo Bonzini 
6116e790746SPaolo Bonzini         if (peer_has_vnet_hdr(n) &&
612d6085e3aSStefan Hajnoczi             qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
613d6085e3aSStefan Hajnoczi             qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
6146e790746SPaolo Bonzini             n->host_hdr_len = n->guest_hdr_len;
6156e790746SPaolo Bonzini         }
6166e790746SPaolo Bonzini     }
6176e790746SPaolo Bonzini }
6186e790746SPaolo Bonzini 
6192eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n)
6202eef278bSMichael S. Tsirkin {
6212eef278bSMichael S. Tsirkin     NetClientState *peer = n->nic_conf.peers.ncs[0];
6222eef278bSMichael S. Tsirkin 
6232eef278bSMichael S. Tsirkin     /*
6242eef278bSMichael S. Tsirkin      * Backends other than vhost-user don't support max queue size.
6252eef278bSMichael S. Tsirkin      */
6262eef278bSMichael S. Tsirkin     if (!peer) {
6272eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6282eef278bSMichael S. Tsirkin     }
6292eef278bSMichael S. Tsirkin 
6302eef278bSMichael S. Tsirkin     if (peer->info->type != NET_CLIENT_DRIVER_VHOST_USER) {
6312eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6322eef278bSMichael S. Tsirkin     }
6332eef278bSMichael S. Tsirkin 
6342eef278bSMichael S. Tsirkin     return VIRTQUEUE_MAX_SIZE;
6352eef278bSMichael S. Tsirkin }
6362eef278bSMichael S. Tsirkin 
6376e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index)
6386e790746SPaolo Bonzini {
6396e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6406e790746SPaolo Bonzini 
6416e790746SPaolo Bonzini     if (!nc->peer) {
6426e790746SPaolo Bonzini         return 0;
6436e790746SPaolo Bonzini     }
6446e790746SPaolo Bonzini 
645f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6467263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 1);
6477263a0adSChangchun Ouyang     }
6487263a0adSChangchun Ouyang 
649f394b2e2SEric Blake     if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
6506e790746SPaolo Bonzini         return 0;
6516e790746SPaolo Bonzini     }
6526e790746SPaolo Bonzini 
6531074b879SJason Wang     if (n->max_queues == 1) {
6541074b879SJason Wang         return 0;
6551074b879SJason Wang     }
6561074b879SJason Wang 
6576e790746SPaolo Bonzini     return tap_enable(nc->peer);
6586e790746SPaolo Bonzini }
6596e790746SPaolo Bonzini 
6606e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index)
6616e790746SPaolo Bonzini {
6626e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6636e790746SPaolo Bonzini 
6646e790746SPaolo Bonzini     if (!nc->peer) {
6656e790746SPaolo Bonzini         return 0;
6666e790746SPaolo Bonzini     }
6676e790746SPaolo Bonzini 
668f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6697263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 0);
6707263a0adSChangchun Ouyang     }
6717263a0adSChangchun Ouyang 
672f394b2e2SEric Blake     if (nc->peer->info->type !=  NET_CLIENT_DRIVER_TAP) {
6736e790746SPaolo Bonzini         return 0;
6746e790746SPaolo Bonzini     }
6756e790746SPaolo Bonzini 
6766e790746SPaolo Bonzini     return tap_disable(nc->peer);
6776e790746SPaolo Bonzini }
6786e790746SPaolo Bonzini 
6796e790746SPaolo Bonzini static void virtio_net_set_queues(VirtIONet *n)
6806e790746SPaolo Bonzini {
6816e790746SPaolo Bonzini     int i;
682ddfa83eaSJoel Stanley     int r;
6836e790746SPaolo Bonzini 
68468b5f314SYuri Benditovich     if (n->nic->peer_deleted) {
68568b5f314SYuri Benditovich         return;
68668b5f314SYuri Benditovich     }
68768b5f314SYuri Benditovich 
6886e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
6896e790746SPaolo Bonzini         if (i < n->curr_queues) {
690ddfa83eaSJoel Stanley             r = peer_attach(n, i);
691ddfa83eaSJoel Stanley             assert(!r);
6926e790746SPaolo Bonzini         } else {
693ddfa83eaSJoel Stanley             r = peer_detach(n, i);
694ddfa83eaSJoel Stanley             assert(!r);
6956e790746SPaolo Bonzini         }
6966e790746SPaolo Bonzini     }
6976e790746SPaolo Bonzini }
6986e790746SPaolo Bonzini 
699ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
7006e790746SPaolo Bonzini 
7019d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features,
7029d5b731dSJason Wang                                         Error **errp)
7036e790746SPaolo Bonzini {
70417a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
7056e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
7066e790746SPaolo Bonzini 
707da3e8a23SShannon Zhao     /* Firstly sync all virtio-net possible supported features */
708da3e8a23SShannon Zhao     features |= n->host_features;
709da3e8a23SShannon Zhao 
7100cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7116e790746SPaolo Bonzini 
7126e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n)) {
7130cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_CSUM);
7140cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7150cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7160cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN);
7176e790746SPaolo Bonzini 
7180cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM);
7190cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4);
7200cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6);
7210cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN);
722e22f0603SYuri Benditovich 
723e22f0603SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
7246e790746SPaolo Bonzini     }
7256e790746SPaolo Bonzini 
7266e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
7270cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO);
7280cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO);
7296e790746SPaolo Bonzini     }
7306e790746SPaolo Bonzini 
731ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
7326e790746SPaolo Bonzini         return features;
7336e790746SPaolo Bonzini     }
7342974e916SYuri Benditovich 
73559079029SYuri Benditovich     virtio_clear_feature(&features, VIRTIO_NET_F_RSS);
736e22f0603SYuri Benditovich     virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
73775ebec11SMaxime Coquelin     features = vhost_net_get_features(get_vhost_net(nc->peer), features);
73875ebec11SMaxime Coquelin     vdev->backend_features = features;
73975ebec11SMaxime Coquelin 
74075ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
74175ebec11SMaxime Coquelin             (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) {
74275ebec11SMaxime Coquelin         features |= (1ULL << VIRTIO_NET_F_MTU);
74375ebec11SMaxime Coquelin     }
74475ebec11SMaxime Coquelin 
74575ebec11SMaxime Coquelin     return features;
7466e790746SPaolo Bonzini }
7476e790746SPaolo Bonzini 
748019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev)
7496e790746SPaolo Bonzini {
750019a3edbSGerd Hoffmann     uint64_t features = 0;
7516e790746SPaolo Bonzini 
7526e790746SPaolo Bonzini     /* Linux kernel 2.6.25.  It understood MAC (as everyone must),
7536e790746SPaolo Bonzini      * but also these: */
7540cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7550cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_CSUM);
7560cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7570cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7580cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN);
7596e790746SPaolo Bonzini 
7606e790746SPaolo Bonzini     return features;
7616e790746SPaolo Bonzini }
7626e790746SPaolo Bonzini 
763644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n)
764644c9858SDmitry Fleytman {
765ad37bb3bSStefan Hajnoczi     qemu_set_offload(qemu_get_queue(n->nic)->peer,
766644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
767644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
768644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
769644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
770644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
771644c9858SDmitry Fleytman }
772644c9858SDmitry Fleytman 
773644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
774644c9858SDmitry Fleytman {
775644c9858SDmitry Fleytman     static const uint64_t guest_offloads_mask =
776644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
777644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
778644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
779644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_ECN)  |
780644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_UFO);
781644c9858SDmitry Fleytman 
782644c9858SDmitry Fleytman     return guest_offloads_mask & features;
783644c9858SDmitry Fleytman }
784644c9858SDmitry Fleytman 
785644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
786644c9858SDmitry Fleytman {
787644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
788644c9858SDmitry Fleytman     return virtio_net_guest_offloads_by_features(vdev->guest_features);
789644c9858SDmitry Fleytman }
790644c9858SDmitry Fleytman 
7919711cd0dSJens Freimann static void failover_add_primary(VirtIONet *n, Error **errp)
7929711cd0dSJens Freimann {
7939711cd0dSJens Freimann     Error *err = NULL;
7949711cd0dSJens Freimann 
795117378bfSJens Freimann     if (n->primary_dev) {
796117378bfSJens Freimann         return;
797117378bfSJens Freimann     }
798117378bfSJens Freimann 
7999711cd0dSJens Freimann     n->primary_device_opts = qemu_opts_find(qemu_find_opts("device"),
8009711cd0dSJens Freimann             n->primary_device_id);
8019711cd0dSJens Freimann     if (n->primary_device_opts) {
8029711cd0dSJens Freimann         n->primary_dev = qdev_device_add(n->primary_device_opts, &err);
8039711cd0dSJens Freimann         if (err) {
8049711cd0dSJens Freimann             qemu_opts_del(n->primary_device_opts);
8059711cd0dSJens Freimann         }
8069711cd0dSJens Freimann         if (n->primary_dev) {
8079711cd0dSJens Freimann             n->primary_bus = n->primary_dev->parent_bus;
8089711cd0dSJens Freimann             if (err) {
8099711cd0dSJens Freimann                 qdev_unplug(n->primary_dev, &err);
8109711cd0dSJens Freimann                 qdev_set_id(n->primary_dev, "");
8119711cd0dSJens Freimann 
8129711cd0dSJens Freimann             }
8139711cd0dSJens Freimann         }
8149711cd0dSJens Freimann     } else {
8159711cd0dSJens Freimann         error_setg(errp, "Primary device not found");
8169711cd0dSJens Freimann         error_append_hint(errp, "Virtio-net failover will not work. Make "
8179711cd0dSJens Freimann             "sure primary device has parameter"
8189711cd0dSJens Freimann             " failover_pair_id=<virtio-net-id>\n");
8199711cd0dSJens Freimann }
8209711cd0dSJens Freimann     error_propagate(errp, err);
8219711cd0dSJens Freimann }
8229711cd0dSJens Freimann 
8239711cd0dSJens Freimann static int is_my_primary(void *opaque, QemuOpts *opts, Error **errp)
8249711cd0dSJens Freimann {
8259711cd0dSJens Freimann     VirtIONet *n = opaque;
8269711cd0dSJens Freimann     int ret = 0;
8279711cd0dSJens Freimann 
8289711cd0dSJens Freimann     const char *standby_id = qemu_opt_get(opts, "failover_pair_id");
8299711cd0dSJens Freimann 
8309711cd0dSJens Freimann     if (standby_id != NULL && (g_strcmp0(standby_id, n->netclient_name) == 0)) {
8319711cd0dSJens Freimann         n->primary_device_id = g_strdup(opts->id);
8329711cd0dSJens Freimann         ret = 1;
8339711cd0dSJens Freimann     }
8349711cd0dSJens Freimann 
8359711cd0dSJens Freimann     return ret;
8369711cd0dSJens Freimann }
8379711cd0dSJens Freimann 
8389711cd0dSJens Freimann static DeviceState *virtio_net_find_primary(VirtIONet *n, Error **errp)
8399711cd0dSJens Freimann {
8409711cd0dSJens Freimann     DeviceState *dev = NULL;
8419711cd0dSJens Freimann     Error *err = NULL;
8429711cd0dSJens Freimann 
8439711cd0dSJens Freimann     if (qemu_opts_foreach(qemu_find_opts("device"),
8449711cd0dSJens Freimann                          is_my_primary, n, &err)) {
8459711cd0dSJens Freimann         if (err) {
8469711cd0dSJens Freimann             error_propagate(errp, err);
8479711cd0dSJens Freimann             return NULL;
8489711cd0dSJens Freimann         }
8499711cd0dSJens Freimann         if (n->primary_device_id) {
8509711cd0dSJens Freimann             dev = qdev_find_recursive(sysbus_get_default(),
8519711cd0dSJens Freimann                     n->primary_device_id);
8529711cd0dSJens Freimann         } else {
8539711cd0dSJens Freimann             error_setg(errp, "Primary device id not found");
8549711cd0dSJens Freimann             return NULL;
8559711cd0dSJens Freimann         }
8569711cd0dSJens Freimann     }
8579711cd0dSJens Freimann     return dev;
8589711cd0dSJens Freimann }
8599711cd0dSJens Freimann 
8609711cd0dSJens Freimann 
8619711cd0dSJens Freimann 
8629711cd0dSJens Freimann static DeviceState *virtio_connect_failover_devices(VirtIONet *n,
8639711cd0dSJens Freimann                                                     DeviceState *dev,
8649711cd0dSJens Freimann                                                     Error **errp)
8659711cd0dSJens Freimann {
8669711cd0dSJens Freimann     DeviceState *prim_dev = NULL;
8679711cd0dSJens Freimann     Error *err = NULL;
8689711cd0dSJens Freimann 
8699711cd0dSJens Freimann     prim_dev = virtio_net_find_primary(n, &err);
8709711cd0dSJens Freimann     if (prim_dev) {
8719711cd0dSJens Freimann         n->primary_device_id = g_strdup(prim_dev->id);
8729711cd0dSJens Freimann         n->primary_device_opts = prim_dev->opts;
8739711cd0dSJens Freimann     } else {
8749711cd0dSJens Freimann         error_propagate(errp, err);
8759711cd0dSJens Freimann     }
8769711cd0dSJens Freimann 
8779711cd0dSJens Freimann     return prim_dev;
8789711cd0dSJens Freimann }
8799711cd0dSJens Freimann 
880d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features)
8816e790746SPaolo Bonzini {
88217a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
8839711cd0dSJens Freimann     Error *err = NULL;
8846e790746SPaolo Bonzini     int i;
8856e790746SPaolo Bonzini 
88675ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
88775ebec11SMaxime Coquelin             !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) {
88875ebec11SMaxime Coquelin         features &= ~(1ULL << VIRTIO_NET_F_MTU);
88975ebec11SMaxime Coquelin     }
89075ebec11SMaxime Coquelin 
891ef546f12SCornelia Huck     virtio_net_set_multiqueue(n,
89259079029SYuri Benditovich                               virtio_has_feature(features, VIRTIO_NET_F_RSS) ||
89395129d6fSCornelia Huck                               virtio_has_feature(features, VIRTIO_NET_F_MQ));
8946e790746SPaolo Bonzini 
895ef546f12SCornelia Huck     virtio_net_set_mrg_rx_bufs(n,
89695129d6fSCornelia Huck                                virtio_has_feature(features,
897bb9d17f8SCornelia Huck                                                   VIRTIO_NET_F_MRG_RXBUF),
89895129d6fSCornelia Huck                                virtio_has_feature(features,
899e22f0603SYuri Benditovich                                                   VIRTIO_F_VERSION_1),
900e22f0603SYuri Benditovich                                virtio_has_feature(features,
901e22f0603SYuri Benditovich                                                   VIRTIO_NET_F_HASH_REPORT));
9026e790746SPaolo Bonzini 
9032974e916SYuri Benditovich     n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9042974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4);
9052974e916SYuri Benditovich     n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9062974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6);
907e22f0603SYuri Benditovich     n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS);
9082974e916SYuri Benditovich 
9096e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
910644c9858SDmitry Fleytman         n->curr_guest_offloads =
911644c9858SDmitry Fleytman             virtio_net_guest_offloads_by_features(features);
912644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
9136e790746SPaolo Bonzini     }
9146e790746SPaolo Bonzini 
9156e790746SPaolo Bonzini     for (i = 0;  i < n->max_queues; i++) {
9166e790746SPaolo Bonzini         NetClientState *nc = qemu_get_subqueue(n->nic, i);
9176e790746SPaolo Bonzini 
918ed8b4afeSNikolay Nikolaev         if (!get_vhost_net(nc->peer)) {
9196e790746SPaolo Bonzini             continue;
9206e790746SPaolo Bonzini         }
921ed8b4afeSNikolay Nikolaev         vhost_net_ack_features(get_vhost_net(nc->peer), features);
9226e790746SPaolo Bonzini     }
9230b1eaa88SStefan Fritsch 
92495129d6fSCornelia Huck     if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) {
9250b1eaa88SStefan Fritsch         memset(n->vlans, 0, MAX_VLAN >> 3);
9260b1eaa88SStefan Fritsch     } else {
9270b1eaa88SStefan Fritsch         memset(n->vlans, 0xff, MAX_VLAN >> 3);
9280b1eaa88SStefan Fritsch     }
9299711cd0dSJens Freimann 
9309711cd0dSJens Freimann     if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) {
9319711cd0dSJens Freimann         qapi_event_send_failover_negotiated(n->netclient_name);
932d73415a3SStefan Hajnoczi         qatomic_set(&n->primary_should_be_hidden, false);
9339711cd0dSJens Freimann         failover_add_primary(n, &err);
9349711cd0dSJens Freimann         if (err) {
9359711cd0dSJens Freimann             n->primary_dev = virtio_connect_failover_devices(n, n->qdev, &err);
9369711cd0dSJens Freimann             if (err) {
9379711cd0dSJens Freimann                 goto out_err;
9389711cd0dSJens Freimann             }
9399711cd0dSJens Freimann             failover_add_primary(n, &err);
9409711cd0dSJens Freimann             if (err) {
9419711cd0dSJens Freimann                 goto out_err;
9429711cd0dSJens Freimann             }
9439711cd0dSJens Freimann         }
9449711cd0dSJens Freimann     }
9459711cd0dSJens Freimann     return;
9469711cd0dSJens Freimann 
9479711cd0dSJens Freimann out_err:
9489711cd0dSJens Freimann     if (err) {
9499711cd0dSJens Freimann         warn_report_err(err);
9509711cd0dSJens Freimann     }
9516e790746SPaolo Bonzini }
9526e790746SPaolo Bonzini 
9536e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
9546e790746SPaolo Bonzini                                      struct iovec *iov, unsigned int iov_cnt)
9556e790746SPaolo Bonzini {
9566e790746SPaolo Bonzini     uint8_t on;
9576e790746SPaolo Bonzini     size_t s;
958b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
9596e790746SPaolo Bonzini 
9606e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
9616e790746SPaolo Bonzini     if (s != sizeof(on)) {
9626e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9636e790746SPaolo Bonzini     }
9646e790746SPaolo Bonzini 
9656e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
9666e790746SPaolo Bonzini         n->promisc = on;
9676e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
9686e790746SPaolo Bonzini         n->allmulti = on;
9696e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
9706e790746SPaolo Bonzini         n->alluni = on;
9716e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
9726e790746SPaolo Bonzini         n->nomulti = on;
9736e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
9746e790746SPaolo Bonzini         n->nouni = on;
9756e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
9766e790746SPaolo Bonzini         n->nobcast = on;
9776e790746SPaolo Bonzini     } else {
9786e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9796e790746SPaolo Bonzini     }
9806e790746SPaolo Bonzini 
981b1be4280SAmos Kong     rxfilter_notify(nc);
982b1be4280SAmos Kong 
9836e790746SPaolo Bonzini     return VIRTIO_NET_OK;
9846e790746SPaolo Bonzini }
9856e790746SPaolo Bonzini 
986644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
987644c9858SDmitry Fleytman                                      struct iovec *iov, unsigned int iov_cnt)
988644c9858SDmitry Fleytman {
989644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
990644c9858SDmitry Fleytman     uint64_t offloads;
991644c9858SDmitry Fleytman     size_t s;
992644c9858SDmitry Fleytman 
99395129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
994644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
995644c9858SDmitry Fleytman     }
996644c9858SDmitry Fleytman 
997644c9858SDmitry Fleytman     s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
998644c9858SDmitry Fleytman     if (s != sizeof(offloads)) {
999644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1000644c9858SDmitry Fleytman     }
1001644c9858SDmitry Fleytman 
1002644c9858SDmitry Fleytman     if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
1003644c9858SDmitry Fleytman         uint64_t supported_offloads;
1004644c9858SDmitry Fleytman 
1005189ae6bbSJason Wang         offloads = virtio_ldq_p(vdev, &offloads);
1006189ae6bbSJason Wang 
1007644c9858SDmitry Fleytman         if (!n->has_vnet_hdr) {
1008644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1009644c9858SDmitry Fleytman         }
1010644c9858SDmitry Fleytman 
10112974e916SYuri Benditovich         n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10122974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4);
10132974e916SYuri Benditovich         n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10142974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6);
10152974e916SYuri Benditovich         virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT);
10162974e916SYuri Benditovich 
1017644c9858SDmitry Fleytman         supported_offloads = virtio_net_supported_guest_offloads(n);
1018644c9858SDmitry Fleytman         if (offloads & ~supported_offloads) {
1019644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1020644c9858SDmitry Fleytman         }
1021644c9858SDmitry Fleytman 
1022644c9858SDmitry Fleytman         n->curr_guest_offloads = offloads;
1023644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
1024644c9858SDmitry Fleytman 
1025644c9858SDmitry Fleytman         return VIRTIO_NET_OK;
1026644c9858SDmitry Fleytman     } else {
1027644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1028644c9858SDmitry Fleytman     }
1029644c9858SDmitry Fleytman }
1030644c9858SDmitry Fleytman 
10316e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
10326e790746SPaolo Bonzini                                  struct iovec *iov, unsigned int iov_cnt)
10336e790746SPaolo Bonzini {
10341399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
10356e790746SPaolo Bonzini     struct virtio_net_ctrl_mac mac_data;
10366e790746SPaolo Bonzini     size_t s;
1037b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
10386e790746SPaolo Bonzini 
10396e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
10406e790746SPaolo Bonzini         if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
10416e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
10426e790746SPaolo Bonzini         }
10436e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
10446e790746SPaolo Bonzini         assert(s == sizeof(n->mac));
10456e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1046b1be4280SAmos Kong         rxfilter_notify(nc);
1047b1be4280SAmos Kong 
10486e790746SPaolo Bonzini         return VIRTIO_NET_OK;
10496e790746SPaolo Bonzini     }
10506e790746SPaolo Bonzini 
10516e790746SPaolo Bonzini     if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
10526e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
10536e790746SPaolo Bonzini     }
10546e790746SPaolo Bonzini 
1055cae2e556SAmos Kong     int in_use = 0;
1056cae2e556SAmos Kong     int first_multi = 0;
1057cae2e556SAmos Kong     uint8_t uni_overflow = 0;
1058cae2e556SAmos Kong     uint8_t multi_overflow = 0;
1059cae2e556SAmos Kong     uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
10606e790746SPaolo Bonzini 
10616e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10626e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10631399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10646e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1065b1be4280SAmos Kong         goto error;
10666e790746SPaolo Bonzini     }
10676e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10686e790746SPaolo Bonzini 
10696e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
1070b1be4280SAmos Kong         goto error;
10716e790746SPaolo Bonzini     }
10726e790746SPaolo Bonzini 
10736e790746SPaolo Bonzini     if (mac_data.entries <= MAC_TABLE_ENTRIES) {
1074cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, macs,
10756e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
10766e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1077b1be4280SAmos Kong             goto error;
10786e790746SPaolo Bonzini         }
1079cae2e556SAmos Kong         in_use += mac_data.entries;
10806e790746SPaolo Bonzini     } else {
1081cae2e556SAmos Kong         uni_overflow = 1;
10826e790746SPaolo Bonzini     }
10836e790746SPaolo Bonzini 
10846e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
10856e790746SPaolo Bonzini 
1086cae2e556SAmos Kong     first_multi = in_use;
10876e790746SPaolo Bonzini 
10886e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10896e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10901399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10916e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1092b1be4280SAmos Kong         goto error;
10936e790746SPaolo Bonzini     }
10946e790746SPaolo Bonzini 
10956e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10966e790746SPaolo Bonzini 
10976e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
1098b1be4280SAmos Kong         goto error;
10996e790746SPaolo Bonzini     }
11006e790746SPaolo Bonzini 
1101edc24385SMichael S. Tsirkin     if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
1102cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
11036e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
11046e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1105b1be4280SAmos Kong             goto error;
11066e790746SPaolo Bonzini         }
1107cae2e556SAmos Kong         in_use += mac_data.entries;
11086e790746SPaolo Bonzini     } else {
1109cae2e556SAmos Kong         multi_overflow = 1;
11106e790746SPaolo Bonzini     }
11116e790746SPaolo Bonzini 
1112cae2e556SAmos Kong     n->mac_table.in_use = in_use;
1113cae2e556SAmos Kong     n->mac_table.first_multi = first_multi;
1114cae2e556SAmos Kong     n->mac_table.uni_overflow = uni_overflow;
1115cae2e556SAmos Kong     n->mac_table.multi_overflow = multi_overflow;
1116cae2e556SAmos Kong     memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
1117cae2e556SAmos Kong     g_free(macs);
1118b1be4280SAmos Kong     rxfilter_notify(nc);
1119b1be4280SAmos Kong 
11206e790746SPaolo Bonzini     return VIRTIO_NET_OK;
1121b1be4280SAmos Kong 
1122b1be4280SAmos Kong error:
1123cae2e556SAmos Kong     g_free(macs);
1124b1be4280SAmos Kong     return VIRTIO_NET_ERR;
11256e790746SPaolo Bonzini }
11266e790746SPaolo Bonzini 
11276e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
11286e790746SPaolo Bonzini                                         struct iovec *iov, unsigned int iov_cnt)
11296e790746SPaolo Bonzini {
11301399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
11316e790746SPaolo Bonzini     uint16_t vid;
11326e790746SPaolo Bonzini     size_t s;
1133b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
11346e790746SPaolo Bonzini 
11356e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
11361399c60dSRusty Russell     vid = virtio_lduw_p(vdev, &vid);
11376e790746SPaolo Bonzini     if (s != sizeof(vid)) {
11386e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11396e790746SPaolo Bonzini     }
11406e790746SPaolo Bonzini 
11416e790746SPaolo Bonzini     if (vid >= MAX_VLAN)
11426e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11436e790746SPaolo Bonzini 
11446e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
11456e790746SPaolo Bonzini         n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
11466e790746SPaolo Bonzini     else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
11476e790746SPaolo Bonzini         n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
11486e790746SPaolo Bonzini     else
11496e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11506e790746SPaolo Bonzini 
1151b1be4280SAmos Kong     rxfilter_notify(nc);
1152b1be4280SAmos Kong 
11536e790746SPaolo Bonzini     return VIRTIO_NET_OK;
11546e790746SPaolo Bonzini }
11556e790746SPaolo Bonzini 
1156f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd,
1157f57fcf70SJason Wang                                       struct iovec *iov, unsigned int iov_cnt)
1158f57fcf70SJason Wang {
11599d8c6a25SDr. David Alan Gilbert     trace_virtio_net_handle_announce(n->announce_timer.round);
1160f57fcf70SJason Wang     if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK &&
1161f57fcf70SJason Wang         n->status & VIRTIO_NET_S_ANNOUNCE) {
1162f57fcf70SJason Wang         n->status &= ~VIRTIO_NET_S_ANNOUNCE;
11639d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
11649d8c6a25SDr. David Alan Gilbert             qemu_announce_timer_step(&n->announce_timer);
1165f57fcf70SJason Wang         }
1166f57fcf70SJason Wang         return VIRTIO_NET_OK;
1167f57fcf70SJason Wang     } else {
1168f57fcf70SJason Wang         return VIRTIO_NET_ERR;
1169f57fcf70SJason Wang     }
1170f57fcf70SJason Wang }
1171f57fcf70SJason Wang 
117259079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n)
117359079029SYuri Benditovich {
117459079029SYuri Benditovich     if (n->rss_data.enabled) {
117559079029SYuri Benditovich         trace_virtio_net_rss_disable();
117659079029SYuri Benditovich     }
117759079029SYuri Benditovich     n->rss_data.enabled = false;
117859079029SYuri Benditovich }
117959079029SYuri Benditovich 
118059079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n,
1181e22f0603SYuri Benditovich                                       struct iovec *iov,
1182e22f0603SYuri Benditovich                                       unsigned int iov_cnt,
1183e22f0603SYuri Benditovich                                       bool do_rss)
118459079029SYuri Benditovich {
118559079029SYuri Benditovich     VirtIODevice *vdev = VIRTIO_DEVICE(n);
118659079029SYuri Benditovich     struct virtio_net_rss_config cfg;
118759079029SYuri Benditovich     size_t s, offset = 0, size_get;
118859079029SYuri Benditovich     uint16_t queues, i;
118959079029SYuri Benditovich     struct {
119059079029SYuri Benditovich         uint16_t us;
119159079029SYuri Benditovich         uint8_t b;
119259079029SYuri Benditovich     } QEMU_PACKED temp;
119359079029SYuri Benditovich     const char *err_msg = "";
119459079029SYuri Benditovich     uint32_t err_value = 0;
119559079029SYuri Benditovich 
1196e22f0603SYuri Benditovich     if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) {
119759079029SYuri Benditovich         err_msg = "RSS is not negotiated";
119859079029SYuri Benditovich         goto error;
119959079029SYuri Benditovich     }
1200e22f0603SYuri Benditovich     if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) {
1201e22f0603SYuri Benditovich         err_msg = "Hash report is not negotiated";
1202e22f0603SYuri Benditovich         goto error;
1203e22f0603SYuri Benditovich     }
120459079029SYuri Benditovich     size_get = offsetof(struct virtio_net_rss_config, indirection_table);
120559079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get);
120659079029SYuri Benditovich     if (s != size_get) {
120759079029SYuri Benditovich         err_msg = "Short command buffer";
120859079029SYuri Benditovich         err_value = (uint32_t)s;
120959079029SYuri Benditovich         goto error;
121059079029SYuri Benditovich     }
121159079029SYuri Benditovich     n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types);
121259079029SYuri Benditovich     n->rss_data.indirections_len =
121359079029SYuri Benditovich         virtio_lduw_p(vdev, &cfg.indirection_table_mask);
121459079029SYuri Benditovich     n->rss_data.indirections_len++;
1215e22f0603SYuri Benditovich     if (!do_rss) {
1216e22f0603SYuri Benditovich         n->rss_data.indirections_len = 1;
1217e22f0603SYuri Benditovich     }
121859079029SYuri Benditovich     if (!is_power_of_2(n->rss_data.indirections_len)) {
121959079029SYuri Benditovich         err_msg = "Invalid size of indirection table";
122059079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
122159079029SYuri Benditovich         goto error;
122259079029SYuri Benditovich     }
122359079029SYuri Benditovich     if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) {
122459079029SYuri Benditovich         err_msg = "Too large indirection table";
122559079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
122659079029SYuri Benditovich         goto error;
122759079029SYuri Benditovich     }
1228e22f0603SYuri Benditovich     n->rss_data.default_queue = do_rss ?
1229e22f0603SYuri Benditovich         virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0;
123059079029SYuri Benditovich     if (n->rss_data.default_queue >= n->max_queues) {
123159079029SYuri Benditovich         err_msg = "Invalid default queue";
123259079029SYuri Benditovich         err_value = n->rss_data.default_queue;
123359079029SYuri Benditovich         goto error;
123459079029SYuri Benditovich     }
123559079029SYuri Benditovich     offset += size_get;
123659079029SYuri Benditovich     size_get = sizeof(uint16_t) * n->rss_data.indirections_len;
123759079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
123859079029SYuri Benditovich     n->rss_data.indirections_table = g_malloc(size_get);
123959079029SYuri Benditovich     if (!n->rss_data.indirections_table) {
124059079029SYuri Benditovich         err_msg = "Can't allocate indirections table";
124159079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
124259079029SYuri Benditovich         goto error;
124359079029SYuri Benditovich     }
124459079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset,
124559079029SYuri Benditovich                    n->rss_data.indirections_table, size_get);
124659079029SYuri Benditovich     if (s != size_get) {
124759079029SYuri Benditovich         err_msg = "Short indirection table buffer";
124859079029SYuri Benditovich         err_value = (uint32_t)s;
124959079029SYuri Benditovich         goto error;
125059079029SYuri Benditovich     }
125159079029SYuri Benditovich     for (i = 0; i < n->rss_data.indirections_len; ++i) {
125259079029SYuri Benditovich         uint16_t val = n->rss_data.indirections_table[i];
125359079029SYuri Benditovich         n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val);
125459079029SYuri Benditovich     }
125559079029SYuri Benditovich     offset += size_get;
125659079029SYuri Benditovich     size_get = sizeof(temp);
125759079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get);
125859079029SYuri Benditovich     if (s != size_get) {
125959079029SYuri Benditovich         err_msg = "Can't get queues";
126059079029SYuri Benditovich         err_value = (uint32_t)s;
126159079029SYuri Benditovich         goto error;
126259079029SYuri Benditovich     }
1263e22f0603SYuri Benditovich     queues = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queues;
126459079029SYuri Benditovich     if (queues == 0 || queues > n->max_queues) {
126559079029SYuri Benditovich         err_msg = "Invalid number of queues";
126659079029SYuri Benditovich         err_value = queues;
126759079029SYuri Benditovich         goto error;
126859079029SYuri Benditovich     }
126959079029SYuri Benditovich     if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) {
127059079029SYuri Benditovich         err_msg = "Invalid key size";
127159079029SYuri Benditovich         err_value = temp.b;
127259079029SYuri Benditovich         goto error;
127359079029SYuri Benditovich     }
127459079029SYuri Benditovich     if (!temp.b && n->rss_data.hash_types) {
127559079029SYuri Benditovich         err_msg = "No key provided";
127659079029SYuri Benditovich         err_value = 0;
127759079029SYuri Benditovich         goto error;
127859079029SYuri Benditovich     }
127959079029SYuri Benditovich     if (!temp.b && !n->rss_data.hash_types) {
128059079029SYuri Benditovich         virtio_net_disable_rss(n);
128159079029SYuri Benditovich         return queues;
128259079029SYuri Benditovich     }
128359079029SYuri Benditovich     offset += size_get;
128459079029SYuri Benditovich     size_get = temp.b;
128559079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get);
128659079029SYuri Benditovich     if (s != size_get) {
128759079029SYuri Benditovich         err_msg = "Can get key buffer";
128859079029SYuri Benditovich         err_value = (uint32_t)s;
128959079029SYuri Benditovich         goto error;
129059079029SYuri Benditovich     }
129159079029SYuri Benditovich     n->rss_data.enabled = true;
129259079029SYuri Benditovich     trace_virtio_net_rss_enable(n->rss_data.hash_types,
129359079029SYuri Benditovich                                 n->rss_data.indirections_len,
129459079029SYuri Benditovich                                 temp.b);
129559079029SYuri Benditovich     return queues;
129659079029SYuri Benditovich error:
129759079029SYuri Benditovich     trace_virtio_net_rss_error(err_msg, err_value);
129859079029SYuri Benditovich     virtio_net_disable_rss(n);
129959079029SYuri Benditovich     return 0;
130059079029SYuri Benditovich }
130159079029SYuri Benditovich 
13026e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
13036e790746SPaolo Bonzini                                 struct iovec *iov, unsigned int iov_cnt)
13046e790746SPaolo Bonzini {
130517a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
13066e790746SPaolo Bonzini     uint16_t queues;
13076e790746SPaolo Bonzini 
130859079029SYuri Benditovich     virtio_net_disable_rss(n);
1309e22f0603SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) {
1310e22f0603SYuri Benditovich         queues = virtio_net_handle_rss(n, iov, iov_cnt, false);
1311e22f0603SYuri Benditovich         return queues ? VIRTIO_NET_OK : VIRTIO_NET_ERR;
1312e22f0603SYuri Benditovich     }
131359079029SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) {
1314e22f0603SYuri Benditovich         queues = virtio_net_handle_rss(n, iov, iov_cnt, true);
131559079029SYuri Benditovich     } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
131659079029SYuri Benditovich         struct virtio_net_ctrl_mq mq;
131759079029SYuri Benditovich         size_t s;
131859079029SYuri Benditovich         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) {
131959079029SYuri Benditovich             return VIRTIO_NET_ERR;
132059079029SYuri Benditovich         }
13216e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
13226e790746SPaolo Bonzini         if (s != sizeof(mq)) {
13236e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
13246e790746SPaolo Bonzini         }
132559079029SYuri Benditovich         queues = virtio_lduw_p(vdev, &mq.virtqueue_pairs);
13266e790746SPaolo Bonzini 
132759079029SYuri Benditovich     } else {
13286e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
13296e790746SPaolo Bonzini     }
13306e790746SPaolo Bonzini 
13316e790746SPaolo Bonzini     if (queues < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
13326e790746SPaolo Bonzini         queues > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
13336e790746SPaolo Bonzini         queues > n->max_queues ||
13346e790746SPaolo Bonzini         !n->multiqueue) {
13356e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
13366e790746SPaolo Bonzini     }
13376e790746SPaolo Bonzini 
13386e790746SPaolo Bonzini     n->curr_queues = queues;
13396e790746SPaolo Bonzini     /* stop the backend before changing the number of queues to avoid handling a
13406e790746SPaolo Bonzini      * disabled queue */
134117a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
13426e790746SPaolo Bonzini     virtio_net_set_queues(n);
13436e790746SPaolo Bonzini 
13446e790746SPaolo Bonzini     return VIRTIO_NET_OK;
13456e790746SPaolo Bonzini }
1346ba7eadb5SGreg Kurz 
13476e790746SPaolo Bonzini static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
13486e790746SPaolo Bonzini {
134917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
13506e790746SPaolo Bonzini     struct virtio_net_ctrl_hdr ctrl;
13516e790746SPaolo Bonzini     virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
135251b19ebeSPaolo Bonzini     VirtQueueElement *elem;
13536e790746SPaolo Bonzini     size_t s;
1354771b6ed3SJason Wang     struct iovec *iov, *iov2;
13556e790746SPaolo Bonzini     unsigned int iov_cnt;
13566e790746SPaolo Bonzini 
135751b19ebeSPaolo Bonzini     for (;;) {
135851b19ebeSPaolo Bonzini         elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
135951b19ebeSPaolo Bonzini         if (!elem) {
136051b19ebeSPaolo Bonzini             break;
136151b19ebeSPaolo Bonzini         }
136251b19ebeSPaolo Bonzini         if (iov_size(elem->in_sg, elem->in_num) < sizeof(status) ||
136351b19ebeSPaolo Bonzini             iov_size(elem->out_sg, elem->out_num) < sizeof(ctrl)) {
1364ba7eadb5SGreg Kurz             virtio_error(vdev, "virtio-net ctrl missing headers");
1365ba7eadb5SGreg Kurz             virtqueue_detach_element(vq, elem, 0);
1366ba7eadb5SGreg Kurz             g_free(elem);
1367ba7eadb5SGreg Kurz             break;
13686e790746SPaolo Bonzini         }
13696e790746SPaolo Bonzini 
137051b19ebeSPaolo Bonzini         iov_cnt = elem->out_num;
137151b19ebeSPaolo Bonzini         iov2 = iov = g_memdup(elem->out_sg, sizeof(struct iovec) * elem->out_num);
13726e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl));
13736e790746SPaolo Bonzini         iov_discard_front(&iov, &iov_cnt, sizeof(ctrl));
13746e790746SPaolo Bonzini         if (s != sizeof(ctrl)) {
13756e790746SPaolo Bonzini             status = VIRTIO_NET_ERR;
13766e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
13776e790746SPaolo Bonzini             status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt);
13786e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
13796e790746SPaolo Bonzini             status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt);
13806e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
13816e790746SPaolo Bonzini             status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt);
1382f57fcf70SJason Wang         } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) {
1383f57fcf70SJason Wang             status = virtio_net_handle_announce(n, ctrl.cmd, iov, iov_cnt);
13846e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
13856e790746SPaolo Bonzini             status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt);
1386644c9858SDmitry Fleytman         } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
1387644c9858SDmitry Fleytman             status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt);
13886e790746SPaolo Bonzini         }
13896e790746SPaolo Bonzini 
139051b19ebeSPaolo Bonzini         s = iov_from_buf(elem->in_sg, elem->in_num, 0, &status, sizeof(status));
13916e790746SPaolo Bonzini         assert(s == sizeof(status));
13926e790746SPaolo Bonzini 
139351b19ebeSPaolo Bonzini         virtqueue_push(vq, elem, sizeof(status));
13946e790746SPaolo Bonzini         virtio_notify(vdev, vq);
1395771b6ed3SJason Wang         g_free(iov2);
139651b19ebeSPaolo Bonzini         g_free(elem);
13976e790746SPaolo Bonzini     }
13986e790746SPaolo Bonzini }
13996e790746SPaolo Bonzini 
14006e790746SPaolo Bonzini /* RX */
14016e790746SPaolo Bonzini 
14026e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
14036e790746SPaolo Bonzini {
140417a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
14056e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(vq));
14066e790746SPaolo Bonzini 
14076e790746SPaolo Bonzini     qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
14086e790746SPaolo Bonzini }
14096e790746SPaolo Bonzini 
1410b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc)
14116e790746SPaolo Bonzini {
14126e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
141317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
14146e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
14156e790746SPaolo Bonzini 
141617a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
1417b8c4b67eSPhilippe Mathieu-Daudé         return false;
14186e790746SPaolo Bonzini     }
14196e790746SPaolo Bonzini 
14206e790746SPaolo Bonzini     if (nc->queue_index >= n->curr_queues) {
1421b8c4b67eSPhilippe Mathieu-Daudé         return false;
14226e790746SPaolo Bonzini     }
14236e790746SPaolo Bonzini 
14246e790746SPaolo Bonzini     if (!virtio_queue_ready(q->rx_vq) ||
142517a0ca55SKONRAD Frederic         !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
1426b8c4b67eSPhilippe Mathieu-Daudé         return false;
14276e790746SPaolo Bonzini     }
14286e790746SPaolo Bonzini 
1429b8c4b67eSPhilippe Mathieu-Daudé     return true;
14306e790746SPaolo Bonzini }
14316e790746SPaolo Bonzini 
14326e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
14336e790746SPaolo Bonzini {
14346e790746SPaolo Bonzini     VirtIONet *n = q->n;
14356e790746SPaolo Bonzini     if (virtio_queue_empty(q->rx_vq) ||
14366e790746SPaolo Bonzini         (n->mergeable_rx_bufs &&
14376e790746SPaolo Bonzini          !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
14386e790746SPaolo Bonzini         virtio_queue_set_notification(q->rx_vq, 1);
14396e790746SPaolo Bonzini 
14406e790746SPaolo Bonzini         /* To avoid a race condition where the guest has made some buffers
14416e790746SPaolo Bonzini          * available after the above check but before notification was
14426e790746SPaolo Bonzini          * enabled, check for available buffers again.
14436e790746SPaolo Bonzini          */
14446e790746SPaolo Bonzini         if (virtio_queue_empty(q->rx_vq) ||
14456e790746SPaolo Bonzini             (n->mergeable_rx_bufs &&
14466e790746SPaolo Bonzini              !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
14476e790746SPaolo Bonzini             return 0;
14486e790746SPaolo Bonzini         }
14496e790746SPaolo Bonzini     }
14506e790746SPaolo Bonzini 
14516e790746SPaolo Bonzini     virtio_queue_set_notification(q->rx_vq, 0);
14526e790746SPaolo Bonzini     return 1;
14536e790746SPaolo Bonzini }
14546e790746SPaolo Bonzini 
14551399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr)
1456032a74a1SCédric Le Goater {
14571399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->hdr_len);
14581399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->gso_size);
14591399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_start);
14601399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_offset);
1461032a74a1SCédric Le Goater }
1462032a74a1SCédric Le Goater 
14636e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
14646e790746SPaolo Bonzini  * it never finds out that the packets don't have valid checksums.  This
14656e790746SPaolo Bonzini  * causes dhclient to get upset.  Fedora's carried a patch for ages to
14666e790746SPaolo Bonzini  * fix this with Xen but it hasn't appeared in an upstream release of
14676e790746SPaolo Bonzini  * dhclient yet.
14686e790746SPaolo Bonzini  *
14696e790746SPaolo Bonzini  * To avoid breaking existing guests, we catch udp packets and add
14706e790746SPaolo Bonzini  * checksums.  This is terrible but it's better than hacking the guest
14716e790746SPaolo Bonzini  * kernels.
14726e790746SPaolo Bonzini  *
14736e790746SPaolo Bonzini  * N.B. if we introduce a zero-copy API, this operation is no longer free so
14746e790746SPaolo Bonzini  * we should provide a mechanism to disable it to avoid polluting the host
14756e790746SPaolo Bonzini  * cache.
14766e790746SPaolo Bonzini  */
14776e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
14786e790746SPaolo Bonzini                                         uint8_t *buf, size_t size)
14796e790746SPaolo Bonzini {
14806e790746SPaolo Bonzini     if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
14816e790746SPaolo Bonzini         (size > 27 && size < 1500) && /* normal sized MTU */
14826e790746SPaolo Bonzini         (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
14836e790746SPaolo Bonzini         (buf[23] == 17) && /* ip.protocol == UDP */
14846e790746SPaolo Bonzini         (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
14856e790746SPaolo Bonzini         net_checksum_calculate(buf, size);
14866e790746SPaolo Bonzini         hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
14876e790746SPaolo Bonzini     }
14886e790746SPaolo Bonzini }
14896e790746SPaolo Bonzini 
14906e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
14916e790746SPaolo Bonzini                            const void *buf, size_t size)
14926e790746SPaolo Bonzini {
14936e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
14946e790746SPaolo Bonzini         /* FIXME this cast is evil */
14956e790746SPaolo Bonzini         void *wbuf = (void *)buf;
14966e790746SPaolo Bonzini         work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
14976e790746SPaolo Bonzini                                     size - n->host_hdr_len);
14981bfa316cSGreg Kurz 
14991bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
15001399c60dSRusty Russell             virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf);
15011bfa316cSGreg Kurz         }
15026e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
15036e790746SPaolo Bonzini     } else {
15046e790746SPaolo Bonzini         struct virtio_net_hdr hdr = {
15056e790746SPaolo Bonzini             .flags = 0,
15066e790746SPaolo Bonzini             .gso_type = VIRTIO_NET_HDR_GSO_NONE
15076e790746SPaolo Bonzini         };
15086e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
15096e790746SPaolo Bonzini     }
15106e790746SPaolo Bonzini }
15116e790746SPaolo Bonzini 
15126e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
15136e790746SPaolo Bonzini {
15146e790746SPaolo Bonzini     static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
15156e790746SPaolo Bonzini     static const uint8_t vlan[] = {0x81, 0x00};
15166e790746SPaolo Bonzini     uint8_t *ptr = (uint8_t *)buf;
15176e790746SPaolo Bonzini     int i;
15186e790746SPaolo Bonzini 
15196e790746SPaolo Bonzini     if (n->promisc)
15206e790746SPaolo Bonzini         return 1;
15216e790746SPaolo Bonzini 
15226e790746SPaolo Bonzini     ptr += n->host_hdr_len;
15236e790746SPaolo Bonzini 
15246e790746SPaolo Bonzini     if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
15257542d3e7SPeter Maydell         int vid = lduw_be_p(ptr + 14) & 0xfff;
15266e790746SPaolo Bonzini         if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
15276e790746SPaolo Bonzini             return 0;
15286e790746SPaolo Bonzini     }
15296e790746SPaolo Bonzini 
15306e790746SPaolo Bonzini     if (ptr[0] & 1) { // multicast
15316e790746SPaolo Bonzini         if (!memcmp(ptr, bcast, sizeof(bcast))) {
15326e790746SPaolo Bonzini             return !n->nobcast;
15336e790746SPaolo Bonzini         } else if (n->nomulti) {
15346e790746SPaolo Bonzini             return 0;
15356e790746SPaolo Bonzini         } else if (n->allmulti || n->mac_table.multi_overflow) {
15366e790746SPaolo Bonzini             return 1;
15376e790746SPaolo Bonzini         }
15386e790746SPaolo Bonzini 
15396e790746SPaolo Bonzini         for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
15406e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
15416e790746SPaolo Bonzini                 return 1;
15426e790746SPaolo Bonzini             }
15436e790746SPaolo Bonzini         }
15446e790746SPaolo Bonzini     } else { // unicast
15456e790746SPaolo Bonzini         if (n->nouni) {
15466e790746SPaolo Bonzini             return 0;
15476e790746SPaolo Bonzini         } else if (n->alluni || n->mac_table.uni_overflow) {
15486e790746SPaolo Bonzini             return 1;
15496e790746SPaolo Bonzini         } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
15506e790746SPaolo Bonzini             return 1;
15516e790746SPaolo Bonzini         }
15526e790746SPaolo Bonzini 
15536e790746SPaolo Bonzini         for (i = 0; i < n->mac_table.first_multi; i++) {
15546e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
15556e790746SPaolo Bonzini                 return 1;
15566e790746SPaolo Bonzini             }
15576e790746SPaolo Bonzini         }
15586e790746SPaolo Bonzini     }
15596e790746SPaolo Bonzini 
15606e790746SPaolo Bonzini     return 0;
15616e790746SPaolo Bonzini }
15626e790746SPaolo Bonzini 
15634474e37aSYuri Benditovich static uint8_t virtio_net_get_hash_type(bool isip4,
15644474e37aSYuri Benditovich                                         bool isip6,
15654474e37aSYuri Benditovich                                         bool isudp,
15664474e37aSYuri Benditovich                                         bool istcp,
15674474e37aSYuri Benditovich                                         uint32_t types)
15684474e37aSYuri Benditovich {
15694474e37aSYuri Benditovich     if (isip4) {
15704474e37aSYuri Benditovich         if (istcp && (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4)) {
15714474e37aSYuri Benditovich             return NetPktRssIpV4Tcp;
15724474e37aSYuri Benditovich         }
15734474e37aSYuri Benditovich         if (isudp && (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4)) {
15744474e37aSYuri Benditovich             return NetPktRssIpV4Udp;
15754474e37aSYuri Benditovich         }
15764474e37aSYuri Benditovich         if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) {
15774474e37aSYuri Benditovich             return NetPktRssIpV4;
15784474e37aSYuri Benditovich         }
15794474e37aSYuri Benditovich     } else if (isip6) {
15804474e37aSYuri Benditovich         uint32_t mask = VIRTIO_NET_RSS_HASH_TYPE_TCP_EX |
15814474e37aSYuri Benditovich                         VIRTIO_NET_RSS_HASH_TYPE_TCPv6;
15824474e37aSYuri Benditovich 
15834474e37aSYuri Benditovich         if (istcp && (types & mask)) {
15844474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) ?
15854474e37aSYuri Benditovich                 NetPktRssIpV6TcpEx : NetPktRssIpV6Tcp;
15864474e37aSYuri Benditovich         }
15874474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_UDP_EX | VIRTIO_NET_RSS_HASH_TYPE_UDPv6;
15884474e37aSYuri Benditovich         if (isudp && (types & mask)) {
15894474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) ?
15904474e37aSYuri Benditovich                 NetPktRssIpV6UdpEx : NetPktRssIpV6Udp;
15914474e37aSYuri Benditovich         }
15924474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_IP_EX | VIRTIO_NET_RSS_HASH_TYPE_IPv6;
15934474e37aSYuri Benditovich         if (types & mask) {
15944474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) ?
15954474e37aSYuri Benditovich                 NetPktRssIpV6Ex : NetPktRssIpV6;
15964474e37aSYuri Benditovich         }
15974474e37aSYuri Benditovich     }
15984474e37aSYuri Benditovich     return 0xff;
15994474e37aSYuri Benditovich }
16004474e37aSYuri Benditovich 
1601e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report,
1602e22f0603SYuri Benditovich                                    uint32_t hash)
1603e22f0603SYuri Benditovich {
1604e22f0603SYuri Benditovich     struct virtio_net_hdr_v1_hash *hdr = (void *)buf;
1605e22f0603SYuri Benditovich     hdr->hash_value = hash;
1606e22f0603SYuri Benditovich     hdr->hash_report = report;
1607e22f0603SYuri Benditovich }
1608e22f0603SYuri Benditovich 
16094474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf,
161097cd965cSPaolo Bonzini                                   size_t size)
16116e790746SPaolo Bonzini {
16126e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1613e22f0603SYuri Benditovich     unsigned int index = nc->queue_index, new_index = index;
16144474e37aSYuri Benditovich     struct NetRxPkt *pkt = n->rx_pkt;
16154474e37aSYuri Benditovich     uint8_t net_hash_type;
16164474e37aSYuri Benditovich     uint32_t hash;
16174474e37aSYuri Benditovich     bool isip4, isip6, isudp, istcp;
1618e22f0603SYuri Benditovich     static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = {
1619e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv4,
1620e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv4,
1621e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6,
1622e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6,
1623e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6_EX,
1624e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6_EX,
1625e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv4,
1626e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6,
1627e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6_EX
1628e22f0603SYuri Benditovich     };
16294474e37aSYuri Benditovich 
16304474e37aSYuri Benditovich     net_rx_pkt_set_protocols(pkt, buf + n->host_hdr_len,
16314474e37aSYuri Benditovich                              size - n->host_hdr_len);
16324474e37aSYuri Benditovich     net_rx_pkt_get_protocols(pkt, &isip4, &isip6, &isudp, &istcp);
16334474e37aSYuri Benditovich     if (isip4 && (net_rx_pkt_get_ip4_info(pkt)->fragment)) {
16344474e37aSYuri Benditovich         istcp = isudp = false;
16354474e37aSYuri Benditovich     }
16364474e37aSYuri Benditovich     if (isip6 && (net_rx_pkt_get_ip6_info(pkt)->fragment)) {
16374474e37aSYuri Benditovich         istcp = isudp = false;
16384474e37aSYuri Benditovich     }
16394474e37aSYuri Benditovich     net_hash_type = virtio_net_get_hash_type(isip4, isip6, isudp, istcp,
16404474e37aSYuri Benditovich                                              n->rss_data.hash_types);
16414474e37aSYuri Benditovich     if (net_hash_type > NetPktRssIpV6UdpEx) {
1642e22f0603SYuri Benditovich         if (n->rss_data.populate_hash) {
1643e22f0603SYuri Benditovich             virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0);
1644e22f0603SYuri Benditovich         }
1645e22f0603SYuri Benditovich         return n->rss_data.redirect ? n->rss_data.default_queue : -1;
16464474e37aSYuri Benditovich     }
16474474e37aSYuri Benditovich 
16484474e37aSYuri Benditovich     hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key);
1649e22f0603SYuri Benditovich 
1650e22f0603SYuri Benditovich     if (n->rss_data.populate_hash) {
1651e22f0603SYuri Benditovich         virtio_set_packet_hash(buf, reports[net_hash_type], hash);
1652e22f0603SYuri Benditovich     }
1653e22f0603SYuri Benditovich 
1654e22f0603SYuri Benditovich     if (n->rss_data.redirect) {
16554474e37aSYuri Benditovich         new_index = hash & (n->rss_data.indirections_len - 1);
16564474e37aSYuri Benditovich         new_index = n->rss_data.indirections_table[new_index];
16574474e37aSYuri Benditovich     }
1658e22f0603SYuri Benditovich 
1659e22f0603SYuri Benditovich     return (index == new_index) ? -1 : new_index;
16604474e37aSYuri Benditovich }
16614474e37aSYuri Benditovich 
16624474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf,
16634474e37aSYuri Benditovich                                       size_t size, bool no_rss)
16644474e37aSYuri Benditovich {
16654474e37aSYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
16666e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
166717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
16686e790746SPaolo Bonzini     struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
16696e790746SPaolo Bonzini     struct virtio_net_hdr_mrg_rxbuf mhdr;
16706e790746SPaolo Bonzini     unsigned mhdr_cnt = 0;
16716e790746SPaolo Bonzini     size_t offset, i, guest_offset;
16726e790746SPaolo Bonzini 
16736e790746SPaolo Bonzini     if (!virtio_net_can_receive(nc)) {
16746e790746SPaolo Bonzini         return -1;
16756e790746SPaolo Bonzini     }
16766e790746SPaolo Bonzini 
16774474e37aSYuri Benditovich     if (!no_rss && n->rss_data.enabled) {
16784474e37aSYuri Benditovich         int index = virtio_net_process_rss(nc, buf, size);
16794474e37aSYuri Benditovich         if (index >= 0) {
16804474e37aSYuri Benditovich             NetClientState *nc2 = qemu_get_subqueue(n->nic, index);
16814474e37aSYuri Benditovich             return virtio_net_receive_rcu(nc2, buf, size, true);
16824474e37aSYuri Benditovich         }
16834474e37aSYuri Benditovich     }
16844474e37aSYuri Benditovich 
16856e790746SPaolo Bonzini     /* hdr_len refers to the header we supply to the guest */
16866e790746SPaolo Bonzini     if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
16876e790746SPaolo Bonzini         return 0;
16886e790746SPaolo Bonzini     }
16896e790746SPaolo Bonzini 
16906e790746SPaolo Bonzini     if (!receive_filter(n, buf, size))
16916e790746SPaolo Bonzini         return size;
16926e790746SPaolo Bonzini 
16936e790746SPaolo Bonzini     offset = i = 0;
16946e790746SPaolo Bonzini 
16956e790746SPaolo Bonzini     while (offset < size) {
169651b19ebeSPaolo Bonzini         VirtQueueElement *elem;
16976e790746SPaolo Bonzini         int len, total;
169851b19ebeSPaolo Bonzini         const struct iovec *sg;
16996e790746SPaolo Bonzini 
17006e790746SPaolo Bonzini         total = 0;
17016e790746SPaolo Bonzini 
170251b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement));
170351b19ebeSPaolo Bonzini         if (!elem) {
1704ba10b9c0SGreg Kurz             if (i) {
1705ba10b9c0SGreg Kurz                 virtio_error(vdev, "virtio-net unexpected empty queue: "
17066e790746SPaolo Bonzini                              "i %zd mergeable %d offset %zd, size %zd, "
1707019a3edbSGerd Hoffmann                              "guest hdr len %zd, host hdr len %zd "
1708019a3edbSGerd Hoffmann                              "guest features 0x%" PRIx64,
17096e790746SPaolo Bonzini                              i, n->mergeable_rx_bufs, offset, size,
1710019a3edbSGerd Hoffmann                              n->guest_hdr_len, n->host_hdr_len,
1711019a3edbSGerd Hoffmann                              vdev->guest_features);
1712ba10b9c0SGreg Kurz             }
1713ba10b9c0SGreg Kurz             return -1;
17146e790746SPaolo Bonzini         }
17156e790746SPaolo Bonzini 
171651b19ebeSPaolo Bonzini         if (elem->in_num < 1) {
1717ba10b9c0SGreg Kurz             virtio_error(vdev,
1718ba10b9c0SGreg Kurz                          "virtio-net receive queue contains no in buffers");
1719ba10b9c0SGreg Kurz             virtqueue_detach_element(q->rx_vq, elem, 0);
1720ba10b9c0SGreg Kurz             g_free(elem);
1721ba10b9c0SGreg Kurz             return -1;
17226e790746SPaolo Bonzini         }
17236e790746SPaolo Bonzini 
172451b19ebeSPaolo Bonzini         sg = elem->in_sg;
17256e790746SPaolo Bonzini         if (i == 0) {
17266e790746SPaolo Bonzini             assert(offset == 0);
17276e790746SPaolo Bonzini             if (n->mergeable_rx_bufs) {
17286e790746SPaolo Bonzini                 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
172951b19ebeSPaolo Bonzini                                     sg, elem->in_num,
17306e790746SPaolo Bonzini                                     offsetof(typeof(mhdr), num_buffers),
17316e790746SPaolo Bonzini                                     sizeof(mhdr.num_buffers));
17326e790746SPaolo Bonzini             }
17336e790746SPaolo Bonzini 
173451b19ebeSPaolo Bonzini             receive_header(n, sg, elem->in_num, buf, size);
1735e22f0603SYuri Benditovich             if (n->rss_data.populate_hash) {
1736e22f0603SYuri Benditovich                 offset = sizeof(mhdr);
1737e22f0603SYuri Benditovich                 iov_from_buf(sg, elem->in_num, offset,
1738e22f0603SYuri Benditovich                              buf + offset, n->host_hdr_len - sizeof(mhdr));
1739e22f0603SYuri Benditovich             }
17406e790746SPaolo Bonzini             offset = n->host_hdr_len;
17416e790746SPaolo Bonzini             total += n->guest_hdr_len;
17426e790746SPaolo Bonzini             guest_offset = n->guest_hdr_len;
17436e790746SPaolo Bonzini         } else {
17446e790746SPaolo Bonzini             guest_offset = 0;
17456e790746SPaolo Bonzini         }
17466e790746SPaolo Bonzini 
17476e790746SPaolo Bonzini         /* copy in packet.  ugh */
174851b19ebeSPaolo Bonzini         len = iov_from_buf(sg, elem->in_num, guest_offset,
17496e790746SPaolo Bonzini                            buf + offset, size - offset);
17506e790746SPaolo Bonzini         total += len;
17516e790746SPaolo Bonzini         offset += len;
17526e790746SPaolo Bonzini         /* If buffers can't be merged, at this point we
17536e790746SPaolo Bonzini          * must have consumed the complete packet.
17546e790746SPaolo Bonzini          * Otherwise, drop it. */
17556e790746SPaolo Bonzini         if (!n->mergeable_rx_bufs && offset < size) {
175627e57efeSLadi Prosek             virtqueue_unpop(q->rx_vq, elem, total);
175751b19ebeSPaolo Bonzini             g_free(elem);
17586e790746SPaolo Bonzini             return size;
17596e790746SPaolo Bonzini         }
17606e790746SPaolo Bonzini 
17616e790746SPaolo Bonzini         /* signal other side */
176251b19ebeSPaolo Bonzini         virtqueue_fill(q->rx_vq, elem, total, i++);
176351b19ebeSPaolo Bonzini         g_free(elem);
17646e790746SPaolo Bonzini     }
17656e790746SPaolo Bonzini 
17666e790746SPaolo Bonzini     if (mhdr_cnt) {
17671399c60dSRusty Russell         virtio_stw_p(vdev, &mhdr.num_buffers, i);
17686e790746SPaolo Bonzini         iov_from_buf(mhdr_sg, mhdr_cnt,
17696e790746SPaolo Bonzini                      0,
17706e790746SPaolo Bonzini                      &mhdr.num_buffers, sizeof mhdr.num_buffers);
17716e790746SPaolo Bonzini     }
17726e790746SPaolo Bonzini 
17736e790746SPaolo Bonzini     virtqueue_flush(q->rx_vq, i);
177417a0ca55SKONRAD Frederic     virtio_notify(vdev, q->rx_vq);
17756e790746SPaolo Bonzini 
17766e790746SPaolo Bonzini     return size;
17776e790746SPaolo Bonzini }
17786e790746SPaolo Bonzini 
17792974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf,
178097cd965cSPaolo Bonzini                                   size_t size)
178197cd965cSPaolo Bonzini {
1782068ddfa9SDr. David Alan Gilbert     RCU_READ_LOCK_GUARD();
178397cd965cSPaolo Bonzini 
17844474e37aSYuri Benditovich     return virtio_net_receive_rcu(nc, buf, size, false);
178597cd965cSPaolo Bonzini }
178697cd965cSPaolo Bonzini 
17872974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain,
17882974e916SYuri Benditovich                                          const uint8_t *buf,
17892974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
17902974e916SYuri Benditovich {
17912974e916SYuri Benditovich     uint16_t ip_hdrlen;
17922974e916SYuri Benditovich     struct ip_header *ip;
17932974e916SYuri Benditovich 
17942974e916SYuri Benditovich     ip = (struct ip_header *)(buf + chain->n->guest_hdr_len
17952974e916SYuri Benditovich                               + sizeof(struct eth_header));
17962974e916SYuri Benditovich     unit->ip = (void *)ip;
17972974e916SYuri Benditovich     ip_hdrlen = (ip->ip_ver_len & 0xF) << 2;
17982974e916SYuri Benditovich     unit->ip_plen = &ip->ip_len;
17992974e916SYuri Benditovich     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen);
18002974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
18012974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen;
18022974e916SYuri Benditovich }
18032974e916SYuri Benditovich 
18042974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain,
18052974e916SYuri Benditovich                                          const uint8_t *buf,
18062974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
18072974e916SYuri Benditovich {
18082974e916SYuri Benditovich     struct ip6_header *ip6;
18092974e916SYuri Benditovich 
18102974e916SYuri Benditovich     ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len
18112974e916SYuri Benditovich                                  + sizeof(struct eth_header));
18122974e916SYuri Benditovich     unit->ip = ip6;
18132974e916SYuri Benditovich     unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
181478ee6bd0SPhilippe Mathieu-Daudé     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip)
18152974e916SYuri Benditovich                                         + sizeof(struct ip6_header));
18162974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
18172974e916SYuri Benditovich 
18182974e916SYuri Benditovich     /* There is a difference between payload lenght in ipv4 and v6,
18192974e916SYuri Benditovich        ip header is excluded in ipv6 */
18202974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen;
18212974e916SYuri Benditovich }
18222974e916SYuri Benditovich 
18232974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain,
18242974e916SYuri Benditovich                                        VirtioNetRscSeg *seg)
18252974e916SYuri Benditovich {
18262974e916SYuri Benditovich     int ret;
1827dd3d85e8SYuri Benditovich     struct virtio_net_hdr_v1 *h;
18282974e916SYuri Benditovich 
1829dd3d85e8SYuri Benditovich     h = (struct virtio_net_hdr_v1 *)seg->buf;
18302974e916SYuri Benditovich     h->flags = 0;
18312974e916SYuri Benditovich     h->gso_type = VIRTIO_NET_HDR_GSO_NONE;
18322974e916SYuri Benditovich 
18332974e916SYuri Benditovich     if (seg->is_coalesced) {
1834dd3d85e8SYuri Benditovich         h->rsc.segments = seg->packets;
1835dd3d85e8SYuri Benditovich         h->rsc.dup_acks = seg->dup_ack;
18362974e916SYuri Benditovich         h->flags = VIRTIO_NET_HDR_F_RSC_INFO;
18372974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
18382974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
18392974e916SYuri Benditovich         } else {
18402974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
18412974e916SYuri Benditovich         }
18422974e916SYuri Benditovich     }
18432974e916SYuri Benditovich 
18442974e916SYuri Benditovich     ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size);
18452974e916SYuri Benditovich     QTAILQ_REMOVE(&chain->buffers, seg, next);
18462974e916SYuri Benditovich     g_free(seg->buf);
18472974e916SYuri Benditovich     g_free(seg);
18482974e916SYuri Benditovich 
18492974e916SYuri Benditovich     return ret;
18502974e916SYuri Benditovich }
18512974e916SYuri Benditovich 
18522974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq)
18532974e916SYuri Benditovich {
18542974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn;
18552974e916SYuri Benditovich     VirtioNetRscChain *chain = (VirtioNetRscChain *)opq;
18562974e916SYuri Benditovich 
18572974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) {
18582974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
18592974e916SYuri Benditovich             chain->stat.purge_failed++;
18602974e916SYuri Benditovich             continue;
18612974e916SYuri Benditovich         }
18622974e916SYuri Benditovich     }
18632974e916SYuri Benditovich 
18642974e916SYuri Benditovich     chain->stat.timer++;
18652974e916SYuri Benditovich     if (!QTAILQ_EMPTY(&chain->buffers)) {
18662974e916SYuri Benditovich         timer_mod(chain->drain_timer,
18672974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
18682974e916SYuri Benditovich     }
18692974e916SYuri Benditovich }
18702974e916SYuri Benditovich 
18712974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n)
18722974e916SYuri Benditovich {
18732974e916SYuri Benditovich     VirtioNetRscChain *chain, *rn_chain;
18742974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn_seg;
18752974e916SYuri Benditovich 
18762974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) {
18772974e916SYuri Benditovich         QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) {
18782974e916SYuri Benditovich             QTAILQ_REMOVE(&chain->buffers, seg, next);
18792974e916SYuri Benditovich             g_free(seg->buf);
18802974e916SYuri Benditovich             g_free(seg);
18812974e916SYuri Benditovich         }
18822974e916SYuri Benditovich 
18832974e916SYuri Benditovich         timer_del(chain->drain_timer);
18842974e916SYuri Benditovich         timer_free(chain->drain_timer);
18852974e916SYuri Benditovich         QTAILQ_REMOVE(&n->rsc_chains, chain, next);
18862974e916SYuri Benditovich         g_free(chain);
18872974e916SYuri Benditovich     }
18882974e916SYuri Benditovich }
18892974e916SYuri Benditovich 
18902974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain,
18912974e916SYuri Benditovich                                      NetClientState *nc,
18922974e916SYuri Benditovich                                      const uint8_t *buf, size_t size)
18932974e916SYuri Benditovich {
18942974e916SYuri Benditovich     uint16_t hdr_len;
18952974e916SYuri Benditovich     VirtioNetRscSeg *seg;
18962974e916SYuri Benditovich 
18972974e916SYuri Benditovich     hdr_len = chain->n->guest_hdr_len;
18982974e916SYuri Benditovich     seg = g_malloc(sizeof(VirtioNetRscSeg));
18992974e916SYuri Benditovich     seg->buf = g_malloc(hdr_len + sizeof(struct eth_header)
19002974e916SYuri Benditovich         + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD);
19012974e916SYuri Benditovich     memcpy(seg->buf, buf, size);
19022974e916SYuri Benditovich     seg->size = size;
19032974e916SYuri Benditovich     seg->packets = 1;
19042974e916SYuri Benditovich     seg->dup_ack = 0;
19052974e916SYuri Benditovich     seg->is_coalesced = 0;
19062974e916SYuri Benditovich     seg->nc = nc;
19072974e916SYuri Benditovich 
19082974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&chain->buffers, seg, next);
19092974e916SYuri Benditovich     chain->stat.cache++;
19102974e916SYuri Benditovich 
19112974e916SYuri Benditovich     switch (chain->proto) {
19122974e916SYuri Benditovich     case ETH_P_IP:
19132974e916SYuri Benditovich         virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit);
19142974e916SYuri Benditovich         break;
19152974e916SYuri Benditovich     case ETH_P_IPV6:
19162974e916SYuri Benditovich         virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit);
19172974e916SYuri Benditovich         break;
19182974e916SYuri Benditovich     default:
19192974e916SYuri Benditovich         g_assert_not_reached();
19202974e916SYuri Benditovich     }
19212974e916SYuri Benditovich }
19222974e916SYuri Benditovich 
19232974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain,
19242974e916SYuri Benditovich                                          VirtioNetRscSeg *seg,
19252974e916SYuri Benditovich                                          const uint8_t *buf,
19262974e916SYuri Benditovich                                          struct tcp_header *n_tcp,
19272974e916SYuri Benditovich                                          struct tcp_header *o_tcp)
19282974e916SYuri Benditovich {
19292974e916SYuri Benditovich     uint32_t nack, oack;
19302974e916SYuri Benditovich     uint16_t nwin, owin;
19312974e916SYuri Benditovich 
19322974e916SYuri Benditovich     nack = htonl(n_tcp->th_ack);
19332974e916SYuri Benditovich     nwin = htons(n_tcp->th_win);
19342974e916SYuri Benditovich     oack = htonl(o_tcp->th_ack);
19352974e916SYuri Benditovich     owin = htons(o_tcp->th_win);
19362974e916SYuri Benditovich 
19372974e916SYuri Benditovich     if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) {
19382974e916SYuri Benditovich         chain->stat.ack_out_of_win++;
19392974e916SYuri Benditovich         return RSC_FINAL;
19402974e916SYuri Benditovich     } else if (nack == oack) {
19412974e916SYuri Benditovich         /* duplicated ack or window probe */
19422974e916SYuri Benditovich         if (nwin == owin) {
19432974e916SYuri Benditovich             /* duplicated ack, add dup ack count due to whql test up to 1 */
19442974e916SYuri Benditovich             chain->stat.dup_ack++;
19452974e916SYuri Benditovich             return RSC_FINAL;
19462974e916SYuri Benditovich         } else {
19472974e916SYuri Benditovich             /* Coalesce window update */
19482974e916SYuri Benditovich             o_tcp->th_win = n_tcp->th_win;
19492974e916SYuri Benditovich             chain->stat.win_update++;
19502974e916SYuri Benditovich             return RSC_COALESCE;
19512974e916SYuri Benditovich         }
19522974e916SYuri Benditovich     } else {
19532974e916SYuri Benditovich         /* pure ack, go to 'C', finalize*/
19542974e916SYuri Benditovich         chain->stat.pure_ack++;
19552974e916SYuri Benditovich         return RSC_FINAL;
19562974e916SYuri Benditovich     }
19572974e916SYuri Benditovich }
19582974e916SYuri Benditovich 
19592974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain,
19602974e916SYuri Benditovich                                             VirtioNetRscSeg *seg,
19612974e916SYuri Benditovich                                             const uint8_t *buf,
19622974e916SYuri Benditovich                                             VirtioNetRscUnit *n_unit)
19632974e916SYuri Benditovich {
19642974e916SYuri Benditovich     void *data;
19652974e916SYuri Benditovich     uint16_t o_ip_len;
19662974e916SYuri Benditovich     uint32_t nseq, oseq;
19672974e916SYuri Benditovich     VirtioNetRscUnit *o_unit;
19682974e916SYuri Benditovich 
19692974e916SYuri Benditovich     o_unit = &seg->unit;
19702974e916SYuri Benditovich     o_ip_len = htons(*o_unit->ip_plen);
19712974e916SYuri Benditovich     nseq = htonl(n_unit->tcp->th_seq);
19722974e916SYuri Benditovich     oseq = htonl(o_unit->tcp->th_seq);
19732974e916SYuri Benditovich 
19742974e916SYuri Benditovich     /* out of order or retransmitted. */
19752974e916SYuri Benditovich     if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) {
19762974e916SYuri Benditovich         chain->stat.data_out_of_win++;
19772974e916SYuri Benditovich         return RSC_FINAL;
19782974e916SYuri Benditovich     }
19792974e916SYuri Benditovich 
19802974e916SYuri Benditovich     data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen;
19812974e916SYuri Benditovich     if (nseq == oseq) {
19822974e916SYuri Benditovich         if ((o_unit->payload == 0) && n_unit->payload) {
19832974e916SYuri Benditovich             /* From no payload to payload, normal case, not a dup ack or etc */
19842974e916SYuri Benditovich             chain->stat.data_after_pure_ack++;
19852974e916SYuri Benditovich             goto coalesce;
19862974e916SYuri Benditovich         } else {
19872974e916SYuri Benditovich             return virtio_net_rsc_handle_ack(chain, seg, buf,
19882974e916SYuri Benditovich                                              n_unit->tcp, o_unit->tcp);
19892974e916SYuri Benditovich         }
19902974e916SYuri Benditovich     } else if ((nseq - oseq) != o_unit->payload) {
19912974e916SYuri Benditovich         /* Not a consistent packet, out of order */
19922974e916SYuri Benditovich         chain->stat.data_out_of_order++;
19932974e916SYuri Benditovich         return RSC_FINAL;
19942974e916SYuri Benditovich     } else {
19952974e916SYuri Benditovich coalesce:
19962974e916SYuri Benditovich         if ((o_ip_len + n_unit->payload) > chain->max_payload) {
19972974e916SYuri Benditovich             chain->stat.over_size++;
19982974e916SYuri Benditovich             return RSC_FINAL;
19992974e916SYuri Benditovich         }
20002974e916SYuri Benditovich 
20012974e916SYuri Benditovich         /* Here comes the right data, the payload length in v4/v6 is different,
20022974e916SYuri Benditovich            so use the field value to update and record the new data len */
20032974e916SYuri Benditovich         o_unit->payload += n_unit->payload; /* update new data len */
20042974e916SYuri Benditovich 
20052974e916SYuri Benditovich         /* update field in ip header */
20062974e916SYuri Benditovich         *o_unit->ip_plen = htons(o_ip_len + n_unit->payload);
20072974e916SYuri Benditovich 
20082974e916SYuri Benditovich         /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced
20092974e916SYuri Benditovich            for windows guest, while this may change the behavior for linux
20102974e916SYuri Benditovich            guest (only if it uses RSC feature). */
20112974e916SYuri Benditovich         o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags;
20122974e916SYuri Benditovich 
20132974e916SYuri Benditovich         o_unit->tcp->th_ack = n_unit->tcp->th_ack;
20142974e916SYuri Benditovich         o_unit->tcp->th_win = n_unit->tcp->th_win;
20152974e916SYuri Benditovich 
20162974e916SYuri Benditovich         memmove(seg->buf + seg->size, data, n_unit->payload);
20172974e916SYuri Benditovich         seg->size += n_unit->payload;
20182974e916SYuri Benditovich         seg->packets++;
20192974e916SYuri Benditovich         chain->stat.coalesced++;
20202974e916SYuri Benditovich         return RSC_COALESCE;
20212974e916SYuri Benditovich     }
20222974e916SYuri Benditovich }
20232974e916SYuri Benditovich 
20242974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain,
20252974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
20262974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
20272974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
20282974e916SYuri Benditovich {
20292974e916SYuri Benditovich     struct ip_header *ip1, *ip2;
20302974e916SYuri Benditovich 
20312974e916SYuri Benditovich     ip1 = (struct ip_header *)(unit->ip);
20322974e916SYuri Benditovich     ip2 = (struct ip_header *)(seg->unit.ip);
20332974e916SYuri Benditovich     if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst)
20342974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
20352974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
20362974e916SYuri Benditovich         chain->stat.no_match++;
20372974e916SYuri Benditovich         return RSC_NO_MATCH;
20382974e916SYuri Benditovich     }
20392974e916SYuri Benditovich 
20402974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
20412974e916SYuri Benditovich }
20422974e916SYuri Benditovich 
20432974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain,
20442974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
20452974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
20462974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
20472974e916SYuri Benditovich {
20482974e916SYuri Benditovich     struct ip6_header *ip1, *ip2;
20492974e916SYuri Benditovich 
20502974e916SYuri Benditovich     ip1 = (struct ip6_header *)(unit->ip);
20512974e916SYuri Benditovich     ip2 = (struct ip6_header *)(seg->unit.ip);
20522974e916SYuri Benditovich     if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address))
20532974e916SYuri Benditovich         || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address))
20542974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
20552974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
20562974e916SYuri Benditovich             chain->stat.no_match++;
20572974e916SYuri Benditovich             return RSC_NO_MATCH;
20582974e916SYuri Benditovich     }
20592974e916SYuri Benditovich 
20602974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
20612974e916SYuri Benditovich }
20622974e916SYuri Benditovich 
20632974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain
20642974e916SYuri Benditovich  * to prevent out of order */
20652974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain,
20662974e916SYuri Benditovich                                          struct tcp_header *tcp)
20672974e916SYuri Benditovich {
20682974e916SYuri Benditovich     uint16_t tcp_hdr;
20692974e916SYuri Benditovich     uint16_t tcp_flag;
20702974e916SYuri Benditovich 
20712974e916SYuri Benditovich     tcp_flag = htons(tcp->th_offset_flags);
20722974e916SYuri Benditovich     tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10;
20732974e916SYuri Benditovich     tcp_flag &= VIRTIO_NET_TCP_FLAG;
20742974e916SYuri Benditovich     if (tcp_flag & TH_SYN) {
20752974e916SYuri Benditovich         chain->stat.tcp_syn++;
20762974e916SYuri Benditovich         return RSC_BYPASS;
20772974e916SYuri Benditovich     }
20782974e916SYuri Benditovich 
20792974e916SYuri Benditovich     if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) {
20802974e916SYuri Benditovich         chain->stat.tcp_ctrl_drain++;
20812974e916SYuri Benditovich         return RSC_FINAL;
20822974e916SYuri Benditovich     }
20832974e916SYuri Benditovich 
20842974e916SYuri Benditovich     if (tcp_hdr > sizeof(struct tcp_header)) {
20852974e916SYuri Benditovich         chain->stat.tcp_all_opt++;
20862974e916SYuri Benditovich         return RSC_FINAL;
20872974e916SYuri Benditovich     }
20882974e916SYuri Benditovich 
20892974e916SYuri Benditovich     return RSC_CANDIDATE;
20902974e916SYuri Benditovich }
20912974e916SYuri Benditovich 
20922974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain,
20932974e916SYuri Benditovich                                          NetClientState *nc,
20942974e916SYuri Benditovich                                          const uint8_t *buf, size_t size,
20952974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
20962974e916SYuri Benditovich {
20972974e916SYuri Benditovich     int ret;
20982974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
20992974e916SYuri Benditovich 
21002974e916SYuri Benditovich     if (QTAILQ_EMPTY(&chain->buffers)) {
21012974e916SYuri Benditovich         chain->stat.empty_cache++;
21022974e916SYuri Benditovich         virtio_net_rsc_cache_buf(chain, nc, buf, size);
21032974e916SYuri Benditovich         timer_mod(chain->drain_timer,
21042974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
21052974e916SYuri Benditovich         return size;
21062974e916SYuri Benditovich     }
21072974e916SYuri Benditovich 
21082974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
21092974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
21102974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit);
21112974e916SYuri Benditovich         } else {
21122974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit);
21132974e916SYuri Benditovich         }
21142974e916SYuri Benditovich 
21152974e916SYuri Benditovich         if (ret == RSC_FINAL) {
21162974e916SYuri Benditovich             if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
21172974e916SYuri Benditovich                 /* Send failed */
21182974e916SYuri Benditovich                 chain->stat.final_failed++;
21192974e916SYuri Benditovich                 return 0;
21202974e916SYuri Benditovich             }
21212974e916SYuri Benditovich 
21222974e916SYuri Benditovich             /* Send current packet */
21232974e916SYuri Benditovich             return virtio_net_do_receive(nc, buf, size);
21242974e916SYuri Benditovich         } else if (ret == RSC_NO_MATCH) {
21252974e916SYuri Benditovich             continue;
21262974e916SYuri Benditovich         } else {
21272974e916SYuri Benditovich             /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */
21282974e916SYuri Benditovich             seg->is_coalesced = 1;
21292974e916SYuri Benditovich             return size;
21302974e916SYuri Benditovich         }
21312974e916SYuri Benditovich     }
21322974e916SYuri Benditovich 
21332974e916SYuri Benditovich     chain->stat.no_match_cache++;
21342974e916SYuri Benditovich     virtio_net_rsc_cache_buf(chain, nc, buf, size);
21352974e916SYuri Benditovich     return size;
21362974e916SYuri Benditovich }
21372974e916SYuri Benditovich 
21382974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */
21392974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain,
21402974e916SYuri Benditovich                                         NetClientState *nc,
21412974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
21422974e916SYuri Benditovich                                         uint16_t ip_start, uint16_t ip_size,
21432974e916SYuri Benditovich                                         uint16_t tcp_port)
21442974e916SYuri Benditovich {
21452974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
21462974e916SYuri Benditovich     uint32_t ppair1, ppair2;
21472974e916SYuri Benditovich 
21482974e916SYuri Benditovich     ppair1 = *(uint32_t *)(buf + tcp_port);
21492974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
21502974e916SYuri Benditovich         ppair2 = *(uint32_t *)(seg->buf + tcp_port);
21512974e916SYuri Benditovich         if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size)
21522974e916SYuri Benditovich             || (ppair1 != ppair2)) {
21532974e916SYuri Benditovich             continue;
21542974e916SYuri Benditovich         }
21552974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
21562974e916SYuri Benditovich             chain->stat.drain_failed++;
21572974e916SYuri Benditovich         }
21582974e916SYuri Benditovich 
21592974e916SYuri Benditovich         break;
21602974e916SYuri Benditovich     }
21612974e916SYuri Benditovich 
21622974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
21632974e916SYuri Benditovich }
21642974e916SYuri Benditovich 
21652974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain,
21662974e916SYuri Benditovich                                             struct ip_header *ip,
21672974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
21682974e916SYuri Benditovich {
21692974e916SYuri Benditovich     uint16_t ip_len;
21702974e916SYuri Benditovich 
21712974e916SYuri Benditovich     /* Not an ipv4 packet */
21722974e916SYuri Benditovich     if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) {
21732974e916SYuri Benditovich         chain->stat.ip_option++;
21742974e916SYuri Benditovich         return RSC_BYPASS;
21752974e916SYuri Benditovich     }
21762974e916SYuri Benditovich 
21772974e916SYuri Benditovich     /* Don't handle packets with ip option */
21782974e916SYuri Benditovich     if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) {
21792974e916SYuri Benditovich         chain->stat.ip_option++;
21802974e916SYuri Benditovich         return RSC_BYPASS;
21812974e916SYuri Benditovich     }
21822974e916SYuri Benditovich 
21832974e916SYuri Benditovich     if (ip->ip_p != IPPROTO_TCP) {
21842974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
21852974e916SYuri Benditovich         return RSC_BYPASS;
21862974e916SYuri Benditovich     }
21872974e916SYuri Benditovich 
21882974e916SYuri Benditovich     /* Don't handle packets with ip fragment */
21892974e916SYuri Benditovich     if (!(htons(ip->ip_off) & IP_DF)) {
21902974e916SYuri Benditovich         chain->stat.ip_frag++;
21912974e916SYuri Benditovich         return RSC_BYPASS;
21922974e916SYuri Benditovich     }
21932974e916SYuri Benditovich 
21942974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
21952974e916SYuri Benditovich     if (IPTOS_ECN(ip->ip_tos)) {
21962974e916SYuri Benditovich         chain->stat.ip_ecn++;
21972974e916SYuri Benditovich         return RSC_BYPASS;
21982974e916SYuri Benditovich     }
21992974e916SYuri Benditovich 
22002974e916SYuri Benditovich     ip_len = htons(ip->ip_len);
22012974e916SYuri Benditovich     if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header))
22022974e916SYuri Benditovich         || ip_len > (size - chain->n->guest_hdr_len -
22032974e916SYuri Benditovich                      sizeof(struct eth_header))) {
22042974e916SYuri Benditovich         chain->stat.ip_hacked++;
22052974e916SYuri Benditovich         return RSC_BYPASS;
22062974e916SYuri Benditovich     }
22072974e916SYuri Benditovich 
22082974e916SYuri Benditovich     return RSC_CANDIDATE;
22092974e916SYuri Benditovich }
22102974e916SYuri Benditovich 
22112974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain,
22122974e916SYuri Benditovich                                       NetClientState *nc,
22132974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
22142974e916SYuri Benditovich {
22152974e916SYuri Benditovich     int32_t ret;
22162974e916SYuri Benditovich     uint16_t hdr_len;
22172974e916SYuri Benditovich     VirtioNetRscUnit unit;
22182974e916SYuri Benditovich 
22192974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
22202974e916SYuri Benditovich 
22212974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)
22222974e916SYuri Benditovich         + sizeof(struct tcp_header))) {
22232974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
22242974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22252974e916SYuri Benditovich     }
22262974e916SYuri Benditovich 
22272974e916SYuri Benditovich     virtio_net_rsc_extract_unit4(chain, buf, &unit);
22282974e916SYuri Benditovich     if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size)
22292974e916SYuri Benditovich         != RSC_CANDIDATE) {
22302974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22312974e916SYuri Benditovich     }
22322974e916SYuri Benditovich 
22332974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
22342974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
22352974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22362974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
22372974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
22382974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 12),
22392974e916SYuri Benditovich                 VIRTIO_NET_IP4_ADDR_SIZE,
22402974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header));
22412974e916SYuri Benditovich     }
22422974e916SYuri Benditovich 
22432974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
22442974e916SYuri Benditovich }
22452974e916SYuri Benditovich 
22462974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain,
22472974e916SYuri Benditovich                                             struct ip6_header *ip6,
22482974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
22492974e916SYuri Benditovich {
22502974e916SYuri Benditovich     uint16_t ip_len;
22512974e916SYuri Benditovich 
22522974e916SYuri Benditovich     if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4)
22532974e916SYuri Benditovich         != IP_HEADER_VERSION_6) {
22542974e916SYuri Benditovich         return RSC_BYPASS;
22552974e916SYuri Benditovich     }
22562974e916SYuri Benditovich 
22572974e916SYuri Benditovich     /* Both option and protocol is checked in this */
22582974e916SYuri Benditovich     if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) {
22592974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
22602974e916SYuri Benditovich         return RSC_BYPASS;
22612974e916SYuri Benditovich     }
22622974e916SYuri Benditovich 
22632974e916SYuri Benditovich     ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
22642974e916SYuri Benditovich     if (ip_len < sizeof(struct tcp_header) ||
22652974e916SYuri Benditovich         ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header)
22662974e916SYuri Benditovich                   - sizeof(struct ip6_header))) {
22672974e916SYuri Benditovich         chain->stat.ip_hacked++;
22682974e916SYuri Benditovich         return RSC_BYPASS;
22692974e916SYuri Benditovich     }
22702974e916SYuri Benditovich 
22712974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
22722974e916SYuri Benditovich     if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) {
22732974e916SYuri Benditovich         chain->stat.ip_ecn++;
22742974e916SYuri Benditovich         return RSC_BYPASS;
22752974e916SYuri Benditovich     }
22762974e916SYuri Benditovich 
22772974e916SYuri Benditovich     return RSC_CANDIDATE;
22782974e916SYuri Benditovich }
22792974e916SYuri Benditovich 
22802974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc,
22812974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
22822974e916SYuri Benditovich {
22832974e916SYuri Benditovich     int32_t ret;
22842974e916SYuri Benditovich     uint16_t hdr_len;
22852974e916SYuri Benditovich     VirtioNetRscChain *chain;
22862974e916SYuri Benditovich     VirtioNetRscUnit unit;
22872974e916SYuri Benditovich 
22882974e916SYuri Benditovich     chain = (VirtioNetRscChain *)opq;
22892974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
22902974e916SYuri Benditovich 
22912974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header)
22922974e916SYuri Benditovich         + sizeof(tcp_header))) {
22932974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22942974e916SYuri Benditovich     }
22952974e916SYuri Benditovich 
22962974e916SYuri Benditovich     virtio_net_rsc_extract_unit6(chain, buf, &unit);
22972974e916SYuri Benditovich     if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain,
22982974e916SYuri Benditovich                                                  unit.ip, buf, size)) {
22992974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23002974e916SYuri Benditovich     }
23012974e916SYuri Benditovich 
23022974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
23032974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
23042974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23052974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
23062974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
23072974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 8),
23082974e916SYuri Benditovich                 VIRTIO_NET_IP6_ADDR_SIZE,
23092974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header)
23102974e916SYuri Benditovich                 + sizeof(struct ip6_header));
23112974e916SYuri Benditovich     }
23122974e916SYuri Benditovich 
23132974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
23142974e916SYuri Benditovich }
23152974e916SYuri Benditovich 
23162974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n,
23172974e916SYuri Benditovich                                                       NetClientState *nc,
23182974e916SYuri Benditovich                                                       uint16_t proto)
23192974e916SYuri Benditovich {
23202974e916SYuri Benditovich     VirtioNetRscChain *chain;
23212974e916SYuri Benditovich 
23222974e916SYuri Benditovich     if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) {
23232974e916SYuri Benditovich         return NULL;
23242974e916SYuri Benditovich     }
23252974e916SYuri Benditovich 
23262974e916SYuri Benditovich     QTAILQ_FOREACH(chain, &n->rsc_chains, next) {
23272974e916SYuri Benditovich         if (chain->proto == proto) {
23282974e916SYuri Benditovich             return chain;
23292974e916SYuri Benditovich         }
23302974e916SYuri Benditovich     }
23312974e916SYuri Benditovich 
23322974e916SYuri Benditovich     chain = g_malloc(sizeof(*chain));
23332974e916SYuri Benditovich     chain->n = n;
23342974e916SYuri Benditovich     chain->proto = proto;
23352974e916SYuri Benditovich     if (proto == (uint16_t)ETH_P_IP) {
23362974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD;
23372974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
23382974e916SYuri Benditovich     } else {
23392974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD;
23402974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
23412974e916SYuri Benditovich     }
23422974e916SYuri Benditovich     chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST,
23432974e916SYuri Benditovich                                       virtio_net_rsc_purge, chain);
23442974e916SYuri Benditovich     memset(&chain->stat, 0, sizeof(chain->stat));
23452974e916SYuri Benditovich 
23462974e916SYuri Benditovich     QTAILQ_INIT(&chain->buffers);
23472974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next);
23482974e916SYuri Benditovich 
23492974e916SYuri Benditovich     return chain;
23502974e916SYuri Benditovich }
23512974e916SYuri Benditovich 
23522974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc,
23532974e916SYuri Benditovich                                       const uint8_t *buf,
23542974e916SYuri Benditovich                                       size_t size)
23552974e916SYuri Benditovich {
23562974e916SYuri Benditovich     uint16_t proto;
23572974e916SYuri Benditovich     VirtioNetRscChain *chain;
23582974e916SYuri Benditovich     struct eth_header *eth;
23592974e916SYuri Benditovich     VirtIONet *n;
23602974e916SYuri Benditovich 
23612974e916SYuri Benditovich     n = qemu_get_nic_opaque(nc);
23622974e916SYuri Benditovich     if (size < (n->host_hdr_len + sizeof(struct eth_header))) {
23632974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23642974e916SYuri Benditovich     }
23652974e916SYuri Benditovich 
23662974e916SYuri Benditovich     eth = (struct eth_header *)(buf + n->guest_hdr_len);
23672974e916SYuri Benditovich     proto = htons(eth->h_proto);
23682974e916SYuri Benditovich 
23692974e916SYuri Benditovich     chain = virtio_net_rsc_lookup_chain(n, nc, proto);
23702974e916SYuri Benditovich     if (chain) {
23712974e916SYuri Benditovich         chain->stat.received++;
23722974e916SYuri Benditovich         if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) {
23732974e916SYuri Benditovich             return virtio_net_rsc_receive4(chain, nc, buf, size);
23742974e916SYuri Benditovich         } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) {
23752974e916SYuri Benditovich             return virtio_net_rsc_receive6(chain, nc, buf, size);
23762974e916SYuri Benditovich         }
23772974e916SYuri Benditovich     }
23782974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
23792974e916SYuri Benditovich }
23802974e916SYuri Benditovich 
23812974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf,
23822974e916SYuri Benditovich                                   size_t size)
23832974e916SYuri Benditovich {
23842974e916SYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
23852974e916SYuri Benditovich     if ((n->rsc4_enabled || n->rsc6_enabled)) {
23862974e916SYuri Benditovich         return virtio_net_rsc_receive(nc, buf, size);
23872974e916SYuri Benditovich     } else {
23882974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23892974e916SYuri Benditovich     }
23902974e916SYuri Benditovich }
23912974e916SYuri Benditovich 
23926e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
23936e790746SPaolo Bonzini 
23946e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
23956e790746SPaolo Bonzini {
23966e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
23976e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
239817a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
23996e790746SPaolo Bonzini 
240051b19ebeSPaolo Bonzini     virtqueue_push(q->tx_vq, q->async_tx.elem, 0);
240117a0ca55SKONRAD Frederic     virtio_notify(vdev, q->tx_vq);
24026e790746SPaolo Bonzini 
240351b19ebeSPaolo Bonzini     g_free(q->async_tx.elem);
240451b19ebeSPaolo Bonzini     q->async_tx.elem = NULL;
24056e790746SPaolo Bonzini 
24066e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
24076e790746SPaolo Bonzini     virtio_net_flush_tx(q);
24086e790746SPaolo Bonzini }
24096e790746SPaolo Bonzini 
24106e790746SPaolo Bonzini /* TX */
24116e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
24126e790746SPaolo Bonzini {
24136e790746SPaolo Bonzini     VirtIONet *n = q->n;
241417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
241551b19ebeSPaolo Bonzini     VirtQueueElement *elem;
24166e790746SPaolo Bonzini     int32_t num_packets = 0;
24176e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
241817a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
24196e790746SPaolo Bonzini         return num_packets;
24206e790746SPaolo Bonzini     }
24216e790746SPaolo Bonzini 
242251b19ebeSPaolo Bonzini     if (q->async_tx.elem) {
24236e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
24246e790746SPaolo Bonzini         return num_packets;
24256e790746SPaolo Bonzini     }
24266e790746SPaolo Bonzini 
242751b19ebeSPaolo Bonzini     for (;;) {
2428bd89dd98SJason Wang         ssize_t ret;
242951b19ebeSPaolo Bonzini         unsigned int out_num;
243051b19ebeSPaolo Bonzini         struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg;
2431feb93f36SJason Wang         struct virtio_net_hdr_mrg_rxbuf mhdr;
24326e790746SPaolo Bonzini 
243351b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement));
243451b19ebeSPaolo Bonzini         if (!elem) {
243551b19ebeSPaolo Bonzini             break;
243651b19ebeSPaolo Bonzini         }
243751b19ebeSPaolo Bonzini 
243851b19ebeSPaolo Bonzini         out_num = elem->out_num;
243951b19ebeSPaolo Bonzini         out_sg = elem->out_sg;
24406e790746SPaolo Bonzini         if (out_num < 1) {
2441fa5e56c2SGreg Kurz             virtio_error(vdev, "virtio-net header not in first element");
2442fa5e56c2SGreg Kurz             virtqueue_detach_element(q->tx_vq, elem, 0);
2443fa5e56c2SGreg Kurz             g_free(elem);
2444fa5e56c2SGreg Kurz             return -EINVAL;
24456e790746SPaolo Bonzini         }
24466e790746SPaolo Bonzini 
2447032a74a1SCédric Le Goater         if (n->has_vnet_hdr) {
2448feb93f36SJason Wang             if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) <
2449feb93f36SJason Wang                 n->guest_hdr_len) {
2450fa5e56c2SGreg Kurz                 virtio_error(vdev, "virtio-net header incorrect");
2451fa5e56c2SGreg Kurz                 virtqueue_detach_element(q->tx_vq, elem, 0);
2452fa5e56c2SGreg Kurz                 g_free(elem);
2453fa5e56c2SGreg Kurz                 return -EINVAL;
2454032a74a1SCédric Le Goater             }
24551bfa316cSGreg Kurz             if (n->needs_vnet_hdr_swap) {
2456feb93f36SJason Wang                 virtio_net_hdr_swap(vdev, (void *) &mhdr);
2457feb93f36SJason Wang                 sg2[0].iov_base = &mhdr;
2458feb93f36SJason Wang                 sg2[0].iov_len = n->guest_hdr_len;
2459feb93f36SJason Wang                 out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1,
2460feb93f36SJason Wang                                    out_sg, out_num,
2461feb93f36SJason Wang                                    n->guest_hdr_len, -1);
2462feb93f36SJason Wang                 if (out_num == VIRTQUEUE_MAX_SIZE) {
2463feb93f36SJason Wang                     goto drop;
2464032a74a1SCédric Le Goater                 }
2465feb93f36SJason Wang                 out_num += 1;
2466feb93f36SJason Wang                 out_sg = sg2;
2467feb93f36SJason Wang             }
2468feb93f36SJason Wang         }
24696e790746SPaolo Bonzini         /*
24706e790746SPaolo Bonzini          * If host wants to see the guest header as is, we can
24716e790746SPaolo Bonzini          * pass it on unchanged. Otherwise, copy just the parts
24726e790746SPaolo Bonzini          * that host is interested in.
24736e790746SPaolo Bonzini          */
24746e790746SPaolo Bonzini         assert(n->host_hdr_len <= n->guest_hdr_len);
24756e790746SPaolo Bonzini         if (n->host_hdr_len != n->guest_hdr_len) {
24766e790746SPaolo Bonzini             unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
24776e790746SPaolo Bonzini                                        out_sg, out_num,
24786e790746SPaolo Bonzini                                        0, n->host_hdr_len);
24796e790746SPaolo Bonzini             sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
24806e790746SPaolo Bonzini                              out_sg, out_num,
24816e790746SPaolo Bonzini                              n->guest_hdr_len, -1);
24826e790746SPaolo Bonzini             out_num = sg_num;
24836e790746SPaolo Bonzini             out_sg = sg;
24846e790746SPaolo Bonzini         }
24856e790746SPaolo Bonzini 
24866e790746SPaolo Bonzini         ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
24876e790746SPaolo Bonzini                                       out_sg, out_num, virtio_net_tx_complete);
24886e790746SPaolo Bonzini         if (ret == 0) {
24896e790746SPaolo Bonzini             virtio_queue_set_notification(q->tx_vq, 0);
24906e790746SPaolo Bonzini             q->async_tx.elem = elem;
24916e790746SPaolo Bonzini             return -EBUSY;
24926e790746SPaolo Bonzini         }
24936e790746SPaolo Bonzini 
2494feb93f36SJason Wang drop:
249551b19ebeSPaolo Bonzini         virtqueue_push(q->tx_vq, elem, 0);
249617a0ca55SKONRAD Frederic         virtio_notify(vdev, q->tx_vq);
249751b19ebeSPaolo Bonzini         g_free(elem);
24986e790746SPaolo Bonzini 
24996e790746SPaolo Bonzini         if (++num_packets >= n->tx_burst) {
25006e790746SPaolo Bonzini             break;
25016e790746SPaolo Bonzini         }
25026e790746SPaolo Bonzini     }
25036e790746SPaolo Bonzini     return num_packets;
25046e790746SPaolo Bonzini }
25056e790746SPaolo Bonzini 
25066e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
25076e790746SPaolo Bonzini {
250817a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
25096e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
25106e790746SPaolo Bonzini 
2511283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2512283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2513283e2c2aSYuri Benditovich         return;
2514283e2c2aSYuri Benditovich     }
2515283e2c2aSYuri Benditovich 
25166e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
251717a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
25186e790746SPaolo Bonzini         q->tx_waiting = 1;
25196e790746SPaolo Bonzini         return;
25206e790746SPaolo Bonzini     }
25216e790746SPaolo Bonzini 
25226e790746SPaolo Bonzini     if (q->tx_waiting) {
25236e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 1);
2524bc72ad67SAlex Bligh         timer_del(q->tx_timer);
25256e790746SPaolo Bonzini         q->tx_waiting = 0;
2526fa5e56c2SGreg Kurz         if (virtio_net_flush_tx(q) == -EINVAL) {
2527fa5e56c2SGreg Kurz             return;
2528fa5e56c2SGreg Kurz         }
25296e790746SPaolo Bonzini     } else {
2530bc72ad67SAlex Bligh         timer_mod(q->tx_timer,
2531bc72ad67SAlex Bligh                        qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
25326e790746SPaolo Bonzini         q->tx_waiting = 1;
25336e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 0);
25346e790746SPaolo Bonzini     }
25356e790746SPaolo Bonzini }
25366e790746SPaolo Bonzini 
25376e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
25386e790746SPaolo Bonzini {
253917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
25406e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
25416e790746SPaolo Bonzini 
2542283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2543283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2544283e2c2aSYuri Benditovich         return;
2545283e2c2aSYuri Benditovich     }
2546283e2c2aSYuri Benditovich 
25476e790746SPaolo Bonzini     if (unlikely(q->tx_waiting)) {
25486e790746SPaolo Bonzini         return;
25496e790746SPaolo Bonzini     }
25506e790746SPaolo Bonzini     q->tx_waiting = 1;
25516e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
255217a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
25536e790746SPaolo Bonzini         return;
25546e790746SPaolo Bonzini     }
25556e790746SPaolo Bonzini     virtio_queue_set_notification(vq, 0);
25566e790746SPaolo Bonzini     qemu_bh_schedule(q->tx_bh);
25576e790746SPaolo Bonzini }
25586e790746SPaolo Bonzini 
25596e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque)
25606e790746SPaolo Bonzini {
25616e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
25626e790746SPaolo Bonzini     VirtIONet *n = q->n;
256317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2564e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2565e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2566e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2567e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2568e8bcf842SMichael S. Tsirkin         return;
2569e8bcf842SMichael S. Tsirkin     }
25706e790746SPaolo Bonzini 
25716e790746SPaolo Bonzini     q->tx_waiting = 0;
25726e790746SPaolo Bonzini 
25736e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
257417a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
25756e790746SPaolo Bonzini         return;
257617a0ca55SKONRAD Frederic     }
25776e790746SPaolo Bonzini 
25786e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
25796e790746SPaolo Bonzini     virtio_net_flush_tx(q);
25806e790746SPaolo Bonzini }
25816e790746SPaolo Bonzini 
25826e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque)
25836e790746SPaolo Bonzini {
25846e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
25856e790746SPaolo Bonzini     VirtIONet *n = q->n;
258617a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
25876e790746SPaolo Bonzini     int32_t ret;
25886e790746SPaolo Bonzini 
2589e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2590e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2591e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2592e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2593e8bcf842SMichael S. Tsirkin         return;
2594e8bcf842SMichael S. Tsirkin     }
25956e790746SPaolo Bonzini 
25966e790746SPaolo Bonzini     q->tx_waiting = 0;
25976e790746SPaolo Bonzini 
25986e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
259917a0ca55SKONRAD Frederic     if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
26006e790746SPaolo Bonzini         return;
260117a0ca55SKONRAD Frederic     }
26026e790746SPaolo Bonzini 
26036e790746SPaolo Bonzini     ret = virtio_net_flush_tx(q);
2604fa5e56c2SGreg Kurz     if (ret == -EBUSY || ret == -EINVAL) {
2605fa5e56c2SGreg Kurz         return; /* Notification re-enable handled by tx_complete or device
2606fa5e56c2SGreg Kurz                  * broken */
26076e790746SPaolo Bonzini     }
26086e790746SPaolo Bonzini 
26096e790746SPaolo Bonzini     /* If we flush a full burst of packets, assume there are
26106e790746SPaolo Bonzini      * more coming and immediately reschedule */
26116e790746SPaolo Bonzini     if (ret >= n->tx_burst) {
26126e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
26136e790746SPaolo Bonzini         q->tx_waiting = 1;
26146e790746SPaolo Bonzini         return;
26156e790746SPaolo Bonzini     }
26166e790746SPaolo Bonzini 
26176e790746SPaolo Bonzini     /* If less than a full burst, re-enable notification and flush
26186e790746SPaolo Bonzini      * anything that may have come in while we weren't looking.  If
26196e790746SPaolo Bonzini      * we find something, assume the guest is still active and reschedule */
26206e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2621fa5e56c2SGreg Kurz     ret = virtio_net_flush_tx(q);
2622fa5e56c2SGreg Kurz     if (ret == -EINVAL) {
2623fa5e56c2SGreg Kurz         return;
2624fa5e56c2SGreg Kurz     } else if (ret > 0) {
26256e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
26266e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
26276e790746SPaolo Bonzini         q->tx_waiting = 1;
26286e790746SPaolo Bonzini     }
26296e790746SPaolo Bonzini }
26306e790746SPaolo Bonzini 
2631f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index)
2632f9d6dbf0SWen Congyang {
2633f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2634f9d6dbf0SWen Congyang 
26351c0fbfa3SMichael S. Tsirkin     n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size,
26361c0fbfa3SMichael S. Tsirkin                                            virtio_net_handle_rx);
26379b02e161SWei Wang 
2638f9d6dbf0SWen Congyang     if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
2639f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
26409b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
26419b02e161SWei Wang                              virtio_net_handle_tx_timer);
2642f9d6dbf0SWen Congyang         n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
2643f9d6dbf0SWen Congyang                                               virtio_net_tx_timer,
2644f9d6dbf0SWen Congyang                                               &n->vqs[index]);
2645f9d6dbf0SWen Congyang     } else {
2646f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
26479b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
26489b02e161SWei Wang                              virtio_net_handle_tx_bh);
2649f9d6dbf0SWen Congyang         n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]);
2650f9d6dbf0SWen Congyang     }
2651f9d6dbf0SWen Congyang 
2652f9d6dbf0SWen Congyang     n->vqs[index].tx_waiting = 0;
2653f9d6dbf0SWen Congyang     n->vqs[index].n = n;
2654f9d6dbf0SWen Congyang }
2655f9d6dbf0SWen Congyang 
2656f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index)
2657f9d6dbf0SWen Congyang {
2658f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2659f9d6dbf0SWen Congyang     VirtIONetQueue *q = &n->vqs[index];
2660f9d6dbf0SWen Congyang     NetClientState *nc = qemu_get_subqueue(n->nic, index);
2661f9d6dbf0SWen Congyang 
2662f9d6dbf0SWen Congyang     qemu_purge_queued_packets(nc);
2663f9d6dbf0SWen Congyang 
2664f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2);
2665f9d6dbf0SWen Congyang     if (q->tx_timer) {
2666f9d6dbf0SWen Congyang         timer_del(q->tx_timer);
2667f9d6dbf0SWen Congyang         timer_free(q->tx_timer);
2668f989c30cSYunjian Wang         q->tx_timer = NULL;
2669f9d6dbf0SWen Congyang     } else {
2670f9d6dbf0SWen Congyang         qemu_bh_delete(q->tx_bh);
2671f989c30cSYunjian Wang         q->tx_bh = NULL;
2672f9d6dbf0SWen Congyang     }
2673f989c30cSYunjian Wang     q->tx_waiting = 0;
2674f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2 + 1);
2675f9d6dbf0SWen Congyang }
2676f9d6dbf0SWen Congyang 
2677f9d6dbf0SWen Congyang static void virtio_net_change_num_queues(VirtIONet *n, int new_max_queues)
2678f9d6dbf0SWen Congyang {
2679f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2680f9d6dbf0SWen Congyang     int old_num_queues = virtio_get_num_queues(vdev);
2681f9d6dbf0SWen Congyang     int new_num_queues = new_max_queues * 2 + 1;
2682f9d6dbf0SWen Congyang     int i;
2683f9d6dbf0SWen Congyang 
2684f9d6dbf0SWen Congyang     assert(old_num_queues >= 3);
2685f9d6dbf0SWen Congyang     assert(old_num_queues % 2 == 1);
2686f9d6dbf0SWen Congyang 
2687f9d6dbf0SWen Congyang     if (old_num_queues == new_num_queues) {
2688f9d6dbf0SWen Congyang         return;
2689f9d6dbf0SWen Congyang     }
2690f9d6dbf0SWen Congyang 
2691f9d6dbf0SWen Congyang     /*
2692f9d6dbf0SWen Congyang      * We always need to remove and add ctrl vq if
2693f9d6dbf0SWen Congyang      * old_num_queues != new_num_queues. Remove ctrl_vq first,
269420f86a75SYuval Shaia      * and then we only enter one of the following two loops.
2695f9d6dbf0SWen Congyang      */
2696f9d6dbf0SWen Congyang     virtio_del_queue(vdev, old_num_queues - 1);
2697f9d6dbf0SWen Congyang 
2698f9d6dbf0SWen Congyang     for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) {
2699f9d6dbf0SWen Congyang         /* new_num_queues < old_num_queues */
2700f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i / 2);
2701f9d6dbf0SWen Congyang     }
2702f9d6dbf0SWen Congyang 
2703f9d6dbf0SWen Congyang     for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) {
2704f9d6dbf0SWen Congyang         /* new_num_queues > old_num_queues */
2705f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i / 2);
2706f9d6dbf0SWen Congyang     }
2707f9d6dbf0SWen Congyang 
2708f9d6dbf0SWen Congyang     /* add ctrl_vq last */
2709f9d6dbf0SWen Congyang     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
2710f9d6dbf0SWen Congyang }
2711f9d6dbf0SWen Congyang 
2712ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
27136e790746SPaolo Bonzini {
2714f9d6dbf0SWen Congyang     int max = multiqueue ? n->max_queues : 1;
2715f9d6dbf0SWen Congyang 
27166e790746SPaolo Bonzini     n->multiqueue = multiqueue;
2717f9d6dbf0SWen Congyang     virtio_net_change_num_queues(n, max);
27186e790746SPaolo Bonzini 
27196e790746SPaolo Bonzini     virtio_net_set_queues(n);
27206e790746SPaolo Bonzini }
27216e790746SPaolo Bonzini 
2722982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id)
2723037dab2fSGreg Kurz {
2724982b78c5SDr. David Alan Gilbert     VirtIONet *n = opaque;
2725982b78c5SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2726037dab2fSGreg Kurz     int i, link_down;
2727037dab2fSGreg Kurz 
27289d8c6a25SDr. David Alan Gilbert     trace_virtio_net_post_load_device();
2729982b78c5SDr. David Alan Gilbert     virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs,
273095129d6fSCornelia Huck                                virtio_vdev_has_feature(vdev,
2731e22f0603SYuri Benditovich                                                        VIRTIO_F_VERSION_1),
2732e22f0603SYuri Benditovich                                virtio_vdev_has_feature(vdev,
2733e22f0603SYuri Benditovich                                                        VIRTIO_NET_F_HASH_REPORT));
27346e790746SPaolo Bonzini 
27356e790746SPaolo Bonzini     /* MAC_TABLE_ENTRIES may be different from the saved image */
2736982b78c5SDr. David Alan Gilbert     if (n->mac_table.in_use > MAC_TABLE_ENTRIES) {
27376e790746SPaolo Bonzini         n->mac_table.in_use = 0;
27386e790746SPaolo Bonzini     }
27396e790746SPaolo Bonzini 
2740982b78c5SDr. David Alan Gilbert     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
27416c666823SMichael S. Tsirkin         n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
27426c666823SMichael S. Tsirkin     }
27436c666823SMichael S. Tsirkin 
27447788c3f2SMikhail Sennikovsky     /*
27457788c3f2SMikhail Sennikovsky      * curr_guest_offloads will be later overwritten by the
27467788c3f2SMikhail Sennikovsky      * virtio_set_features_nocheck call done from the virtio_load.
27477788c3f2SMikhail Sennikovsky      * Here we make sure it is preserved and restored accordingly
27487788c3f2SMikhail Sennikovsky      * in the virtio_net_post_load_virtio callback.
27497788c3f2SMikhail Sennikovsky      */
27507788c3f2SMikhail Sennikovsky     n->saved_guest_offloads = n->curr_guest_offloads;
27516c666823SMichael S. Tsirkin 
27526e790746SPaolo Bonzini     virtio_net_set_queues(n);
27536e790746SPaolo Bonzini 
27546e790746SPaolo Bonzini     /* Find the first multicast entry in the saved MAC filter */
27556e790746SPaolo Bonzini     for (i = 0; i < n->mac_table.in_use; i++) {
27566e790746SPaolo Bonzini         if (n->mac_table.macs[i * ETH_ALEN] & 1) {
27576e790746SPaolo Bonzini             break;
27586e790746SPaolo Bonzini         }
27596e790746SPaolo Bonzini     }
27606e790746SPaolo Bonzini     n->mac_table.first_multi = i;
27616e790746SPaolo Bonzini 
27626e790746SPaolo Bonzini     /* nc.link_down can't be migrated, so infer link_down according
27636e790746SPaolo Bonzini      * to link status bit in n->status */
27646e790746SPaolo Bonzini     link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
27656e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
27666e790746SPaolo Bonzini         qemu_get_subqueue(n->nic, i)->link_down = link_down;
27676e790746SPaolo Bonzini     }
27686e790746SPaolo Bonzini 
27696c666823SMichael S. Tsirkin     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
27706c666823SMichael S. Tsirkin         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
27719d8c6a25SDr. David Alan Gilbert         qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
27729d8c6a25SDr. David Alan Gilbert                                   QEMU_CLOCK_VIRTUAL,
27739d8c6a25SDr. David Alan Gilbert                                   virtio_net_announce_timer, n);
27749d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
27759d8c6a25SDr. David Alan Gilbert             timer_mod(n->announce_timer.tm,
27769d8c6a25SDr. David Alan Gilbert                       qemu_clock_get_ms(n->announce_timer.type));
27779d8c6a25SDr. David Alan Gilbert         } else {
2778944458b6SDr. David Alan Gilbert             qemu_announce_timer_del(&n->announce_timer, false);
27799d8c6a25SDr. David Alan Gilbert         }
27806c666823SMichael S. Tsirkin     }
27816c666823SMichael S. Tsirkin 
2782e41b7114SYuri Benditovich     if (n->rss_data.enabled) {
2783e41b7114SYuri Benditovich         trace_virtio_net_rss_enable(n->rss_data.hash_types,
2784e41b7114SYuri Benditovich                                     n->rss_data.indirections_len,
2785e41b7114SYuri Benditovich                                     sizeof(n->rss_data.key));
2786e41b7114SYuri Benditovich     } else {
2787e41b7114SYuri Benditovich         trace_virtio_net_rss_disable();
2788e41b7114SYuri Benditovich     }
27896e790746SPaolo Bonzini     return 0;
27906e790746SPaolo Bonzini }
27916e790746SPaolo Bonzini 
27927788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev)
27937788c3f2SMikhail Sennikovsky {
27947788c3f2SMikhail Sennikovsky     VirtIONet *n = VIRTIO_NET(vdev);
27957788c3f2SMikhail Sennikovsky     /*
27967788c3f2SMikhail Sennikovsky      * The actual needed state is now in saved_guest_offloads,
27977788c3f2SMikhail Sennikovsky      * see virtio_net_post_load_device for detail.
27987788c3f2SMikhail Sennikovsky      * Restore it back and apply the desired offloads.
27997788c3f2SMikhail Sennikovsky      */
28007788c3f2SMikhail Sennikovsky     n->curr_guest_offloads = n->saved_guest_offloads;
28017788c3f2SMikhail Sennikovsky     if (peer_has_vnet_hdr(n)) {
28027788c3f2SMikhail Sennikovsky         virtio_net_apply_guest_offloads(n);
28037788c3f2SMikhail Sennikovsky     }
28047788c3f2SMikhail Sennikovsky 
28057788c3f2SMikhail Sennikovsky     return 0;
28067788c3f2SMikhail Sennikovsky }
28077788c3f2SMikhail Sennikovsky 
2808982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */
2809982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = {
2810982b78c5SDr. David Alan Gilbert     .name = "virtio-net-queue-tx_waiting",
2811982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
2812982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(tx_waiting, VirtIONetQueue),
2813982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2814982b78c5SDr. David Alan Gilbert    },
2815982b78c5SDr. David Alan Gilbert };
2816982b78c5SDr. David Alan Gilbert 
2817982b78c5SDr. David Alan Gilbert static bool max_queues_gt_1(void *opaque, int version_id)
2818982b78c5SDr. David Alan Gilbert {
2819982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->max_queues > 1;
2820982b78c5SDr. David Alan Gilbert }
2821982b78c5SDr. David Alan Gilbert 
2822982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id)
2823982b78c5SDr. David Alan Gilbert {
2824982b78c5SDr. David Alan Gilbert     return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque),
2825982b78c5SDr. David Alan Gilbert                                    VIRTIO_NET_F_CTRL_GUEST_OFFLOADS);
2826982b78c5SDr. David Alan Gilbert }
2827982b78c5SDr. David Alan Gilbert 
2828982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id)
2829982b78c5SDr. David Alan Gilbert {
2830982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES;
2831982b78c5SDr. David Alan Gilbert }
2832982b78c5SDr. David Alan Gilbert 
2833982b78c5SDr. David Alan Gilbert static bool mac_table_doesnt_fit(void *opaque, int version_id)
2834982b78c5SDr. David Alan Gilbert {
2835982b78c5SDr. David Alan Gilbert     return !mac_table_fits(opaque, version_id);
2836982b78c5SDr. David Alan Gilbert }
2837982b78c5SDr. David Alan Gilbert 
2838982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods
2839982b78c5SDr. David Alan Gilbert  * although only some fields are used by each.
2840982b78c5SDr. David Alan Gilbert  */
2841982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp {
2842982b78c5SDr. David Alan Gilbert     VirtIONet      *parent;
2843982b78c5SDr. David Alan Gilbert     VirtIONetQueue *vqs_1;
2844982b78c5SDr. David Alan Gilbert     uint16_t        curr_queues_1;
2845982b78c5SDr. David Alan Gilbert     uint8_t         has_ufo;
2846982b78c5SDr. David Alan Gilbert     uint32_t        has_vnet_hdr;
2847982b78c5SDr. David Alan Gilbert };
2848982b78c5SDr. David Alan Gilbert 
2849982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than
2850982b78c5SDr. David Alan Gilbert  * the 1st entry in the queues and only if there's more than one
2851982b78c5SDr. David Alan Gilbert  * entry.  We use the tmp mechanism to calculate a temporary
2852982b78c5SDr. David Alan Gilbert  * pointer and count and also validate the count.
2853982b78c5SDr. David Alan Gilbert  */
2854982b78c5SDr. David Alan Gilbert 
285544b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque)
2856982b78c5SDr. David Alan Gilbert {
2857982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2858982b78c5SDr. David Alan Gilbert 
2859982b78c5SDr. David Alan Gilbert     tmp->vqs_1 = tmp->parent->vqs + 1;
2860982b78c5SDr. David Alan Gilbert     tmp->curr_queues_1 = tmp->parent->curr_queues - 1;
2861982b78c5SDr. David Alan Gilbert     if (tmp->parent->curr_queues == 0) {
2862982b78c5SDr. David Alan Gilbert         tmp->curr_queues_1 = 0;
2863982b78c5SDr. David Alan Gilbert     }
286444b1ff31SDr. David Alan Gilbert 
286544b1ff31SDr. David Alan Gilbert     return 0;
2866982b78c5SDr. David Alan Gilbert }
2867982b78c5SDr. David Alan Gilbert 
2868982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque)
2869982b78c5SDr. David Alan Gilbert {
2870982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2871982b78c5SDr. David Alan Gilbert 
2872982b78c5SDr. David Alan Gilbert     /* Reuse the pointer setup from save */
2873982b78c5SDr. David Alan Gilbert     virtio_net_tx_waiting_pre_save(opaque);
2874982b78c5SDr. David Alan Gilbert 
2875982b78c5SDr. David Alan Gilbert     if (tmp->parent->curr_queues > tmp->parent->max_queues) {
2876982b78c5SDr. David Alan Gilbert         error_report("virtio-net: curr_queues %x > max_queues %x",
2877982b78c5SDr. David Alan Gilbert             tmp->parent->curr_queues, tmp->parent->max_queues);
2878982b78c5SDr. David Alan Gilbert 
2879982b78c5SDr. David Alan Gilbert         return -EINVAL;
2880982b78c5SDr. David Alan Gilbert     }
2881982b78c5SDr. David Alan Gilbert 
2882982b78c5SDr. David Alan Gilbert     return 0; /* all good */
2883982b78c5SDr. David Alan Gilbert }
2884982b78c5SDr. David Alan Gilbert 
2885982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = {
2886982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-tx_waiting",
2887982b78c5SDr. David Alan Gilbert     .pre_load  = virtio_net_tx_waiting_pre_load,
2888982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_tx_waiting_pre_save,
2889982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2890982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp,
2891982b78c5SDr. David Alan Gilbert                                      curr_queues_1,
2892982b78c5SDr. David Alan Gilbert                                      vmstate_virtio_net_queue_tx_waiting,
2893982b78c5SDr. David Alan Gilbert                                      struct VirtIONetQueue),
2894982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2895982b78c5SDr. David Alan Gilbert     },
2896982b78c5SDr. David Alan Gilbert };
2897982b78c5SDr. David Alan Gilbert 
2898982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the
2899982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
2900982b78c5SDr. David Alan Gilbert  */
2901982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id)
2902982b78c5SDr. David Alan Gilbert {
2903982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2904982b78c5SDr. David Alan Gilbert 
2905982b78c5SDr. David Alan Gilbert     if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) {
2906982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires TUN_F_UFO support");
2907982b78c5SDr. David Alan Gilbert         return -EINVAL;
2908982b78c5SDr. David Alan Gilbert     }
2909982b78c5SDr. David Alan Gilbert 
2910982b78c5SDr. David Alan Gilbert     return 0;
2911982b78c5SDr. David Alan Gilbert }
2912982b78c5SDr. David Alan Gilbert 
291344b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque)
2914982b78c5SDr. David Alan Gilbert {
2915982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2916982b78c5SDr. David Alan Gilbert 
2917982b78c5SDr. David Alan Gilbert     tmp->has_ufo = tmp->parent->has_ufo;
291844b1ff31SDr. David Alan Gilbert 
291944b1ff31SDr. David Alan Gilbert     return 0;
2920982b78c5SDr. David Alan Gilbert }
2921982b78c5SDr. David Alan Gilbert 
2922982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = {
2923982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-ufo",
2924982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_ufo_post_load,
2925982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_ufo_pre_save,
2926982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2927982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp),
2928982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2929982b78c5SDr. David Alan Gilbert     },
2930982b78c5SDr. David Alan Gilbert };
2931982b78c5SDr. David Alan Gilbert 
2932982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the
2933982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
2934982b78c5SDr. David Alan Gilbert  */
2935982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id)
2936982b78c5SDr. David Alan Gilbert {
2937982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2938982b78c5SDr. David Alan Gilbert 
2939982b78c5SDr. David Alan Gilbert     if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) {
2940982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires vnet_hdr=on");
2941982b78c5SDr. David Alan Gilbert         return -EINVAL;
2942982b78c5SDr. David Alan Gilbert     }
2943982b78c5SDr. David Alan Gilbert 
2944982b78c5SDr. David Alan Gilbert     return 0;
2945982b78c5SDr. David Alan Gilbert }
2946982b78c5SDr. David Alan Gilbert 
294744b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque)
2948982b78c5SDr. David Alan Gilbert {
2949982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2950982b78c5SDr. David Alan Gilbert 
2951982b78c5SDr. David Alan Gilbert     tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr;
295244b1ff31SDr. David Alan Gilbert 
295344b1ff31SDr. David Alan Gilbert     return 0;
2954982b78c5SDr. David Alan Gilbert }
2955982b78c5SDr. David Alan Gilbert 
2956982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = {
2957982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-vnet",
2958982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_vnet_post_load,
2959982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_vnet_pre_save,
2960982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2961982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp),
2962982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2963982b78c5SDr. David Alan Gilbert     },
2964982b78c5SDr. David Alan Gilbert };
2965982b78c5SDr. David Alan Gilbert 
2966e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque)
2967e41b7114SYuri Benditovich {
2968e41b7114SYuri Benditovich     return VIRTIO_NET(opaque)->rss_data.enabled;
2969e41b7114SYuri Benditovich }
2970e41b7114SYuri Benditovich 
2971e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = {
2972e41b7114SYuri Benditovich     .name      = "virtio-net-device/rss",
2973e41b7114SYuri Benditovich     .version_id = 1,
2974e41b7114SYuri Benditovich     .minimum_version_id = 1,
2975e41b7114SYuri Benditovich     .needed = virtio_net_rss_needed,
2976e41b7114SYuri Benditovich     .fields = (VMStateField[]) {
2977e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.enabled, VirtIONet),
2978e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.redirect, VirtIONet),
2979e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.populate_hash, VirtIONet),
2980e41b7114SYuri Benditovich         VMSTATE_UINT32(rss_data.hash_types, VirtIONet),
2981e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.indirections_len, VirtIONet),
2982e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.default_queue, VirtIONet),
2983e41b7114SYuri Benditovich         VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet,
2984e41b7114SYuri Benditovich                             VIRTIO_NET_RSS_MAX_KEY_SIZE),
2985e41b7114SYuri Benditovich         VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet,
2986e41b7114SYuri Benditovich                                     rss_data.indirections_len, 0,
2987e41b7114SYuri Benditovich                                     vmstate_info_uint16, uint16_t),
2988e41b7114SYuri Benditovich         VMSTATE_END_OF_LIST()
2989e41b7114SYuri Benditovich     },
2990e41b7114SYuri Benditovich };
2991e41b7114SYuri Benditovich 
2992982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = {
2993982b78c5SDr. David Alan Gilbert     .name = "virtio-net-device",
2994982b78c5SDr. David Alan Gilbert     .version_id = VIRTIO_NET_VM_VERSION,
2995982b78c5SDr. David Alan Gilbert     .minimum_version_id = VIRTIO_NET_VM_VERSION,
2996982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_post_load_device,
2997982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
2998982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN),
2999982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_POINTER(vqs, VirtIONet,
3000982b78c5SDr. David Alan Gilbert                                vmstate_virtio_net_queue_tx_waiting,
3001982b78c5SDr. David Alan Gilbert                                VirtIONetQueue),
3002982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet),
3003982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16(status, VirtIONet),
3004982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(promisc, VirtIONet),
3005982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(allmulti, VirtIONet),
3006982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mac_table.in_use, VirtIONet),
3007982b78c5SDr. David Alan Gilbert 
3008982b78c5SDr. David Alan Gilbert         /* Guarded pair: If it fits we load it, else we throw it away
3009982b78c5SDr. David Alan Gilbert          * - can happen if source has a larger MAC table.; post-load
3010982b78c5SDr. David Alan Gilbert          *  sets flags in this case.
3011982b78c5SDr. David Alan Gilbert          */
3012982b78c5SDr. David Alan Gilbert         VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet,
3013982b78c5SDr. David Alan Gilbert                                 0, mac_table_fits, mac_table.in_use,
3014982b78c5SDr. David Alan Gilbert                                  ETH_ALEN),
3015982b78c5SDr. David Alan Gilbert         VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0,
3016982b78c5SDr. David Alan Gilbert                                      mac_table.in_use, ETH_ALEN),
3017982b78c5SDr. David Alan Gilbert 
3018982b78c5SDr. David Alan Gilbert         /* Note: This is an array of uint32's that's always been saved as a
3019982b78c5SDr. David Alan Gilbert          * buffer; hold onto your endiannesses; it's actually used as a bitmap
3020982b78c5SDr. David Alan Gilbert          * but based on the uint.
3021982b78c5SDr. David Alan Gilbert          */
3022982b78c5SDr. David Alan Gilbert         VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3),
3023982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3024982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_vnet),
3025982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet),
3026982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet),
3027982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(alluni, VirtIONet),
3028982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nomulti, VirtIONet),
3029982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nouni, VirtIONet),
3030982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nobcast, VirtIONet),
3031982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3032982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_ufo),
3033982b78c5SDr. David Alan Gilbert         VMSTATE_SINGLE_TEST(max_queues, VirtIONet, max_queues_gt_1, 0,
3034982b78c5SDr. David Alan Gilbert                             vmstate_info_uint16_equal, uint16_t),
3035982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16_TEST(curr_queues, VirtIONet, max_queues_gt_1),
3036982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3037982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_tx_waiting),
3038982b78c5SDr. David Alan Gilbert         VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet,
3039982b78c5SDr. David Alan Gilbert                             has_ctrl_guest_offloads),
3040982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3041982b78c5SDr. David Alan Gilbert    },
3042e41b7114SYuri Benditovich     .subsections = (const VMStateDescription * []) {
3043e41b7114SYuri Benditovich         &vmstate_virtio_net_rss,
3044e41b7114SYuri Benditovich         NULL
3045e41b7114SYuri Benditovich     }
3046982b78c5SDr. David Alan Gilbert };
3047982b78c5SDr. David Alan Gilbert 
30486e790746SPaolo Bonzini static NetClientInfo net_virtio_info = {
3049f394b2e2SEric Blake     .type = NET_CLIENT_DRIVER_NIC,
30506e790746SPaolo Bonzini     .size = sizeof(NICState),
30516e790746SPaolo Bonzini     .can_receive = virtio_net_can_receive,
30526e790746SPaolo Bonzini     .receive = virtio_net_receive,
30536e790746SPaolo Bonzini     .link_status_changed = virtio_net_set_link_status,
3054b1be4280SAmos Kong     .query_rx_filter = virtio_net_query_rxfilter,
3055b2c929f0SDr. David Alan Gilbert     .announce = virtio_net_announce,
30566e790746SPaolo Bonzini };
30576e790746SPaolo Bonzini 
30586e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
30596e790746SPaolo Bonzini {
306017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
30616e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
30626e790746SPaolo Bonzini     assert(n->vhost_started);
3063ed8b4afeSNikolay Nikolaev     return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx);
30646e790746SPaolo Bonzini }
30656e790746SPaolo Bonzini 
30666e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
30676e790746SPaolo Bonzini                                            bool mask)
30686e790746SPaolo Bonzini {
306917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
30706e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
30716e790746SPaolo Bonzini     assert(n->vhost_started);
3072ed8b4afeSNikolay Nikolaev     vhost_net_virtqueue_mask(get_vhost_net(nc->peer),
30736e790746SPaolo Bonzini                              vdev, idx, mask);
30746e790746SPaolo Bonzini }
30756e790746SPaolo Bonzini 
3076019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features)
30776e790746SPaolo Bonzini {
30780cd09c3aSCornelia Huck     virtio_add_feature(&host_features, VIRTIO_NET_F_MAC);
3079a93e599dSMaxime Coquelin 
3080ba550851SStefano Garzarella     n->config_size = virtio_feature_get_config_size(feature_sizes,
3081ba550851SStefano Garzarella                                                     host_features);
308217ec5a86SKONRAD Frederic }
30836e790746SPaolo Bonzini 
30848a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
30858a253ec2SKONRAD Frederic                                    const char *type)
30868a253ec2SKONRAD Frederic {
30878a253ec2SKONRAD Frederic     /*
30888a253ec2SKONRAD Frederic      * The name can be NULL, the netclient name will be type.x.
30898a253ec2SKONRAD Frederic      */
30908a253ec2SKONRAD Frederic     assert(type != NULL);
30918a253ec2SKONRAD Frederic 
30928a253ec2SKONRAD Frederic     g_free(n->netclient_name);
30938a253ec2SKONRAD Frederic     g_free(n->netclient_type);
30948a253ec2SKONRAD Frederic     n->netclient_name = g_strdup(name);
30958a253ec2SKONRAD Frederic     n->netclient_type = g_strdup(type);
30968a253ec2SKONRAD Frederic }
30978a253ec2SKONRAD Frederic 
30989711cd0dSJens Freimann static bool failover_unplug_primary(VirtIONet *n)
30999711cd0dSJens Freimann {
31009711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
31019711cd0dSJens Freimann     PCIDevice *pci_dev;
31029711cd0dSJens Freimann     Error *err = NULL;
31039711cd0dSJens Freimann 
31049711cd0dSJens Freimann     hotplug_ctrl = qdev_get_hotplug_handler(n->primary_dev);
31059711cd0dSJens Freimann     if (hotplug_ctrl) {
31069711cd0dSJens Freimann         pci_dev = PCI_DEVICE(n->primary_dev);
31079711cd0dSJens Freimann         pci_dev->partially_hotplugged = true;
31089711cd0dSJens Freimann         hotplug_handler_unplug_request(hotplug_ctrl, n->primary_dev, &err);
31099711cd0dSJens Freimann         if (err) {
31109711cd0dSJens Freimann             error_report_err(err);
31119711cd0dSJens Freimann             return false;
31129711cd0dSJens Freimann         }
31139711cd0dSJens Freimann     } else {
31149711cd0dSJens Freimann         return false;
31159711cd0dSJens Freimann     }
31169711cd0dSJens Freimann     return true;
31179711cd0dSJens Freimann }
31189711cd0dSJens Freimann 
31199711cd0dSJens Freimann static bool failover_replug_primary(VirtIONet *n, Error **errp)
31209711cd0dSJens Freimann {
31215a0948d3SMarkus Armbruster     Error *err = NULL;
31229711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
31239711cd0dSJens Freimann     PCIDevice *pdev = PCI_DEVICE(n->primary_dev);
31249711cd0dSJens Freimann 
31259711cd0dSJens Freimann     if (!pdev->partially_hotplugged) {
31269711cd0dSJens Freimann         return true;
31279711cd0dSJens Freimann     }
31289711cd0dSJens Freimann     if (!n->primary_device_opts) {
31299711cd0dSJens Freimann         n->primary_device_opts = qemu_opts_from_qdict(
31309711cd0dSJens Freimann                 qemu_find_opts("device"),
31319711cd0dSJens Freimann                 n->primary_device_dict, errp);
3132150ab54aSJens Freimann         if (!n->primary_device_opts) {
31335a0948d3SMarkus Armbruster             return false;
31349711cd0dSJens Freimann         }
3135150ab54aSJens Freimann     }
31369711cd0dSJens Freimann     n->primary_bus = n->primary_dev->parent_bus;
3137150ab54aSJens Freimann     if (!n->primary_bus) {
3138150ab54aSJens Freimann         error_setg(errp, "virtio_net: couldn't find primary bus");
31395a0948d3SMarkus Armbruster         return false;
31409711cd0dSJens Freimann     }
3141bb755ba4SPaolo Bonzini     qdev_set_parent_bus(n->primary_dev, n->primary_bus, &error_abort);
31429711cd0dSJens Freimann     n->primary_should_be_hidden = false;
3143235e59cfSMarkus Armbruster     if (!qemu_opt_set_bool(n->primary_device_opts,
3144a5f9b9dfSMarkus Armbruster                            "partially_hotplugged", true, errp)) {
3145a5f9b9dfSMarkus Armbruster         return false;
31465a0948d3SMarkus Armbruster     }
31479711cd0dSJens Freimann     hotplug_ctrl = qdev_get_hotplug_handler(n->primary_dev);
31489711cd0dSJens Freimann     if (hotplug_ctrl) {
31495a0948d3SMarkus Armbruster         hotplug_handler_pre_plug(hotplug_ctrl, n->primary_dev, &err);
31505a0948d3SMarkus Armbruster         if (err) {
31515a0948d3SMarkus Armbruster             goto out;
31525a0948d3SMarkus Armbruster         }
3153ca72efccSMarkus Armbruster         hotplug_handler_plug(hotplug_ctrl, n->primary_dev, &err);
31549711cd0dSJens Freimann     }
3155150ab54aSJens Freimann 
3156150ab54aSJens Freimann out:
31575a0948d3SMarkus Armbruster     error_propagate(errp, err);
31585a0948d3SMarkus Armbruster     return !err;
31599711cd0dSJens Freimann }
31609711cd0dSJens Freimann 
31619711cd0dSJens Freimann static void virtio_net_handle_migration_primary(VirtIONet *n,
31629711cd0dSJens Freimann                                                 MigrationState *s)
31639711cd0dSJens Freimann {
31649711cd0dSJens Freimann     bool should_be_hidden;
31659711cd0dSJens Freimann     Error *err = NULL;
31669711cd0dSJens Freimann 
3167d73415a3SStefan Hajnoczi     should_be_hidden = qatomic_read(&n->primary_should_be_hidden);
31689711cd0dSJens Freimann 
31699711cd0dSJens Freimann     if (!n->primary_dev) {
31709711cd0dSJens Freimann         n->primary_dev = virtio_connect_failover_devices(n, n->qdev, &err);
31719711cd0dSJens Freimann         if (!n->primary_dev) {
31729711cd0dSJens Freimann             return;
31739711cd0dSJens Freimann         }
31749711cd0dSJens Freimann     }
31759711cd0dSJens Freimann 
31764dbac1aeSMarkus Armbruster     if (migration_in_setup(s) && !should_be_hidden) {
31779711cd0dSJens Freimann         if (failover_unplug_primary(n)) {
31783cad405bSMarc-André Lureau             vmstate_unregister(VMSTATE_IF(n->primary_dev),
31793cad405bSMarc-André Lureau                     qdev_get_vmsd(n->primary_dev),
31809711cd0dSJens Freimann                     n->primary_dev);
31819711cd0dSJens Freimann             qapi_event_send_unplug_primary(n->primary_device_id);
3182d73415a3SStefan Hajnoczi             qatomic_set(&n->primary_should_be_hidden, true);
31839711cd0dSJens Freimann         } else {
31849711cd0dSJens Freimann             warn_report("couldn't unplug primary device");
31859711cd0dSJens Freimann         }
31869711cd0dSJens Freimann     } else if (migration_has_failed(s)) {
3187150ab54aSJens Freimann         /* We already unplugged the device let's plug it back */
31889711cd0dSJens Freimann         if (!failover_replug_primary(n, &err)) {
31899711cd0dSJens Freimann             if (err) {
31909711cd0dSJens Freimann                 error_report_err(err);
31919711cd0dSJens Freimann             }
31929711cd0dSJens Freimann         }
31939711cd0dSJens Freimann     }
31949711cd0dSJens Freimann }
31959711cd0dSJens Freimann 
31969711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data)
31979711cd0dSJens Freimann {
31989711cd0dSJens Freimann     MigrationState *s = data;
31999711cd0dSJens Freimann     VirtIONet *n = container_of(notifier, VirtIONet, migration_state);
32009711cd0dSJens Freimann     virtio_net_handle_migration_primary(n, s);
32019711cd0dSJens Freimann }
32029711cd0dSJens Freimann 
32039711cd0dSJens Freimann static int virtio_net_primary_should_be_hidden(DeviceListener *listener,
32049711cd0dSJens Freimann             QemuOpts *device_opts)
32059711cd0dSJens Freimann {
32069711cd0dSJens Freimann     VirtIONet *n = container_of(listener, VirtIONet, primary_listener);
32074d0e59acSJens Freimann     bool match_found = false;
32084d0e59acSJens Freimann     bool hide = false;
32099711cd0dSJens Freimann 
32104d0e59acSJens Freimann     if (!device_opts) {
32114d0e59acSJens Freimann         return -1;
32124d0e59acSJens Freimann     }
32139711cd0dSJens Freimann     n->primary_device_dict = qemu_opts_to_qdict(device_opts,
32149711cd0dSJens Freimann             n->primary_device_dict);
32159711cd0dSJens Freimann     if (n->primary_device_dict) {
32169711cd0dSJens Freimann         g_free(n->standby_id);
32179711cd0dSJens Freimann         n->standby_id = g_strdup(qdict_get_try_str(n->primary_device_dict,
32189711cd0dSJens Freimann                     "failover_pair_id"));
32199711cd0dSJens Freimann     }
32204d0e59acSJens Freimann     if (g_strcmp0(n->standby_id, n->netclient_name) == 0) {
32219711cd0dSJens Freimann         match_found = true;
32229711cd0dSJens Freimann     } else {
32239711cd0dSJens Freimann         match_found = false;
32249711cd0dSJens Freimann         hide = false;
32259711cd0dSJens Freimann         g_free(n->standby_id);
32269711cd0dSJens Freimann         n->primary_device_dict = NULL;
32279711cd0dSJens Freimann         goto out;
32289711cd0dSJens Freimann     }
32299711cd0dSJens Freimann 
32309711cd0dSJens Freimann     n->primary_device_opts = device_opts;
32319711cd0dSJens Freimann 
32329711cd0dSJens Freimann     /* primary_should_be_hidden is set during feature negotiation */
3233d73415a3SStefan Hajnoczi     hide = qatomic_read(&n->primary_should_be_hidden);
32349711cd0dSJens Freimann 
32359711cd0dSJens Freimann     if (n->primary_device_dict) {
32369711cd0dSJens Freimann         g_free(n->primary_device_id);
32379711cd0dSJens Freimann         n->primary_device_id = g_strdup(qdict_get_try_str(
32389711cd0dSJens Freimann                     n->primary_device_dict, "id"));
32399711cd0dSJens Freimann         if (!n->primary_device_id) {
32409711cd0dSJens Freimann             warn_report("primary_device_id not set");
32419711cd0dSJens Freimann         }
32429711cd0dSJens Freimann     }
32439711cd0dSJens Freimann 
32449711cd0dSJens Freimann out:
32459711cd0dSJens Freimann     if (match_found && hide) {
32469711cd0dSJens Freimann         return 1;
32479711cd0dSJens Freimann     } else if (match_found && !hide) {
32489711cd0dSJens Freimann         return 0;
32499711cd0dSJens Freimann     } else {
32509711cd0dSJens Freimann         return -1;
32519711cd0dSJens Freimann     }
32529711cd0dSJens Freimann }
32539711cd0dSJens Freimann 
3254e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp)
325517ec5a86SKONRAD Frederic {
3256e6f746b3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3257284a32f0SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3258284a32f0SAndreas Färber     NetClientState *nc;
32591773d9eeSKONRAD Frederic     int i;
326017ec5a86SKONRAD Frederic 
3261a93e599dSMaxime Coquelin     if (n->net_conf.mtu) {
3262127833eeSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_MTU);
3263a93e599dSMaxime Coquelin     }
3264a93e599dSMaxime Coquelin 
32659473939eSJason Baron     if (n->net_conf.duplex_str) {
32669473939eSJason Baron         if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) {
32679473939eSJason Baron             n->net_conf.duplex = DUPLEX_HALF;
32689473939eSJason Baron         } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) {
32699473939eSJason Baron             n->net_conf.duplex = DUPLEX_FULL;
32709473939eSJason Baron         } else {
32719473939eSJason Baron             error_setg(errp, "'duplex' must be 'half' or 'full'");
3272843c4cfcSMarkus Armbruster             return;
32739473939eSJason Baron         }
32749473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
32759473939eSJason Baron     } else {
32769473939eSJason Baron         n->net_conf.duplex = DUPLEX_UNKNOWN;
32779473939eSJason Baron     }
32789473939eSJason Baron 
32799473939eSJason Baron     if (n->net_conf.speed < SPEED_UNKNOWN) {
32809473939eSJason Baron         error_setg(errp, "'speed' must be between 0 and INT_MAX");
3281843c4cfcSMarkus Armbruster         return;
3282843c4cfcSMarkus Armbruster     }
3283843c4cfcSMarkus Armbruster     if (n->net_conf.speed >= 0) {
32849473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
32859473939eSJason Baron     }
32869473939eSJason Baron 
32879711cd0dSJens Freimann     if (n->failover) {
32889711cd0dSJens Freimann         n->primary_listener.should_be_hidden =
32899711cd0dSJens Freimann             virtio_net_primary_should_be_hidden;
3290d73415a3SStefan Hajnoczi         qatomic_set(&n->primary_should_be_hidden, true);
32919711cd0dSJens Freimann         device_listener_register(&n->primary_listener);
32929711cd0dSJens Freimann         n->migration_state.notify = virtio_net_migration_state_notifier;
32939711cd0dSJens Freimann         add_migration_state_change_notifier(&n->migration_state);
32949711cd0dSJens Freimann         n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY);
32959711cd0dSJens Freimann     }
32969711cd0dSJens Freimann 
3297da3e8a23SShannon Zhao     virtio_net_set_config_size(n, n->host_features);
3298284a32f0SAndreas Färber     virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size);
329917ec5a86SKONRAD Frederic 
33001c0fbfa3SMichael S. Tsirkin     /*
33011c0fbfa3SMichael S. Tsirkin      * We set a lower limit on RX queue size to what it always was.
33021c0fbfa3SMichael S. Tsirkin      * Guests that want a smaller ring can always resize it without
33031c0fbfa3SMichael S. Tsirkin      * help from us (using virtio 1 and up).
33041c0fbfa3SMichael S. Tsirkin      */
33051c0fbfa3SMichael S. Tsirkin     if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE ||
33061c0fbfa3SMichael S. Tsirkin         n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE ||
33075f997fd1SMichal Privoznik         !is_power_of_2(n->net_conf.rx_queue_size)) {
33081c0fbfa3SMichael S. Tsirkin         error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), "
33091c0fbfa3SMichael S. Tsirkin                    "must be a power of 2 between %d and %d.",
33101c0fbfa3SMichael S. Tsirkin                    n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE,
33111c0fbfa3SMichael S. Tsirkin                    VIRTQUEUE_MAX_SIZE);
33121c0fbfa3SMichael S. Tsirkin         virtio_cleanup(vdev);
33131c0fbfa3SMichael S. Tsirkin         return;
33141c0fbfa3SMichael S. Tsirkin     }
33151c0fbfa3SMichael S. Tsirkin 
33169b02e161SWei Wang     if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE ||
33179b02e161SWei Wang         n->net_conf.tx_queue_size > VIRTQUEUE_MAX_SIZE ||
33189b02e161SWei Wang         !is_power_of_2(n->net_conf.tx_queue_size)) {
33199b02e161SWei Wang         error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), "
33209b02e161SWei Wang                    "must be a power of 2 between %d and %d",
33219b02e161SWei Wang                    n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE,
33229b02e161SWei Wang                    VIRTQUEUE_MAX_SIZE);
33239b02e161SWei Wang         virtio_cleanup(vdev);
33249b02e161SWei Wang         return;
33259b02e161SWei Wang     }
33269b02e161SWei Wang 
3327575a1c0eSJiri Pirko     n->max_queues = MAX(n->nic_conf.peers.queues, 1);
332887b3bd1cSJason Wang     if (n->max_queues * 2 + 1 > VIRTIO_QUEUE_MAX) {
33297e0e736eSJason Wang         error_setg(errp, "Invalid number of queues (= %" PRIu32 "), "
3330631b22eaSStefan Weil                    "must be a positive integer less than %d.",
333187b3bd1cSJason Wang                    n->max_queues, (VIRTIO_QUEUE_MAX - 1) / 2);
33327e0e736eSJason Wang         virtio_cleanup(vdev);
33337e0e736eSJason Wang         return;
33347e0e736eSJason Wang     }
33356e790746SPaolo Bonzini     n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queues);
33366e790746SPaolo Bonzini     n->curr_queues = 1;
33371773d9eeSKONRAD Frederic     n->tx_timeout = n->net_conf.txtimer;
33386e790746SPaolo Bonzini 
33391773d9eeSKONRAD Frederic     if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
33401773d9eeSKONRAD Frederic                        && strcmp(n->net_conf.tx, "bh")) {
33410765691eSMarkus Armbruster         warn_report("virtio-net: "
33426e790746SPaolo Bonzini                     "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
33431773d9eeSKONRAD Frederic                     n->net_conf.tx);
33440765691eSMarkus Armbruster         error_printf("Defaulting to \"bh\"");
33456e790746SPaolo Bonzini     }
33466e790746SPaolo Bonzini 
33472eef278bSMichael S. Tsirkin     n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n),
33482eef278bSMichael S. Tsirkin                                     n->net_conf.tx_queue_size);
33499b02e161SWei Wang 
3350da51a335SJason Wang     for (i = 0; i < n->max_queues; i++) {
3351f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i);
3352da51a335SJason Wang     }
3353da51a335SJason Wang 
335417a0ca55SKONRAD Frederic     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
33551773d9eeSKONRAD Frederic     qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
33561773d9eeSKONRAD Frederic     memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
33576e790746SPaolo Bonzini     n->status = VIRTIO_NET_S_LINK_UP;
33589d8c6a25SDr. David Alan Gilbert     qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
33599d8c6a25SDr. David Alan Gilbert                               QEMU_CLOCK_VIRTUAL,
3360f57fcf70SJason Wang                               virtio_net_announce_timer, n);
3361b2c929f0SDr. David Alan Gilbert     n->announce_timer.round = 0;
33626e790746SPaolo Bonzini 
33638a253ec2SKONRAD Frederic     if (n->netclient_type) {
33648a253ec2SKONRAD Frederic         /*
33658a253ec2SKONRAD Frederic          * Happen when virtio_net_set_netclient_name has been called.
33668a253ec2SKONRAD Frederic          */
33678a253ec2SKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
33688a253ec2SKONRAD Frederic                               n->netclient_type, n->netclient_name, n);
33698a253ec2SKONRAD Frederic     } else {
33701773d9eeSKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
3371284a32f0SAndreas Färber                               object_get_typename(OBJECT(dev)), dev->id, n);
33728a253ec2SKONRAD Frederic     }
33738a253ec2SKONRAD Frederic 
33746e790746SPaolo Bonzini     peer_test_vnet_hdr(n);
33756e790746SPaolo Bonzini     if (peer_has_vnet_hdr(n)) {
33766e790746SPaolo Bonzini         for (i = 0; i < n->max_queues; i++) {
3377d6085e3aSStefan Hajnoczi             qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
33786e790746SPaolo Bonzini         }
33796e790746SPaolo Bonzini         n->host_hdr_len = sizeof(struct virtio_net_hdr);
33806e790746SPaolo Bonzini     } else {
33816e790746SPaolo Bonzini         n->host_hdr_len = 0;
33826e790746SPaolo Bonzini     }
33836e790746SPaolo Bonzini 
33841773d9eeSKONRAD Frederic     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
33856e790746SPaolo Bonzini 
33866e790746SPaolo Bonzini     n->vqs[0].tx_waiting = 0;
33871773d9eeSKONRAD Frederic     n->tx_burst = n->net_conf.txburst;
3388e22f0603SYuri Benditovich     virtio_net_set_mrg_rx_bufs(n, 0, 0, 0);
33896e790746SPaolo Bonzini     n->promisc = 1; /* for compatibility */
33906e790746SPaolo Bonzini 
33916e790746SPaolo Bonzini     n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
33926e790746SPaolo Bonzini 
33936e790746SPaolo Bonzini     n->vlans = g_malloc0(MAX_VLAN >> 3);
33946e790746SPaolo Bonzini 
3395b1be4280SAmos Kong     nc = qemu_get_queue(n->nic);
3396b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
3397b1be4280SAmos Kong 
3398*e87936eaSCindy Lu    if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
3399*e87936eaSCindy Lu         struct virtio_net_config netcfg = {};
3400*e87936eaSCindy Lu         memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN);
3401*e87936eaSCindy Lu         vhost_net_set_config(get_vhost_net(nc->peer),
3402*e87936eaSCindy Lu             (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_MASTER);
3403*e87936eaSCindy Lu     }
34042974e916SYuri Benditovich     QTAILQ_INIT(&n->rsc_chains);
3405284a32f0SAndreas Färber     n->qdev = dev;
34064474e37aSYuri Benditovich 
34074474e37aSYuri Benditovich     net_rx_pkt_init(&n->rx_pkt, false);
340817ec5a86SKONRAD Frederic }
340917ec5a86SKONRAD Frederic 
3410b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev)
341117ec5a86SKONRAD Frederic {
3412306ec6c3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3413306ec6c3SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3414f9d6dbf0SWen Congyang     int i, max_queues;
341517ec5a86SKONRAD Frederic 
341617ec5a86SKONRAD Frederic     /* This will stop vhost backend if appropriate. */
341717ec5a86SKONRAD Frederic     virtio_net_set_status(vdev, 0);
341817ec5a86SKONRAD Frederic 
34198a253ec2SKONRAD Frederic     g_free(n->netclient_name);
34208a253ec2SKONRAD Frederic     n->netclient_name = NULL;
34218a253ec2SKONRAD Frederic     g_free(n->netclient_type);
34228a253ec2SKONRAD Frederic     n->netclient_type = NULL;
34238a253ec2SKONRAD Frederic 
342417ec5a86SKONRAD Frederic     g_free(n->mac_table.macs);
342517ec5a86SKONRAD Frederic     g_free(n->vlans);
342617ec5a86SKONRAD Frederic 
34279711cd0dSJens Freimann     if (n->failover) {
342865018100SJuan Quintela         device_listener_unregister(&n->primary_listener);
34299711cd0dSJens Freimann         g_free(n->primary_device_id);
34309711cd0dSJens Freimann         g_free(n->standby_id);
34319711cd0dSJens Freimann         qobject_unref(n->primary_device_dict);
34329711cd0dSJens Freimann         n->primary_device_dict = NULL;
34339711cd0dSJens Freimann     }
34349711cd0dSJens Freimann 
3435f9d6dbf0SWen Congyang     max_queues = n->multiqueue ? n->max_queues : 1;
3436f9d6dbf0SWen Congyang     for (i = 0; i < max_queues; i++) {
3437f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i);
343817ec5a86SKONRAD Frederic     }
3439d945d9f1SYuri Benditovich     /* delete also control vq */
3440d945d9f1SYuri Benditovich     virtio_del_queue(vdev, max_queues * 2);
3441944458b6SDr. David Alan Gilbert     qemu_announce_timer_del(&n->announce_timer, false);
344217ec5a86SKONRAD Frederic     g_free(n->vqs);
344317ec5a86SKONRAD Frederic     qemu_del_nic(n->nic);
34442974e916SYuri Benditovich     virtio_net_rsc_cleanup(n);
344559079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
34464474e37aSYuri Benditovich     net_rx_pkt_uninit(n->rx_pkt);
34476a1a8cc7SKONRAD Frederic     virtio_cleanup(vdev);
344817ec5a86SKONRAD Frederic }
344917ec5a86SKONRAD Frederic 
345017ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj)
345117ec5a86SKONRAD Frederic {
345217ec5a86SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(obj);
345317ec5a86SKONRAD Frederic 
345417ec5a86SKONRAD Frederic     /*
345517ec5a86SKONRAD Frederic      * The default config_size is sizeof(struct virtio_net_config).
345617ec5a86SKONRAD Frederic      * Can be overriden with virtio_net_set_config_size.
345717ec5a86SKONRAD Frederic      */
345817ec5a86SKONRAD Frederic     n->config_size = sizeof(struct virtio_net_config);
3459aa4197c3SGonglei     device_add_bootindex_property(obj, &n->nic_conf.bootindex,
3460aa4197c3SGonglei                                   "bootindex", "/ethernet-phy@0",
346140c2281cSMarkus Armbruster                                   DEVICE(n));
346217ec5a86SKONRAD Frederic }
346317ec5a86SKONRAD Frederic 
346444b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque)
34654d45dcfbSHalil Pasic {
34664d45dcfbSHalil Pasic     VirtIONet *n = opaque;
34674d45dcfbSHalil Pasic 
34684d45dcfbSHalil Pasic     /* At this point, backend must be stopped, otherwise
34694d45dcfbSHalil Pasic      * it might keep writing to memory. */
34704d45dcfbSHalil Pasic     assert(!n->vhost_started);
347144b1ff31SDr. David Alan Gilbert 
347244b1ff31SDr. David Alan Gilbert     return 0;
34734d45dcfbSHalil Pasic }
34744d45dcfbSHalil Pasic 
34759711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque)
34769711cd0dSJens Freimann {
34779711cd0dSJens Freimann     DeviceState *dev = opaque;
34789711cd0dSJens Freimann     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
34799711cd0dSJens Freimann     VirtIONet *n = VIRTIO_NET(vdev);
34809711cd0dSJens Freimann 
3481284f42a5SJens Freimann     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) {
3482284f42a5SJens Freimann         return false;
3483284f42a5SJens Freimann     }
34849711cd0dSJens Freimann     return n->primary_dev ? n->primary_dev->pending_deleted_event : false;
34859711cd0dSJens Freimann }
34869711cd0dSJens Freimann 
34879711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque)
34889711cd0dSJens Freimann {
34899711cd0dSJens Freimann     DeviceState *dev = opaque;
34909711cd0dSJens Freimann     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
34919711cd0dSJens Freimann 
34929711cd0dSJens Freimann     return vdc->primary_unplug_pending(dev);
34939711cd0dSJens Freimann }
34949711cd0dSJens Freimann 
34954d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = {
34964d45dcfbSHalil Pasic     .name = "virtio-net",
34974d45dcfbSHalil Pasic     .minimum_version_id = VIRTIO_NET_VM_VERSION,
34984d45dcfbSHalil Pasic     .version_id = VIRTIO_NET_VM_VERSION,
34994d45dcfbSHalil Pasic     .fields = (VMStateField[]) {
35004d45dcfbSHalil Pasic         VMSTATE_VIRTIO_DEVICE,
35014d45dcfbSHalil Pasic         VMSTATE_END_OF_LIST()
35024d45dcfbSHalil Pasic     },
35034d45dcfbSHalil Pasic     .pre_save = virtio_net_pre_save,
35049711cd0dSJens Freimann     .dev_unplug_pending = dev_unplug_pending,
35054d45dcfbSHalil Pasic };
3506290c2428SDr. David Alan Gilbert 
350717ec5a86SKONRAD Frederic static Property virtio_net_properties[] = {
3508127833eeSJason Baron     DEFINE_PROP_BIT64("csum", VirtIONet, host_features,
3509127833eeSJason Baron                     VIRTIO_NET_F_CSUM, true),
3510127833eeSJason Baron     DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features,
351187108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_CSUM, true),
3512127833eeSJason Baron     DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true),
3513127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features,
351487108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO4, true),
3515127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features,
351687108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO6, true),
3517127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features,
351887108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ECN, true),
3519127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features,
352087108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_UFO, true),
3521127833eeSJason Baron     DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features,
352287108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ANNOUNCE, true),
3523127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features,
352487108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO4, true),
3525127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features,
352687108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO6, true),
3527127833eeSJason Baron     DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features,
352887108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_ECN, true),
3529127833eeSJason Baron     DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features,
353087108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_UFO, true),
3531127833eeSJason Baron     DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features,
353287108bb2SShannon Zhao                     VIRTIO_NET_F_MRG_RXBUF, true),
3533127833eeSJason Baron     DEFINE_PROP_BIT64("status", VirtIONet, host_features,
353487108bb2SShannon Zhao                     VIRTIO_NET_F_STATUS, true),
3535127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features,
353687108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VQ, true),
3537127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features,
353887108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX, true),
3539127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features,
354087108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VLAN, true),
3541127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features,
354287108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX_EXTRA, true),
3543127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features,
354487108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_MAC_ADDR, true),
3545127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features,
354687108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true),
3547127833eeSJason Baron     DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false),
354859079029SYuri Benditovich     DEFINE_PROP_BIT64("rss", VirtIONet, host_features,
354959079029SYuri Benditovich                     VIRTIO_NET_F_RSS, false),
3550e22f0603SYuri Benditovich     DEFINE_PROP_BIT64("hash", VirtIONet, host_features,
3551e22f0603SYuri Benditovich                     VIRTIO_NET_F_HASH_REPORT, false),
35522974e916SYuri Benditovich     DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features,
35532974e916SYuri Benditovich                     VIRTIO_NET_F_RSC_EXT, false),
35542974e916SYuri Benditovich     DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout,
35552974e916SYuri Benditovich                        VIRTIO_NET_RSC_DEFAULT_INTERVAL),
355617ec5a86SKONRAD Frederic     DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
355717ec5a86SKONRAD Frederic     DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
355817ec5a86SKONRAD Frederic                        TX_TIMER_INTERVAL),
355917ec5a86SKONRAD Frederic     DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
356017ec5a86SKONRAD Frederic     DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
35611c0fbfa3SMichael S. Tsirkin     DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size,
35621c0fbfa3SMichael S. Tsirkin                        VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE),
35639b02e161SWei Wang     DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size,
35649b02e161SWei Wang                        VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE),
3565a93e599dSMaxime Coquelin     DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0),
356675ebec11SMaxime Coquelin     DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend,
356775ebec11SMaxime Coquelin                      true),
35689473939eSJason Baron     DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN),
35699473939eSJason Baron     DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str),
35709711cd0dSJens Freimann     DEFINE_PROP_BOOL("failover", VirtIONet, failover, false),
357117ec5a86SKONRAD Frederic     DEFINE_PROP_END_OF_LIST(),
357217ec5a86SKONRAD Frederic };
357317ec5a86SKONRAD Frederic 
357417ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data)
357517ec5a86SKONRAD Frederic {
357617ec5a86SKONRAD Frederic     DeviceClass *dc = DEVICE_CLASS(klass);
357717ec5a86SKONRAD Frederic     VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
3578e6f746b3SAndreas Färber 
35794f67d30bSMarc-André Lureau     device_class_set_props(dc, virtio_net_properties);
3580290c2428SDr. David Alan Gilbert     dc->vmsd = &vmstate_virtio_net;
3581125ee0edSMarcel Apfelbaum     set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
3582e6f746b3SAndreas Färber     vdc->realize = virtio_net_device_realize;
3583306ec6c3SAndreas Färber     vdc->unrealize = virtio_net_device_unrealize;
358417ec5a86SKONRAD Frederic     vdc->get_config = virtio_net_get_config;
358517ec5a86SKONRAD Frederic     vdc->set_config = virtio_net_set_config;
358617ec5a86SKONRAD Frederic     vdc->get_features = virtio_net_get_features;
358717ec5a86SKONRAD Frederic     vdc->set_features = virtio_net_set_features;
358817ec5a86SKONRAD Frederic     vdc->bad_features = virtio_net_bad_features;
358917ec5a86SKONRAD Frederic     vdc->reset = virtio_net_reset;
359017ec5a86SKONRAD Frederic     vdc->set_status = virtio_net_set_status;
359117ec5a86SKONRAD Frederic     vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
359217ec5a86SKONRAD Frederic     vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
35932a083ffdSMichael S. Tsirkin     vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO);
35947788c3f2SMikhail Sennikovsky     vdc->post_load = virtio_net_post_load_virtio;
3595982b78c5SDr. David Alan Gilbert     vdc->vmsd = &vmstate_virtio_net_device;
35969711cd0dSJens Freimann     vdc->primary_unplug_pending = primary_unplug_pending;
359717ec5a86SKONRAD Frederic }
359817ec5a86SKONRAD Frederic 
359917ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = {
360017ec5a86SKONRAD Frederic     .name = TYPE_VIRTIO_NET,
360117ec5a86SKONRAD Frederic     .parent = TYPE_VIRTIO_DEVICE,
360217ec5a86SKONRAD Frederic     .instance_size = sizeof(VirtIONet),
360317ec5a86SKONRAD Frederic     .instance_init = virtio_net_instance_init,
360417ec5a86SKONRAD Frederic     .class_init = virtio_net_class_init,
360517ec5a86SKONRAD Frederic };
360617ec5a86SKONRAD Frederic 
360717ec5a86SKONRAD Frederic static void virtio_register_types(void)
360817ec5a86SKONRAD Frederic {
360917ec5a86SKONRAD Frederic     type_register_static(&virtio_net_info);
361017ec5a86SKONRAD Frederic }
361117ec5a86SKONRAD Frederic 
361217ec5a86SKONRAD Frederic type_init(virtio_register_types)
3613