xref: /openbmc/qemu/hw/net/virtio-net.c (revision 108a64818e69be0a97cde3838d768f2d9910c08b)
/*
 * Virtio Network Device
 *
 * Copyright IBM, Corp. 2007
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */
136e790746SPaolo Bonzini 
149b8bfe21SPeter Maydell #include "qemu/osdep.h"
159711cd0dSJens Freimann #include "qemu/atomic.h"
166e790746SPaolo Bonzini #include "qemu/iov.h"
17db725815SMarkus Armbruster #include "qemu/main-loop.h"
180b8fa32fSMarkus Armbruster #include "qemu/module.h"
196e790746SPaolo Bonzini #include "hw/virtio/virtio.h"
206e790746SPaolo Bonzini #include "net/net.h"
216e790746SPaolo Bonzini #include "net/checksum.h"
226e790746SPaolo Bonzini #include "net/tap.h"
236e790746SPaolo Bonzini #include "qemu/error-report.h"
246e790746SPaolo Bonzini #include "qemu/timer.h"
259711cd0dSJens Freimann #include "qemu/option.h"
269711cd0dSJens Freimann #include "qemu/option_int.h"
279711cd0dSJens Freimann #include "qemu/config-file.h"
289711cd0dSJens Freimann #include "qapi/qmp/qdict.h"
296e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h"
306e790746SPaolo Bonzini #include "net/vhost_net.h"
319d8c6a25SDr. David Alan Gilbert #include "net/announce.h"
3217ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h"
33e688df6bSMarkus Armbruster #include "qapi/error.h"
349af23989SMarkus Armbruster #include "qapi/qapi-events-net.h"
35a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h"
369711cd0dSJens Freimann #include "qapi/qapi-types-migration.h"
379711cd0dSJens Freimann #include "qapi/qapi-events-migration.h"
381399c60dSRusty Russell #include "hw/virtio/virtio-access.h"
39f8d806c9SJuan Quintela #include "migration/misc.h"
409473939eSJason Baron #include "standard-headers/linux/ethtool.h"
412f780b6aSMarkus Armbruster #include "sysemu/sysemu.h"
429d8c6a25SDr. David Alan Gilbert #include "trace.h"
439711cd0dSJens Freimann #include "monitor/qdev.h"
449711cd0dSJens Freimann #include "hw/pci/pci.h"
454474e37aSYuri Benditovich #include "net_rx_pkt.h"
46*108a6481SCindy Lu #include "hw/virtio/vhost.h"
476e790746SPaolo Bonzini 
#define VIRTIO_NET_VM_VERSION    11

#define MAC_TABLE_ENTRIES    64
#define MAX_VLAN    (1 << 12)   /* Per 802.1Q definition */

/* previously fixed value */
#define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256
#define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256

/* for now, only allow larger queues; with virtio-1, guest can downsize */
#define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
#define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE

#define VIRTIO_NET_IP4_ADDR_SIZE   8        /* ipv4 saddr + daddr */

#define VIRTIO_NET_TCP_FLAG         0x3F
#define VIRTIO_NET_TCP_HDR_LENGTH   0xF000

/* IPv4 max payload, 16 bits in the header */
#define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header))
#define VIRTIO_NET_MAX_TCP_PAYLOAD 65535

/* header length value in ip header without option */
#define VIRTIO_NET_IP4_HEADER_LENGTH 5

#define VIRTIO_NET_IP6_ADDR_SIZE   32      /* ipv6 saddr + daddr */
#define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD

/*
 * Purge interval of the coalesced-packets timer.  This value affects
 * performance a lot and should be tuned carefully: '300000' (300us) is the
 * recommended value to pass the WHQL test, while '50000' can gain 2x netperf
 * throughput with tso/gso/gro 'off'.
 */
#define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000

/* Every RSS hash type this file advertises in supported_hash_types */
#define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \
                                         VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \
                                         VIRTIO_NET_RSS_HASH_TYPE_UDP_EX)
9159079029SYuri Benditovich 
926e790746SPaolo Bonzini static VirtIOFeature feature_sizes[] = {
93127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MAC,
945d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mac)},
95127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_STATUS,
965d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, status)},
97127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MQ,
985d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
99127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MTU,
1005d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mtu)},
1019473939eSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX,
1025d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, duplex)},
103e22f0603SYuri Benditovich     {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT),
10459079029SYuri Benditovich      .end = endof(struct virtio_net_config, supported_hash_types)},
1056e790746SPaolo Bonzini     {}
1066e790746SPaolo Bonzini };
1076e790746SPaolo Bonzini 
1086e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
1096e790746SPaolo Bonzini {
1106e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1116e790746SPaolo Bonzini 
1126e790746SPaolo Bonzini     return &n->vqs[nc->queue_index];
1136e790746SPaolo Bonzini }
1146e790746SPaolo Bonzini 
/*
 * Convert a virtqueue index into a queue index: two consecutive virtqueue
 * indices map onto the same queue index.
 */
static int vq2q(int queue_index)
{
    return queue_index / 2;
}
1196e790746SPaolo Bonzini 
/* TODO
 * - we could suppress RX interrupt if we were so inclined.
 */
1236e790746SPaolo Bonzini 
1246e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
1256e790746SPaolo Bonzini {
12617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1276e790746SPaolo Bonzini     struct virtio_net_config netcfg;
1286e790746SPaolo Bonzini 
129*108a6481SCindy Lu     int ret = 0;
130*108a6481SCindy Lu     memset(&netcfg, 0 , sizeof(struct virtio_net_config));
1311399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.status, n->status);
1321399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queues);
133a93e599dSMaxime Coquelin     virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu);
1346e790746SPaolo Bonzini     memcpy(netcfg.mac, n->mac, ETH_ALEN);
1359473939eSJason Baron     virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed);
1369473939eSJason Baron     netcfg.duplex = n->net_conf.duplex;
13759079029SYuri Benditovich     netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE;
13859079029SYuri Benditovich     virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length,
139e22f0603SYuri Benditovich                  virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ?
140e22f0603SYuri Benditovich                  VIRTIO_NET_RSS_MAX_TABLE_LEN : 1);
14159079029SYuri Benditovich     virtio_stl_p(vdev, &netcfg.supported_hash_types,
14259079029SYuri Benditovich                  VIRTIO_NET_RSS_SUPPORTED_HASHES);
1436e790746SPaolo Bonzini     memcpy(config, &netcfg, n->config_size);
144*108a6481SCindy Lu 
145*108a6481SCindy Lu     NetClientState *nc = qemu_get_queue(n->nic);
146*108a6481SCindy Lu     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
147*108a6481SCindy Lu         ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg,
148*108a6481SCindy Lu                              n->config_size);
149*108a6481SCindy Lu     if (ret != -1) {
150*108a6481SCindy Lu         memcpy(config, &netcfg, n->config_size);
151*108a6481SCindy Lu     }
152*108a6481SCindy Lu     }
1536e790746SPaolo Bonzini }
1546e790746SPaolo Bonzini 
1556e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
1566e790746SPaolo Bonzini {
15717a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1586e790746SPaolo Bonzini     struct virtio_net_config netcfg = {};
1596e790746SPaolo Bonzini 
1606e790746SPaolo Bonzini     memcpy(&netcfg, config, n->config_size);
1616e790746SPaolo Bonzini 
16295129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) &&
16395129d6fSCornelia Huck         !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) &&
1646e790746SPaolo Bonzini         memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
1656e790746SPaolo Bonzini         memcpy(n->mac, netcfg.mac, ETH_ALEN);
1666e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1676e790746SPaolo Bonzini     }
168*108a6481SCindy Lu 
169*108a6481SCindy Lu     NetClientState *nc = qemu_get_queue(n->nic);
170*108a6481SCindy Lu     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
171*108a6481SCindy Lu         vhost_net_set_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg,
172*108a6481SCindy Lu                                0, n->config_size,
173*108a6481SCindy Lu                         VHOST_SET_CONFIG_TYPE_MASTER);
174*108a6481SCindy Lu       }
1756e790746SPaolo Bonzini }
1766e790746SPaolo Bonzini 
1776e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status)
1786e790746SPaolo Bonzini {
17917a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1806e790746SPaolo Bonzini     return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
18117a0ca55SKONRAD Frederic         (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
1826e790746SPaolo Bonzini }
1836e790746SPaolo Bonzini 
184b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net)
185b2c929f0SDr. David Alan Gilbert {
186b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(net);
187b2c929f0SDr. David Alan Gilbert     trace_virtio_net_announce_notify();
188b2c929f0SDr. David Alan Gilbert 
189b2c929f0SDr. David Alan Gilbert     net->status |= VIRTIO_NET_S_ANNOUNCE;
190b2c929f0SDr. David Alan Gilbert     virtio_notify_config(vdev);
191b2c929f0SDr. David Alan Gilbert }
192b2c929f0SDr. David Alan Gilbert 
193f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque)
194f57fcf70SJason Wang {
195f57fcf70SJason Wang     VirtIONet *n = opaque;
1969d8c6a25SDr. David Alan Gilbert     trace_virtio_net_announce_timer(n->announce_timer.round);
197f57fcf70SJason Wang 
1989d8c6a25SDr. David Alan Gilbert     n->announce_timer.round--;
199b2c929f0SDr. David Alan Gilbert     virtio_net_announce_notify(n);
200b2c929f0SDr. David Alan Gilbert }
201b2c929f0SDr. David Alan Gilbert 
202b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc)
203b2c929f0SDr. David Alan Gilbert {
204b2c929f0SDr. David Alan Gilbert     VirtIONet *n = qemu_get_nic_opaque(nc);
205b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
206b2c929f0SDr. David Alan Gilbert 
207b2c929f0SDr. David Alan Gilbert     /*
208b2c929f0SDr. David Alan Gilbert      * Make sure the virtio migration announcement timer isn't running
209b2c929f0SDr. David Alan Gilbert      * If it is, let it trigger announcement so that we do not cause
210b2c929f0SDr. David Alan Gilbert      * confusion.
211b2c929f0SDr. David Alan Gilbert      */
212b2c929f0SDr. David Alan Gilbert     if (n->announce_timer.round) {
213b2c929f0SDr. David Alan Gilbert         return;
214b2c929f0SDr. David Alan Gilbert     }
215b2c929f0SDr. David Alan Gilbert 
216b2c929f0SDr. David Alan Gilbert     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
217b2c929f0SDr. David Alan Gilbert         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
218b2c929f0SDr. David Alan Gilbert             virtio_net_announce_notify(n);
219b2c929f0SDr. David Alan Gilbert     }
220f57fcf70SJason Wang }
221f57fcf70SJason Wang 
2226e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
2236e790746SPaolo Bonzini {
22417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2256e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
2266e790746SPaolo Bonzini     int queues = n->multiqueue ? n->max_queues : 1;
2276e790746SPaolo Bonzini 
228ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
2296e790746SPaolo Bonzini         return;
2306e790746SPaolo Bonzini     }
2316e790746SPaolo Bonzini 
2328c1ac475SRadim Krčmář     if ((virtio_net_started(n, status) && !nc->peer->link_down) ==
2338c1ac475SRadim Krčmář         !!n->vhost_started) {
2346e790746SPaolo Bonzini         return;
2356e790746SPaolo Bonzini     }
2366e790746SPaolo Bonzini     if (!n->vhost_started) {
237086abc1cSMichael S. Tsirkin         int r, i;
238086abc1cSMichael S. Tsirkin 
2391bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
2401bfa316cSGreg Kurz             error_report("backend does not support %s vnet headers; "
2411bfa316cSGreg Kurz                          "falling back on userspace virtio",
2421bfa316cSGreg Kurz                          virtio_is_big_endian(vdev) ? "BE" : "LE");
2431bfa316cSGreg Kurz             return;
2441bfa316cSGreg Kurz         }
2451bfa316cSGreg Kurz 
246086abc1cSMichael S. Tsirkin         /* Any packets outstanding? Purge them to avoid touching rings
247086abc1cSMichael S. Tsirkin          * when vhost is running.
248086abc1cSMichael S. Tsirkin          */
249086abc1cSMichael S. Tsirkin         for (i = 0;  i < queues; i++) {
250086abc1cSMichael S. Tsirkin             NetClientState *qnc = qemu_get_subqueue(n->nic, i);
251086abc1cSMichael S. Tsirkin 
252086abc1cSMichael S. Tsirkin             /* Purge both directions: TX and RX. */
253086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->peer->incoming_queue, qnc);
254086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->incoming_queue, qnc->peer);
255086abc1cSMichael S. Tsirkin         }
256086abc1cSMichael S. Tsirkin 
257a93e599dSMaxime Coquelin         if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) {
258a93e599dSMaxime Coquelin             r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu);
259a93e599dSMaxime Coquelin             if (r < 0) {
260a93e599dSMaxime Coquelin                 error_report("%uBytes MTU not supported by the backend",
261a93e599dSMaxime Coquelin                              n->net_conf.mtu);
262a93e599dSMaxime Coquelin 
263a93e599dSMaxime Coquelin                 return;
264a93e599dSMaxime Coquelin             }
265a93e599dSMaxime Coquelin         }
266a93e599dSMaxime Coquelin 
2676e790746SPaolo Bonzini         n->vhost_started = 1;
26817a0ca55SKONRAD Frederic         r = vhost_net_start(vdev, n->nic->ncs, queues);
2696e790746SPaolo Bonzini         if (r < 0) {
2706e790746SPaolo Bonzini             error_report("unable to start vhost net: %d: "
2716e790746SPaolo Bonzini                          "falling back on userspace virtio", -r);
2726e790746SPaolo Bonzini             n->vhost_started = 0;
2736e790746SPaolo Bonzini         }
2746e790746SPaolo Bonzini     } else {
27517a0ca55SKONRAD Frederic         vhost_net_stop(vdev, n->nic->ncs, queues);
2766e790746SPaolo Bonzini         n->vhost_started = 0;
2776e790746SPaolo Bonzini     }
2786e790746SPaolo Bonzini }
2796e790746SPaolo Bonzini 
2801bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev,
2811bfa316cSGreg Kurz                                           NetClientState *peer,
2821bfa316cSGreg Kurz                                           bool enable)
2831bfa316cSGreg Kurz {
2841bfa316cSGreg Kurz     if (virtio_is_big_endian(vdev)) {
2851bfa316cSGreg Kurz         return qemu_set_vnet_be(peer, enable);
2861bfa316cSGreg Kurz     } else {
2871bfa316cSGreg Kurz         return qemu_set_vnet_le(peer, enable);
2881bfa316cSGreg Kurz     }
2891bfa316cSGreg Kurz }
2901bfa316cSGreg Kurz 
2911bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs,
2921bfa316cSGreg Kurz                                        int queues, bool enable)
2931bfa316cSGreg Kurz {
2941bfa316cSGreg Kurz     int i;
2951bfa316cSGreg Kurz 
2961bfa316cSGreg Kurz     for (i = 0; i < queues; i++) {
2971bfa316cSGreg Kurz         if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 &&
2981bfa316cSGreg Kurz             enable) {
2991bfa316cSGreg Kurz             while (--i >= 0) {
3001bfa316cSGreg Kurz                 virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false);
3011bfa316cSGreg Kurz             }
3021bfa316cSGreg Kurz 
3031bfa316cSGreg Kurz             return true;
3041bfa316cSGreg Kurz         }
3051bfa316cSGreg Kurz     }
3061bfa316cSGreg Kurz 
3071bfa316cSGreg Kurz     return false;
3081bfa316cSGreg Kurz }
3091bfa316cSGreg Kurz 
3101bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status)
3111bfa316cSGreg Kurz {
3121bfa316cSGreg Kurz     VirtIODevice *vdev = VIRTIO_DEVICE(n);
3131bfa316cSGreg Kurz     int queues = n->multiqueue ? n->max_queues : 1;
3141bfa316cSGreg Kurz 
3151bfa316cSGreg Kurz     if (virtio_net_started(n, status)) {
3161bfa316cSGreg Kurz         /* Before using the device, we tell the network backend about the
3171bfa316cSGreg Kurz          * endianness to use when parsing vnet headers. If the backend
3181bfa316cSGreg Kurz          * can't do it, we fallback onto fixing the headers in the core
3191bfa316cSGreg Kurz          * virtio-net code.
3201bfa316cSGreg Kurz          */
3211bfa316cSGreg Kurz         n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs,
3221bfa316cSGreg Kurz                                                             queues, true);
3231bfa316cSGreg Kurz     } else if (virtio_net_started(n, vdev->status)) {
3241bfa316cSGreg Kurz         /* After using the device, we need to reset the network backend to
3251bfa316cSGreg Kurz          * the default (guest native endianness), otherwise the guest may
3261bfa316cSGreg Kurz          * lose network connectivity if it is rebooted into a different
3271bfa316cSGreg Kurz          * endianness.
3281bfa316cSGreg Kurz          */
3291bfa316cSGreg Kurz         virtio_net_set_vnet_endian(vdev, n->nic->ncs, queues, false);
3301bfa316cSGreg Kurz     }
3311bfa316cSGreg Kurz }
3321bfa316cSGreg Kurz 
333283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq)
334283e2c2aSYuri Benditovich {
335283e2c2aSYuri Benditovich     unsigned int dropped = virtqueue_drop_all(vq);
336283e2c2aSYuri Benditovich     if (dropped) {
337283e2c2aSYuri Benditovich         virtio_notify(vdev, vq);
338283e2c2aSYuri Benditovich     }
339283e2c2aSYuri Benditovich }
340283e2c2aSYuri Benditovich 
3416e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
3426e790746SPaolo Bonzini {
34317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
3446e790746SPaolo Bonzini     VirtIONetQueue *q;
3456e790746SPaolo Bonzini     int i;
3466e790746SPaolo Bonzini     uint8_t queue_status;
3476e790746SPaolo Bonzini 
3481bfa316cSGreg Kurz     virtio_net_vnet_endian_status(n, status);
3496e790746SPaolo Bonzini     virtio_net_vhost_status(n, status);
3506e790746SPaolo Bonzini 
3516e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
35238705bb5SFam Zheng         NetClientState *ncs = qemu_get_subqueue(n->nic, i);
35338705bb5SFam Zheng         bool queue_started;
3546e790746SPaolo Bonzini         q = &n->vqs[i];
3556e790746SPaolo Bonzini 
3566e790746SPaolo Bonzini         if ((!n->multiqueue && i != 0) || i >= n->curr_queues) {
3576e790746SPaolo Bonzini             queue_status = 0;
3586e790746SPaolo Bonzini         } else {
3596e790746SPaolo Bonzini             queue_status = status;
3606e790746SPaolo Bonzini         }
36138705bb5SFam Zheng         queue_started =
36238705bb5SFam Zheng             virtio_net_started(n, queue_status) && !n->vhost_started;
36338705bb5SFam Zheng 
36438705bb5SFam Zheng         if (queue_started) {
36538705bb5SFam Zheng             qemu_flush_queued_packets(ncs);
36638705bb5SFam Zheng         }
3676e790746SPaolo Bonzini 
3686e790746SPaolo Bonzini         if (!q->tx_waiting) {
3696e790746SPaolo Bonzini             continue;
3706e790746SPaolo Bonzini         }
3716e790746SPaolo Bonzini 
37238705bb5SFam Zheng         if (queue_started) {
3736e790746SPaolo Bonzini             if (q->tx_timer) {
374bc72ad67SAlex Bligh                 timer_mod(q->tx_timer,
375bc72ad67SAlex Bligh                                qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
3766e790746SPaolo Bonzini             } else {
3776e790746SPaolo Bonzini                 qemu_bh_schedule(q->tx_bh);
3786e790746SPaolo Bonzini             }
3796e790746SPaolo Bonzini         } else {
3806e790746SPaolo Bonzini             if (q->tx_timer) {
381bc72ad67SAlex Bligh                 timer_del(q->tx_timer);
3826e790746SPaolo Bonzini             } else {
3836e790746SPaolo Bonzini                 qemu_bh_cancel(q->tx_bh);
3846e790746SPaolo Bonzini             }
385283e2c2aSYuri Benditovich             if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 &&
38670e53e6eSJason Wang                 (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) &&
38770e53e6eSJason Wang                 vdev->vm_running) {
388283e2c2aSYuri Benditovich                 /* if tx is waiting we are likely have some packets in tx queue
389283e2c2aSYuri Benditovich                  * and disabled notification */
390283e2c2aSYuri Benditovich                 q->tx_waiting = 0;
391283e2c2aSYuri Benditovich                 virtio_queue_set_notification(q->tx_vq, 1);
392283e2c2aSYuri Benditovich                 virtio_net_drop_tx_queue_data(vdev, q->tx_vq);
393283e2c2aSYuri Benditovich             }
3946e790746SPaolo Bonzini         }
3956e790746SPaolo Bonzini     }
3966e790746SPaolo Bonzini }
3976e790746SPaolo Bonzini 
3986e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc)
3996e790746SPaolo Bonzini {
4006e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
40117a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
4026e790746SPaolo Bonzini     uint16_t old_status = n->status;
4036e790746SPaolo Bonzini 
4046e790746SPaolo Bonzini     if (nc->link_down)
4056e790746SPaolo Bonzini         n->status &= ~VIRTIO_NET_S_LINK_UP;
4066e790746SPaolo Bonzini     else
4076e790746SPaolo Bonzini         n->status |= VIRTIO_NET_S_LINK_UP;
4086e790746SPaolo Bonzini 
4096e790746SPaolo Bonzini     if (n->status != old_status)
41017a0ca55SKONRAD Frederic         virtio_notify_config(vdev);
4116e790746SPaolo Bonzini 
41217a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
4136e790746SPaolo Bonzini }
4146e790746SPaolo Bonzini 
415b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc)
416b1be4280SAmos Kong {
417b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
418b1be4280SAmos Kong 
419b1be4280SAmos Kong     if (nc->rxfilter_notify_enabled) {
420ddfb0baaSMarkus Armbruster         char *path = object_get_canonical_path(OBJECT(n->qdev));
42106150279SWenchao Xia         qapi_event_send_nic_rx_filter_changed(!!n->netclient_name,
4223ab72385SPeter Xu                                               n->netclient_name, path);
42396e35046SAmos Kong         g_free(path);
424b1be4280SAmos Kong 
425b1be4280SAmos Kong         /* disable event notification to avoid events flooding */
426b1be4280SAmos Kong         nc->rxfilter_notify_enabled = 0;
427b1be4280SAmos Kong     }
428b1be4280SAmos Kong }
429b1be4280SAmos Kong 
430f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n)
431f7bc8ef8SAmos Kong {
432f7bc8ef8SAmos Kong     intList *list, *entry;
433f7bc8ef8SAmos Kong     int i, j;
434f7bc8ef8SAmos Kong 
435f7bc8ef8SAmos Kong     list = NULL;
436f7bc8ef8SAmos Kong     for (i = 0; i < MAX_VLAN >> 5; i++) {
437f7bc8ef8SAmos Kong         for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
438f7bc8ef8SAmos Kong             if (n->vlans[i] & (1U << j)) {
439f7bc8ef8SAmos Kong                 entry = g_malloc0(sizeof(*entry));
440f7bc8ef8SAmos Kong                 entry->value = (i << 5) + j;
441f7bc8ef8SAmos Kong                 entry->next = list;
442f7bc8ef8SAmos Kong                 list = entry;
443f7bc8ef8SAmos Kong             }
444f7bc8ef8SAmos Kong         }
445f7bc8ef8SAmos Kong     }
446f7bc8ef8SAmos Kong 
447f7bc8ef8SAmos Kong     return list;
448f7bc8ef8SAmos Kong }
449f7bc8ef8SAmos Kong 
450b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
451b1be4280SAmos Kong {
452b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
453f7bc8ef8SAmos Kong     VirtIODevice *vdev = VIRTIO_DEVICE(n);
454b1be4280SAmos Kong     RxFilterInfo *info;
455b1be4280SAmos Kong     strList *str_list, *entry;
456f7bc8ef8SAmos Kong     int i;
457b1be4280SAmos Kong 
458b1be4280SAmos Kong     info = g_malloc0(sizeof(*info));
459b1be4280SAmos Kong     info->name = g_strdup(nc->name);
460b1be4280SAmos Kong     info->promiscuous = n->promisc;
461b1be4280SAmos Kong 
462b1be4280SAmos Kong     if (n->nouni) {
463b1be4280SAmos Kong         info->unicast = RX_STATE_NONE;
464b1be4280SAmos Kong     } else if (n->alluni) {
465b1be4280SAmos Kong         info->unicast = RX_STATE_ALL;
466b1be4280SAmos Kong     } else {
467b1be4280SAmos Kong         info->unicast = RX_STATE_NORMAL;
468b1be4280SAmos Kong     }
469b1be4280SAmos Kong 
470b1be4280SAmos Kong     if (n->nomulti) {
471b1be4280SAmos Kong         info->multicast = RX_STATE_NONE;
472b1be4280SAmos Kong     } else if (n->allmulti) {
473b1be4280SAmos Kong         info->multicast = RX_STATE_ALL;
474b1be4280SAmos Kong     } else {
475b1be4280SAmos Kong         info->multicast = RX_STATE_NORMAL;
476b1be4280SAmos Kong     }
477b1be4280SAmos Kong 
478b1be4280SAmos Kong     info->broadcast_allowed = n->nobcast;
479b1be4280SAmos Kong     info->multicast_overflow = n->mac_table.multi_overflow;
480b1be4280SAmos Kong     info->unicast_overflow = n->mac_table.uni_overflow;
481b1be4280SAmos Kong 
482b0575ba4SScott Feldman     info->main_mac = qemu_mac_strdup_printf(n->mac);
483b1be4280SAmos Kong 
484b1be4280SAmos Kong     str_list = NULL;
485b1be4280SAmos Kong     for (i = 0; i < n->mac_table.first_multi; i++) {
486b1be4280SAmos Kong         entry = g_malloc0(sizeof(*entry));
487b0575ba4SScott Feldman         entry->value = qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
488b1be4280SAmos Kong         entry->next = str_list;
489b1be4280SAmos Kong         str_list = entry;
490b1be4280SAmos Kong     }
491b1be4280SAmos Kong     info->unicast_table = str_list;
492b1be4280SAmos Kong 
493b1be4280SAmos Kong     str_list = NULL;
494b1be4280SAmos Kong     for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
495b1be4280SAmos Kong         entry = g_malloc0(sizeof(*entry));
496b0575ba4SScott Feldman         entry->value = qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
497b1be4280SAmos Kong         entry->next = str_list;
498b1be4280SAmos Kong         str_list = entry;
499b1be4280SAmos Kong     }
500b1be4280SAmos Kong     info->multicast_table = str_list;
501f7bc8ef8SAmos Kong     info->vlan_table = get_vlan_table(n);
502b1be4280SAmos Kong 
50395129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) {
504f7bc8ef8SAmos Kong         info->vlan = RX_STATE_ALL;
505f7bc8ef8SAmos Kong     } else if (!info->vlan_table) {
506f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NONE;
507f7bc8ef8SAmos Kong     } else {
508f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NORMAL;
509b1be4280SAmos Kong     }
510b1be4280SAmos Kong 
511b1be4280SAmos Kong     /* enable event notification after query */
512b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
513b1be4280SAmos Kong 
514b1be4280SAmos Kong     return info;
515b1be4280SAmos Kong }
516b1be4280SAmos Kong 
5176e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev)
5186e790746SPaolo Bonzini {
51917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
52094b52958SGreg Kurz     int i;
5216e790746SPaolo Bonzini 
5226e790746SPaolo Bonzini     /* Reset back to compatibility mode */
5236e790746SPaolo Bonzini     n->promisc = 1;
5246e790746SPaolo Bonzini     n->allmulti = 0;
5256e790746SPaolo Bonzini     n->alluni = 0;
5266e790746SPaolo Bonzini     n->nomulti = 0;
5276e790746SPaolo Bonzini     n->nouni = 0;
5286e790746SPaolo Bonzini     n->nobcast = 0;
5296e790746SPaolo Bonzini     /* multiqueue is disabled by default */
5306e790746SPaolo Bonzini     n->curr_queues = 1;
5319d8c6a25SDr. David Alan Gilbert     timer_del(n->announce_timer.tm);
5329d8c6a25SDr. David Alan Gilbert     n->announce_timer.round = 0;
533f57fcf70SJason Wang     n->status &= ~VIRTIO_NET_S_ANNOUNCE;
5346e790746SPaolo Bonzini 
5356e790746SPaolo Bonzini     /* Flush any MAC and VLAN filter table state */
5366e790746SPaolo Bonzini     n->mac_table.in_use = 0;
5376e790746SPaolo Bonzini     n->mac_table.first_multi = 0;
5386e790746SPaolo Bonzini     n->mac_table.multi_overflow = 0;
5396e790746SPaolo Bonzini     n->mac_table.uni_overflow = 0;
5406e790746SPaolo Bonzini     memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
5416e790746SPaolo Bonzini     memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
542702d66a8SMichael S. Tsirkin     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
5436e790746SPaolo Bonzini     memset(n->vlans, 0, MAX_VLAN >> 3);
54494b52958SGreg Kurz 
54594b52958SGreg Kurz     /* Flush any async TX */
54694b52958SGreg Kurz     for (i = 0;  i < n->max_queues; i++) {
54794b52958SGreg Kurz         NetClientState *nc = qemu_get_subqueue(n->nic, i);
54894b52958SGreg Kurz 
54994b52958SGreg Kurz         if (nc->peer) {
55094b52958SGreg Kurz             qemu_flush_or_purge_queued_packets(nc->peer, true);
55194b52958SGreg Kurz             assert(!virtio_net_get_subqueue(nc)->async_tx.elem);
55294b52958SGreg Kurz         }
55394b52958SGreg Kurz     }
5546e790746SPaolo Bonzini }
5556e790746SPaolo Bonzini 
5566e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n)
5576e790746SPaolo Bonzini {
5586e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
5596e790746SPaolo Bonzini     if (!nc->peer) {
5606e790746SPaolo Bonzini         return;
5616e790746SPaolo Bonzini     }
5626e790746SPaolo Bonzini 
563d6085e3aSStefan Hajnoczi     n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
5646e790746SPaolo Bonzini }
5656e790746SPaolo Bonzini 
5666e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n)
5676e790746SPaolo Bonzini {
5686e790746SPaolo Bonzini     return n->has_vnet_hdr;
5696e790746SPaolo Bonzini }
5706e790746SPaolo Bonzini 
5716e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n)
5726e790746SPaolo Bonzini {
5736e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n))
5746e790746SPaolo Bonzini         return 0;
5756e790746SPaolo Bonzini 
576d6085e3aSStefan Hajnoczi     n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
5776e790746SPaolo Bonzini 
5786e790746SPaolo Bonzini     return n->has_ufo;
5796e790746SPaolo Bonzini }
5806e790746SPaolo Bonzini 
581bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs,
582e22f0603SYuri Benditovich                                        int version_1, int hash_report)
5836e790746SPaolo Bonzini {
5846e790746SPaolo Bonzini     int i;
5856e790746SPaolo Bonzini     NetClientState *nc;
5866e790746SPaolo Bonzini 
5876e790746SPaolo Bonzini     n->mergeable_rx_bufs = mergeable_rx_bufs;
5886e790746SPaolo Bonzini 
589bb9d17f8SCornelia Huck     if (version_1) {
590e22f0603SYuri Benditovich         n->guest_hdr_len = hash_report ?
591e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_v1_hash) :
592e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_mrg_rxbuf);
593e22f0603SYuri Benditovich         n->rss_data.populate_hash = !!hash_report;
594bb9d17f8SCornelia Huck     } else {
5956e790746SPaolo Bonzini         n->guest_hdr_len = n->mergeable_rx_bufs ?
596bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr_mrg_rxbuf) :
597bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr);
598bb9d17f8SCornelia Huck     }
5996e790746SPaolo Bonzini 
6006e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
6016e790746SPaolo Bonzini         nc = qemu_get_subqueue(n->nic, i);
6026e790746SPaolo Bonzini 
6036e790746SPaolo Bonzini         if (peer_has_vnet_hdr(n) &&
604d6085e3aSStefan Hajnoczi             qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
605d6085e3aSStefan Hajnoczi             qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
6066e790746SPaolo Bonzini             n->host_hdr_len = n->guest_hdr_len;
6076e790746SPaolo Bonzini         }
6086e790746SPaolo Bonzini     }
6096e790746SPaolo Bonzini }
6106e790746SPaolo Bonzini 
6112eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n)
6122eef278bSMichael S. Tsirkin {
6132eef278bSMichael S. Tsirkin     NetClientState *peer = n->nic_conf.peers.ncs[0];
6142eef278bSMichael S. Tsirkin 
6152eef278bSMichael S. Tsirkin     /*
6162eef278bSMichael S. Tsirkin      * Backends other than vhost-user don't support max queue size.
6172eef278bSMichael S. Tsirkin      */
6182eef278bSMichael S. Tsirkin     if (!peer) {
6192eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6202eef278bSMichael S. Tsirkin     }
6212eef278bSMichael S. Tsirkin 
6222eef278bSMichael S. Tsirkin     if (peer->info->type != NET_CLIENT_DRIVER_VHOST_USER) {
6232eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6242eef278bSMichael S. Tsirkin     }
6252eef278bSMichael S. Tsirkin 
6262eef278bSMichael S. Tsirkin     return VIRTQUEUE_MAX_SIZE;
6272eef278bSMichael S. Tsirkin }
6282eef278bSMichael S. Tsirkin 
6296e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index)
6306e790746SPaolo Bonzini {
6316e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6326e790746SPaolo Bonzini 
6336e790746SPaolo Bonzini     if (!nc->peer) {
6346e790746SPaolo Bonzini         return 0;
6356e790746SPaolo Bonzini     }
6366e790746SPaolo Bonzini 
637f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6387263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 1);
6397263a0adSChangchun Ouyang     }
6407263a0adSChangchun Ouyang 
641f394b2e2SEric Blake     if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
6426e790746SPaolo Bonzini         return 0;
6436e790746SPaolo Bonzini     }
6446e790746SPaolo Bonzini 
6451074b879SJason Wang     if (n->max_queues == 1) {
6461074b879SJason Wang         return 0;
6471074b879SJason Wang     }
6481074b879SJason Wang 
6496e790746SPaolo Bonzini     return tap_enable(nc->peer);
6506e790746SPaolo Bonzini }
6516e790746SPaolo Bonzini 
6526e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index)
6536e790746SPaolo Bonzini {
6546e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6556e790746SPaolo Bonzini 
6566e790746SPaolo Bonzini     if (!nc->peer) {
6576e790746SPaolo Bonzini         return 0;
6586e790746SPaolo Bonzini     }
6596e790746SPaolo Bonzini 
660f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6617263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 0);
6627263a0adSChangchun Ouyang     }
6637263a0adSChangchun Ouyang 
664f394b2e2SEric Blake     if (nc->peer->info->type !=  NET_CLIENT_DRIVER_TAP) {
6656e790746SPaolo Bonzini         return 0;
6666e790746SPaolo Bonzini     }
6676e790746SPaolo Bonzini 
6686e790746SPaolo Bonzini     return tap_disable(nc->peer);
6696e790746SPaolo Bonzini }
6706e790746SPaolo Bonzini 
6716e790746SPaolo Bonzini static void virtio_net_set_queues(VirtIONet *n)
6726e790746SPaolo Bonzini {
6736e790746SPaolo Bonzini     int i;
674ddfa83eaSJoel Stanley     int r;
6756e790746SPaolo Bonzini 
67668b5f314SYuri Benditovich     if (n->nic->peer_deleted) {
67768b5f314SYuri Benditovich         return;
67868b5f314SYuri Benditovich     }
67968b5f314SYuri Benditovich 
6806e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
6816e790746SPaolo Bonzini         if (i < n->curr_queues) {
682ddfa83eaSJoel Stanley             r = peer_attach(n, i);
683ddfa83eaSJoel Stanley             assert(!r);
6846e790746SPaolo Bonzini         } else {
685ddfa83eaSJoel Stanley             r = peer_detach(n, i);
686ddfa83eaSJoel Stanley             assert(!r);
6876e790746SPaolo Bonzini         }
6886e790746SPaolo Bonzini     }
6896e790746SPaolo Bonzini }
6906e790746SPaolo Bonzini 
691ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
6926e790746SPaolo Bonzini 
6939d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features,
6949d5b731dSJason Wang                                         Error **errp)
6956e790746SPaolo Bonzini {
69617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
6976e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
6986e790746SPaolo Bonzini 
699da3e8a23SShannon Zhao     /* Firstly sync all virtio-net possible supported features */
700da3e8a23SShannon Zhao     features |= n->host_features;
701da3e8a23SShannon Zhao 
7020cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7036e790746SPaolo Bonzini 
7046e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n)) {
7050cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_CSUM);
7060cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7070cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7080cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN);
7096e790746SPaolo Bonzini 
7100cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM);
7110cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4);
7120cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6);
7130cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN);
714e22f0603SYuri Benditovich 
715e22f0603SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
7166e790746SPaolo Bonzini     }
7176e790746SPaolo Bonzini 
7186e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
7190cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO);
7200cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO);
7216e790746SPaolo Bonzini     }
7226e790746SPaolo Bonzini 
723ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
7246e790746SPaolo Bonzini         return features;
7256e790746SPaolo Bonzini     }
7262974e916SYuri Benditovich 
72759079029SYuri Benditovich     virtio_clear_feature(&features, VIRTIO_NET_F_RSS);
728e22f0603SYuri Benditovich     virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
72975ebec11SMaxime Coquelin     features = vhost_net_get_features(get_vhost_net(nc->peer), features);
73075ebec11SMaxime Coquelin     vdev->backend_features = features;
73175ebec11SMaxime Coquelin 
73275ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
73375ebec11SMaxime Coquelin             (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) {
73475ebec11SMaxime Coquelin         features |= (1ULL << VIRTIO_NET_F_MTU);
73575ebec11SMaxime Coquelin     }
73675ebec11SMaxime Coquelin 
73775ebec11SMaxime Coquelin     return features;
7386e790746SPaolo Bonzini }
7396e790746SPaolo Bonzini 
740019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev)
7416e790746SPaolo Bonzini {
742019a3edbSGerd Hoffmann     uint64_t features = 0;
7436e790746SPaolo Bonzini 
7446e790746SPaolo Bonzini     /* Linux kernel 2.6.25.  It understood MAC (as everyone must),
7456e790746SPaolo Bonzini      * but also these: */
7460cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7470cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_CSUM);
7480cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7490cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7500cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN);
7516e790746SPaolo Bonzini 
7526e790746SPaolo Bonzini     return features;
7536e790746SPaolo Bonzini }
7546e790746SPaolo Bonzini 
755644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n)
756644c9858SDmitry Fleytman {
757ad37bb3bSStefan Hajnoczi     qemu_set_offload(qemu_get_queue(n->nic)->peer,
758644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
759644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
760644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
761644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
762644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
763644c9858SDmitry Fleytman }
764644c9858SDmitry Fleytman 
765644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
766644c9858SDmitry Fleytman {
767644c9858SDmitry Fleytman     static const uint64_t guest_offloads_mask =
768644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
769644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
770644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
771644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_ECN)  |
772644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_UFO);
773644c9858SDmitry Fleytman 
774644c9858SDmitry Fleytman     return guest_offloads_mask & features;
775644c9858SDmitry Fleytman }
776644c9858SDmitry Fleytman 
777644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
778644c9858SDmitry Fleytman {
779644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
780644c9858SDmitry Fleytman     return virtio_net_guest_offloads_by_features(vdev->guest_features);
781644c9858SDmitry Fleytman }
782644c9858SDmitry Fleytman 
7839711cd0dSJens Freimann static void failover_add_primary(VirtIONet *n, Error **errp)
7849711cd0dSJens Freimann {
7859711cd0dSJens Freimann     Error *err = NULL;
7869711cd0dSJens Freimann 
787117378bfSJens Freimann     if (n->primary_dev) {
788117378bfSJens Freimann         return;
789117378bfSJens Freimann     }
790117378bfSJens Freimann 
7919711cd0dSJens Freimann     n->primary_device_opts = qemu_opts_find(qemu_find_opts("device"),
7929711cd0dSJens Freimann             n->primary_device_id);
7939711cd0dSJens Freimann     if (n->primary_device_opts) {
7949711cd0dSJens Freimann         n->primary_dev = qdev_device_add(n->primary_device_opts, &err);
7959711cd0dSJens Freimann         if (err) {
7969711cd0dSJens Freimann             qemu_opts_del(n->primary_device_opts);
7979711cd0dSJens Freimann         }
7989711cd0dSJens Freimann         if (n->primary_dev) {
7999711cd0dSJens Freimann             n->primary_bus = n->primary_dev->parent_bus;
8009711cd0dSJens Freimann             if (err) {
8019711cd0dSJens Freimann                 qdev_unplug(n->primary_dev, &err);
8029711cd0dSJens Freimann                 qdev_set_id(n->primary_dev, "");
8039711cd0dSJens Freimann 
8049711cd0dSJens Freimann             }
8059711cd0dSJens Freimann         }
8069711cd0dSJens Freimann     } else {
8079711cd0dSJens Freimann         error_setg(errp, "Primary device not found");
8089711cd0dSJens Freimann         error_append_hint(errp, "Virtio-net failover will not work. Make "
8099711cd0dSJens Freimann             "sure primary device has parameter"
8109711cd0dSJens Freimann             " failover_pair_id=<virtio-net-id>\n");
8119711cd0dSJens Freimann }
8129711cd0dSJens Freimann     if (err) {
8139711cd0dSJens Freimann         error_propagate(errp, err);
8149711cd0dSJens Freimann     }
8159711cd0dSJens Freimann }
8169711cd0dSJens Freimann 
8179711cd0dSJens Freimann static int is_my_primary(void *opaque, QemuOpts *opts, Error **errp)
8189711cd0dSJens Freimann {
8199711cd0dSJens Freimann     VirtIONet *n = opaque;
8209711cd0dSJens Freimann     int ret = 0;
8219711cd0dSJens Freimann 
8229711cd0dSJens Freimann     const char *standby_id = qemu_opt_get(opts, "failover_pair_id");
8239711cd0dSJens Freimann 
8249711cd0dSJens Freimann     if (standby_id != NULL && (g_strcmp0(standby_id, n->netclient_name) == 0)) {
8259711cd0dSJens Freimann         n->primary_device_id = g_strdup(opts->id);
8269711cd0dSJens Freimann         ret = 1;
8279711cd0dSJens Freimann     }
8289711cd0dSJens Freimann 
8299711cd0dSJens Freimann     return ret;
8309711cd0dSJens Freimann }
8319711cd0dSJens Freimann 
8329711cd0dSJens Freimann static DeviceState *virtio_net_find_primary(VirtIONet *n, Error **errp)
8339711cd0dSJens Freimann {
8349711cd0dSJens Freimann     DeviceState *dev = NULL;
8359711cd0dSJens Freimann     Error *err = NULL;
8369711cd0dSJens Freimann 
8379711cd0dSJens Freimann     if (qemu_opts_foreach(qemu_find_opts("device"),
8389711cd0dSJens Freimann                          is_my_primary, n, &err)) {
8399711cd0dSJens Freimann         if (err) {
8409711cd0dSJens Freimann             error_propagate(errp, err);
8419711cd0dSJens Freimann             return NULL;
8429711cd0dSJens Freimann         }
8439711cd0dSJens Freimann         if (n->primary_device_id) {
8449711cd0dSJens Freimann             dev = qdev_find_recursive(sysbus_get_default(),
8459711cd0dSJens Freimann                     n->primary_device_id);
8469711cd0dSJens Freimann         } else {
8479711cd0dSJens Freimann             error_setg(errp, "Primary device id not found");
8489711cd0dSJens Freimann             return NULL;
8499711cd0dSJens Freimann         }
8509711cd0dSJens Freimann     }
8519711cd0dSJens Freimann     return dev;
8529711cd0dSJens Freimann }
8539711cd0dSJens Freimann 
8549711cd0dSJens Freimann 
8559711cd0dSJens Freimann 
8569711cd0dSJens Freimann static DeviceState *virtio_connect_failover_devices(VirtIONet *n,
8579711cd0dSJens Freimann                                                     DeviceState *dev,
8589711cd0dSJens Freimann                                                     Error **errp)
8599711cd0dSJens Freimann {
8609711cd0dSJens Freimann     DeviceState *prim_dev = NULL;
8619711cd0dSJens Freimann     Error *err = NULL;
8629711cd0dSJens Freimann 
8639711cd0dSJens Freimann     prim_dev = virtio_net_find_primary(n, &err);
8649711cd0dSJens Freimann     if (prim_dev) {
8659711cd0dSJens Freimann         n->primary_device_id = g_strdup(prim_dev->id);
8669711cd0dSJens Freimann         n->primary_device_opts = prim_dev->opts;
8679711cd0dSJens Freimann     } else {
8689711cd0dSJens Freimann         if (err) {
8699711cd0dSJens Freimann             error_propagate(errp, err);
8709711cd0dSJens Freimann         }
8719711cd0dSJens Freimann     }
8729711cd0dSJens Freimann 
8739711cd0dSJens Freimann     return prim_dev;
8749711cd0dSJens Freimann }
8759711cd0dSJens Freimann 
876d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features)
8776e790746SPaolo Bonzini {
87817a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
8799711cd0dSJens Freimann     Error *err = NULL;
8806e790746SPaolo Bonzini     int i;
8816e790746SPaolo Bonzini 
88275ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
88375ebec11SMaxime Coquelin             !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) {
88475ebec11SMaxime Coquelin         features &= ~(1ULL << VIRTIO_NET_F_MTU);
88575ebec11SMaxime Coquelin     }
88675ebec11SMaxime Coquelin 
887ef546f12SCornelia Huck     virtio_net_set_multiqueue(n,
88859079029SYuri Benditovich                               virtio_has_feature(features, VIRTIO_NET_F_RSS) ||
88995129d6fSCornelia Huck                               virtio_has_feature(features, VIRTIO_NET_F_MQ));
8906e790746SPaolo Bonzini 
891ef546f12SCornelia Huck     virtio_net_set_mrg_rx_bufs(n,
89295129d6fSCornelia Huck                                virtio_has_feature(features,
893bb9d17f8SCornelia Huck                                                   VIRTIO_NET_F_MRG_RXBUF),
89495129d6fSCornelia Huck                                virtio_has_feature(features,
895e22f0603SYuri Benditovich                                                   VIRTIO_F_VERSION_1),
896e22f0603SYuri Benditovich                                virtio_has_feature(features,
897e22f0603SYuri Benditovich                                                   VIRTIO_NET_F_HASH_REPORT));
8986e790746SPaolo Bonzini 
8992974e916SYuri Benditovich     n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9002974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4);
9012974e916SYuri Benditovich     n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9022974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6);
903e22f0603SYuri Benditovich     n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS);
9042974e916SYuri Benditovich 
9056e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
906644c9858SDmitry Fleytman         n->curr_guest_offloads =
907644c9858SDmitry Fleytman             virtio_net_guest_offloads_by_features(features);
908644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
9096e790746SPaolo Bonzini     }
9106e790746SPaolo Bonzini 
9116e790746SPaolo Bonzini     for (i = 0;  i < n->max_queues; i++) {
9126e790746SPaolo Bonzini         NetClientState *nc = qemu_get_subqueue(n->nic, i);
9136e790746SPaolo Bonzini 
914ed8b4afeSNikolay Nikolaev         if (!get_vhost_net(nc->peer)) {
9156e790746SPaolo Bonzini             continue;
9166e790746SPaolo Bonzini         }
917ed8b4afeSNikolay Nikolaev         vhost_net_ack_features(get_vhost_net(nc->peer), features);
9186e790746SPaolo Bonzini     }
9190b1eaa88SStefan Fritsch 
92095129d6fSCornelia Huck     if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) {
9210b1eaa88SStefan Fritsch         memset(n->vlans, 0, MAX_VLAN >> 3);
9220b1eaa88SStefan Fritsch     } else {
9230b1eaa88SStefan Fritsch         memset(n->vlans, 0xff, MAX_VLAN >> 3);
9240b1eaa88SStefan Fritsch     }
9259711cd0dSJens Freimann 
9269711cd0dSJens Freimann     if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) {
9279711cd0dSJens Freimann         qapi_event_send_failover_negotiated(n->netclient_name);
9289711cd0dSJens Freimann         atomic_set(&n->primary_should_be_hidden, false);
9299711cd0dSJens Freimann         failover_add_primary(n, &err);
9309711cd0dSJens Freimann         if (err) {
9319711cd0dSJens Freimann             n->primary_dev = virtio_connect_failover_devices(n, n->qdev, &err);
9329711cd0dSJens Freimann             if (err) {
9339711cd0dSJens Freimann                 goto out_err;
9349711cd0dSJens Freimann             }
9359711cd0dSJens Freimann             failover_add_primary(n, &err);
9369711cd0dSJens Freimann             if (err) {
9379711cd0dSJens Freimann                 goto out_err;
9389711cd0dSJens Freimann             }
9399711cd0dSJens Freimann         }
9409711cd0dSJens Freimann     }
9419711cd0dSJens Freimann     return;
9429711cd0dSJens Freimann 
9439711cd0dSJens Freimann out_err:
9449711cd0dSJens Freimann     if (err) {
9459711cd0dSJens Freimann         warn_report_err(err);
9469711cd0dSJens Freimann     }
9476e790746SPaolo Bonzini }
9486e790746SPaolo Bonzini 
9496e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
9506e790746SPaolo Bonzini                                      struct iovec *iov, unsigned int iov_cnt)
9516e790746SPaolo Bonzini {
9526e790746SPaolo Bonzini     uint8_t on;
9536e790746SPaolo Bonzini     size_t s;
954b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
9556e790746SPaolo Bonzini 
9566e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
9576e790746SPaolo Bonzini     if (s != sizeof(on)) {
9586e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9596e790746SPaolo Bonzini     }
9606e790746SPaolo Bonzini 
9616e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
9626e790746SPaolo Bonzini         n->promisc = on;
9636e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
9646e790746SPaolo Bonzini         n->allmulti = on;
9656e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
9666e790746SPaolo Bonzini         n->alluni = on;
9676e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
9686e790746SPaolo Bonzini         n->nomulti = on;
9696e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
9706e790746SPaolo Bonzini         n->nouni = on;
9716e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
9726e790746SPaolo Bonzini         n->nobcast = on;
9736e790746SPaolo Bonzini     } else {
9746e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9756e790746SPaolo Bonzini     }
9766e790746SPaolo Bonzini 
977b1be4280SAmos Kong     rxfilter_notify(nc);
978b1be4280SAmos Kong 
9796e790746SPaolo Bonzini     return VIRTIO_NET_OK;
9806e790746SPaolo Bonzini }
9816e790746SPaolo Bonzini 
982644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
983644c9858SDmitry Fleytman                                      struct iovec *iov, unsigned int iov_cnt)
984644c9858SDmitry Fleytman {
985644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
986644c9858SDmitry Fleytman     uint64_t offloads;
987644c9858SDmitry Fleytman     size_t s;
988644c9858SDmitry Fleytman 
98995129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
990644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
991644c9858SDmitry Fleytman     }
992644c9858SDmitry Fleytman 
993644c9858SDmitry Fleytman     s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
994644c9858SDmitry Fleytman     if (s != sizeof(offloads)) {
995644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
996644c9858SDmitry Fleytman     }
997644c9858SDmitry Fleytman 
998644c9858SDmitry Fleytman     if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
999644c9858SDmitry Fleytman         uint64_t supported_offloads;
1000644c9858SDmitry Fleytman 
1001189ae6bbSJason Wang         offloads = virtio_ldq_p(vdev, &offloads);
1002189ae6bbSJason Wang 
1003644c9858SDmitry Fleytman         if (!n->has_vnet_hdr) {
1004644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1005644c9858SDmitry Fleytman         }
1006644c9858SDmitry Fleytman 
10072974e916SYuri Benditovich         n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10082974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4);
10092974e916SYuri Benditovich         n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10102974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6);
10112974e916SYuri Benditovich         virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT);
10122974e916SYuri Benditovich 
1013644c9858SDmitry Fleytman         supported_offloads = virtio_net_supported_guest_offloads(n);
1014644c9858SDmitry Fleytman         if (offloads & ~supported_offloads) {
1015644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1016644c9858SDmitry Fleytman         }
1017644c9858SDmitry Fleytman 
1018644c9858SDmitry Fleytman         n->curr_guest_offloads = offloads;
1019644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
1020644c9858SDmitry Fleytman 
1021644c9858SDmitry Fleytman         return VIRTIO_NET_OK;
1022644c9858SDmitry Fleytman     } else {
1023644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1024644c9858SDmitry Fleytman     }
1025644c9858SDmitry Fleytman }
1026644c9858SDmitry Fleytman 
10276e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
10286e790746SPaolo Bonzini                                  struct iovec *iov, unsigned int iov_cnt)
10296e790746SPaolo Bonzini {
10301399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
10316e790746SPaolo Bonzini     struct virtio_net_ctrl_mac mac_data;
10326e790746SPaolo Bonzini     size_t s;
1033b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
10346e790746SPaolo Bonzini 
10356e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
10366e790746SPaolo Bonzini         if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
10376e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
10386e790746SPaolo Bonzini         }
10396e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
10406e790746SPaolo Bonzini         assert(s == sizeof(n->mac));
10416e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1042b1be4280SAmos Kong         rxfilter_notify(nc);
1043b1be4280SAmos Kong 
10446e790746SPaolo Bonzini         return VIRTIO_NET_OK;
10456e790746SPaolo Bonzini     }
10466e790746SPaolo Bonzini 
10476e790746SPaolo Bonzini     if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
10486e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
10496e790746SPaolo Bonzini     }
10506e790746SPaolo Bonzini 
1051cae2e556SAmos Kong     int in_use = 0;
1052cae2e556SAmos Kong     int first_multi = 0;
1053cae2e556SAmos Kong     uint8_t uni_overflow = 0;
1054cae2e556SAmos Kong     uint8_t multi_overflow = 0;
1055cae2e556SAmos Kong     uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
10566e790746SPaolo Bonzini 
10576e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10586e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10591399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10606e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1061b1be4280SAmos Kong         goto error;
10626e790746SPaolo Bonzini     }
10636e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10646e790746SPaolo Bonzini 
10656e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
1066b1be4280SAmos Kong         goto error;
10676e790746SPaolo Bonzini     }
10686e790746SPaolo Bonzini 
10696e790746SPaolo Bonzini     if (mac_data.entries <= MAC_TABLE_ENTRIES) {
1070cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, macs,
10716e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
10726e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1073b1be4280SAmos Kong             goto error;
10746e790746SPaolo Bonzini         }
1075cae2e556SAmos Kong         in_use += mac_data.entries;
10766e790746SPaolo Bonzini     } else {
1077cae2e556SAmos Kong         uni_overflow = 1;
10786e790746SPaolo Bonzini     }
10796e790746SPaolo Bonzini 
10806e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
10816e790746SPaolo Bonzini 
1082cae2e556SAmos Kong     first_multi = in_use;
10836e790746SPaolo Bonzini 
10846e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10856e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10861399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10876e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1088b1be4280SAmos Kong         goto error;
10896e790746SPaolo Bonzini     }
10906e790746SPaolo Bonzini 
10916e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10926e790746SPaolo Bonzini 
10936e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
1094b1be4280SAmos Kong         goto error;
10956e790746SPaolo Bonzini     }
10966e790746SPaolo Bonzini 
1097edc24385SMichael S. Tsirkin     if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
1098cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
10996e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
11006e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1101b1be4280SAmos Kong             goto error;
11026e790746SPaolo Bonzini         }
1103cae2e556SAmos Kong         in_use += mac_data.entries;
11046e790746SPaolo Bonzini     } else {
1105cae2e556SAmos Kong         multi_overflow = 1;
11066e790746SPaolo Bonzini     }
11076e790746SPaolo Bonzini 
1108cae2e556SAmos Kong     n->mac_table.in_use = in_use;
1109cae2e556SAmos Kong     n->mac_table.first_multi = first_multi;
1110cae2e556SAmos Kong     n->mac_table.uni_overflow = uni_overflow;
1111cae2e556SAmos Kong     n->mac_table.multi_overflow = multi_overflow;
1112cae2e556SAmos Kong     memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
1113cae2e556SAmos Kong     g_free(macs);
1114b1be4280SAmos Kong     rxfilter_notify(nc);
1115b1be4280SAmos Kong 
11166e790746SPaolo Bonzini     return VIRTIO_NET_OK;
1117b1be4280SAmos Kong 
1118b1be4280SAmos Kong error:
1119cae2e556SAmos Kong     g_free(macs);
1120b1be4280SAmos Kong     return VIRTIO_NET_ERR;
11216e790746SPaolo Bonzini }
11226e790746SPaolo Bonzini 
11236e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
11246e790746SPaolo Bonzini                                         struct iovec *iov, unsigned int iov_cnt)
11256e790746SPaolo Bonzini {
11261399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
11276e790746SPaolo Bonzini     uint16_t vid;
11286e790746SPaolo Bonzini     size_t s;
1129b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
11306e790746SPaolo Bonzini 
11316e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
11321399c60dSRusty Russell     vid = virtio_lduw_p(vdev, &vid);
11336e790746SPaolo Bonzini     if (s != sizeof(vid)) {
11346e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11356e790746SPaolo Bonzini     }
11366e790746SPaolo Bonzini 
11376e790746SPaolo Bonzini     if (vid >= MAX_VLAN)
11386e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11396e790746SPaolo Bonzini 
11406e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
11416e790746SPaolo Bonzini         n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
11426e790746SPaolo Bonzini     else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
11436e790746SPaolo Bonzini         n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
11446e790746SPaolo Bonzini     else
11456e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11466e790746SPaolo Bonzini 
1147b1be4280SAmos Kong     rxfilter_notify(nc);
1148b1be4280SAmos Kong 
11496e790746SPaolo Bonzini     return VIRTIO_NET_OK;
11506e790746SPaolo Bonzini }
11516e790746SPaolo Bonzini 
1152f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd,
1153f57fcf70SJason Wang                                       struct iovec *iov, unsigned int iov_cnt)
1154f57fcf70SJason Wang {
11559d8c6a25SDr. David Alan Gilbert     trace_virtio_net_handle_announce(n->announce_timer.round);
1156f57fcf70SJason Wang     if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK &&
1157f57fcf70SJason Wang         n->status & VIRTIO_NET_S_ANNOUNCE) {
1158f57fcf70SJason Wang         n->status &= ~VIRTIO_NET_S_ANNOUNCE;
11599d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
11609d8c6a25SDr. David Alan Gilbert             qemu_announce_timer_step(&n->announce_timer);
1161f57fcf70SJason Wang         }
1162f57fcf70SJason Wang         return VIRTIO_NET_OK;
1163f57fcf70SJason Wang     } else {
1164f57fcf70SJason Wang         return VIRTIO_NET_ERR;
1165f57fcf70SJason Wang     }
1166f57fcf70SJason Wang }
1167f57fcf70SJason Wang 
116859079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n)
116959079029SYuri Benditovich {
117059079029SYuri Benditovich     if (n->rss_data.enabled) {
117159079029SYuri Benditovich         trace_virtio_net_rss_disable();
117259079029SYuri Benditovich     }
117359079029SYuri Benditovich     n->rss_data.enabled = false;
117459079029SYuri Benditovich }
117559079029SYuri Benditovich 
117659079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n,
1177e22f0603SYuri Benditovich                                       struct iovec *iov,
1178e22f0603SYuri Benditovich                                       unsigned int iov_cnt,
1179e22f0603SYuri Benditovich                                       bool do_rss)
118059079029SYuri Benditovich {
118159079029SYuri Benditovich     VirtIODevice *vdev = VIRTIO_DEVICE(n);
118259079029SYuri Benditovich     struct virtio_net_rss_config cfg;
118359079029SYuri Benditovich     size_t s, offset = 0, size_get;
118459079029SYuri Benditovich     uint16_t queues, i;
118559079029SYuri Benditovich     struct {
118659079029SYuri Benditovich         uint16_t us;
118759079029SYuri Benditovich         uint8_t b;
118859079029SYuri Benditovich     } QEMU_PACKED temp;
118959079029SYuri Benditovich     const char *err_msg = "";
119059079029SYuri Benditovich     uint32_t err_value = 0;
119159079029SYuri Benditovich 
1192e22f0603SYuri Benditovich     if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) {
119359079029SYuri Benditovich         err_msg = "RSS is not negotiated";
119459079029SYuri Benditovich         goto error;
119559079029SYuri Benditovich     }
1196e22f0603SYuri Benditovich     if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) {
1197e22f0603SYuri Benditovich         err_msg = "Hash report is not negotiated";
1198e22f0603SYuri Benditovich         goto error;
1199e22f0603SYuri Benditovich     }
120059079029SYuri Benditovich     size_get = offsetof(struct virtio_net_rss_config, indirection_table);
120159079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get);
120259079029SYuri Benditovich     if (s != size_get) {
120359079029SYuri Benditovich         err_msg = "Short command buffer";
120459079029SYuri Benditovich         err_value = (uint32_t)s;
120559079029SYuri Benditovich         goto error;
120659079029SYuri Benditovich     }
120759079029SYuri Benditovich     n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types);
120859079029SYuri Benditovich     n->rss_data.indirections_len =
120959079029SYuri Benditovich         virtio_lduw_p(vdev, &cfg.indirection_table_mask);
121059079029SYuri Benditovich     n->rss_data.indirections_len++;
1211e22f0603SYuri Benditovich     if (!do_rss) {
1212e22f0603SYuri Benditovich         n->rss_data.indirections_len = 1;
1213e22f0603SYuri Benditovich     }
121459079029SYuri Benditovich     if (!is_power_of_2(n->rss_data.indirections_len)) {
121559079029SYuri Benditovich         err_msg = "Invalid size of indirection table";
121659079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
121759079029SYuri Benditovich         goto error;
121859079029SYuri Benditovich     }
121959079029SYuri Benditovich     if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) {
122059079029SYuri Benditovich         err_msg = "Too large indirection table";
122159079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
122259079029SYuri Benditovich         goto error;
122359079029SYuri Benditovich     }
1224e22f0603SYuri Benditovich     n->rss_data.default_queue = do_rss ?
1225e22f0603SYuri Benditovich         virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0;
122659079029SYuri Benditovich     if (n->rss_data.default_queue >= n->max_queues) {
122759079029SYuri Benditovich         err_msg = "Invalid default queue";
122859079029SYuri Benditovich         err_value = n->rss_data.default_queue;
122959079029SYuri Benditovich         goto error;
123059079029SYuri Benditovich     }
123159079029SYuri Benditovich     offset += size_get;
123259079029SYuri Benditovich     size_get = sizeof(uint16_t) * n->rss_data.indirections_len;
123359079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
123459079029SYuri Benditovich     n->rss_data.indirections_table = g_malloc(size_get);
123559079029SYuri Benditovich     if (!n->rss_data.indirections_table) {
123659079029SYuri Benditovich         err_msg = "Can't allocate indirections table";
123759079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
123859079029SYuri Benditovich         goto error;
123959079029SYuri Benditovich     }
124059079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset,
124159079029SYuri Benditovich                    n->rss_data.indirections_table, size_get);
124259079029SYuri Benditovich     if (s != size_get) {
124359079029SYuri Benditovich         err_msg = "Short indirection table buffer";
124459079029SYuri Benditovich         err_value = (uint32_t)s;
124559079029SYuri Benditovich         goto error;
124659079029SYuri Benditovich     }
124759079029SYuri Benditovich     for (i = 0; i < n->rss_data.indirections_len; ++i) {
124859079029SYuri Benditovich         uint16_t val = n->rss_data.indirections_table[i];
124959079029SYuri Benditovich         n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val);
125059079029SYuri Benditovich     }
125159079029SYuri Benditovich     offset += size_get;
125259079029SYuri Benditovich     size_get = sizeof(temp);
125359079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get);
125459079029SYuri Benditovich     if (s != size_get) {
125559079029SYuri Benditovich         err_msg = "Can't get queues";
125659079029SYuri Benditovich         err_value = (uint32_t)s;
125759079029SYuri Benditovich         goto error;
125859079029SYuri Benditovich     }
1259e22f0603SYuri Benditovich     queues = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queues;
126059079029SYuri Benditovich     if (queues == 0 || queues > n->max_queues) {
126159079029SYuri Benditovich         err_msg = "Invalid number of queues";
126259079029SYuri Benditovich         err_value = queues;
126359079029SYuri Benditovich         goto error;
126459079029SYuri Benditovich     }
126559079029SYuri Benditovich     if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) {
126659079029SYuri Benditovich         err_msg = "Invalid key size";
126759079029SYuri Benditovich         err_value = temp.b;
126859079029SYuri Benditovich         goto error;
126959079029SYuri Benditovich     }
127059079029SYuri Benditovich     if (!temp.b && n->rss_data.hash_types) {
127159079029SYuri Benditovich         err_msg = "No key provided";
127259079029SYuri Benditovich         err_value = 0;
127359079029SYuri Benditovich         goto error;
127459079029SYuri Benditovich     }
127559079029SYuri Benditovich     if (!temp.b && !n->rss_data.hash_types) {
127659079029SYuri Benditovich         virtio_net_disable_rss(n);
127759079029SYuri Benditovich         return queues;
127859079029SYuri Benditovich     }
127959079029SYuri Benditovich     offset += size_get;
128059079029SYuri Benditovich     size_get = temp.b;
128159079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get);
128259079029SYuri Benditovich     if (s != size_get) {
128359079029SYuri Benditovich         err_msg = "Can get key buffer";
128459079029SYuri Benditovich         err_value = (uint32_t)s;
128559079029SYuri Benditovich         goto error;
128659079029SYuri Benditovich     }
128759079029SYuri Benditovich     n->rss_data.enabled = true;
128859079029SYuri Benditovich     trace_virtio_net_rss_enable(n->rss_data.hash_types,
128959079029SYuri Benditovich                                 n->rss_data.indirections_len,
129059079029SYuri Benditovich                                 temp.b);
129159079029SYuri Benditovich     return queues;
129259079029SYuri Benditovich error:
129359079029SYuri Benditovich     trace_virtio_net_rss_error(err_msg, err_value);
129459079029SYuri Benditovich     virtio_net_disable_rss(n);
129559079029SYuri Benditovich     return 0;
129659079029SYuri Benditovich }
129759079029SYuri Benditovich 
12986e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
12996e790746SPaolo Bonzini                                 struct iovec *iov, unsigned int iov_cnt)
13006e790746SPaolo Bonzini {
130117a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
13026e790746SPaolo Bonzini     uint16_t queues;
13036e790746SPaolo Bonzini 
130459079029SYuri Benditovich     virtio_net_disable_rss(n);
1305e22f0603SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) {
1306e22f0603SYuri Benditovich         queues = virtio_net_handle_rss(n, iov, iov_cnt, false);
1307e22f0603SYuri Benditovich         return queues ? VIRTIO_NET_OK : VIRTIO_NET_ERR;
1308e22f0603SYuri Benditovich     }
130959079029SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) {
1310e22f0603SYuri Benditovich         queues = virtio_net_handle_rss(n, iov, iov_cnt, true);
131159079029SYuri Benditovich     } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
131259079029SYuri Benditovich         struct virtio_net_ctrl_mq mq;
131359079029SYuri Benditovich         size_t s;
131459079029SYuri Benditovich         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) {
131559079029SYuri Benditovich             return VIRTIO_NET_ERR;
131659079029SYuri Benditovich         }
13176e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
13186e790746SPaolo Bonzini         if (s != sizeof(mq)) {
13196e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
13206e790746SPaolo Bonzini         }
132159079029SYuri Benditovich         queues = virtio_lduw_p(vdev, &mq.virtqueue_pairs);
13226e790746SPaolo Bonzini 
132359079029SYuri Benditovich     } else {
13246e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
13256e790746SPaolo Bonzini     }
13266e790746SPaolo Bonzini 
13276e790746SPaolo Bonzini     if (queues < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
13286e790746SPaolo Bonzini         queues > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
13296e790746SPaolo Bonzini         queues > n->max_queues ||
13306e790746SPaolo Bonzini         !n->multiqueue) {
13316e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
13326e790746SPaolo Bonzini     }
13336e790746SPaolo Bonzini 
13346e790746SPaolo Bonzini     n->curr_queues = queues;
13356e790746SPaolo Bonzini     /* stop the backend before changing the number of queues to avoid handling a
13366e790746SPaolo Bonzini      * disabled queue */
133717a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
13386e790746SPaolo Bonzini     virtio_net_set_queues(n);
13396e790746SPaolo Bonzini 
13406e790746SPaolo Bonzini     return VIRTIO_NET_OK;
13416e790746SPaolo Bonzini }
1342ba7eadb5SGreg Kurz 
13436e790746SPaolo Bonzini static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
13446e790746SPaolo Bonzini {
134517a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
13466e790746SPaolo Bonzini     struct virtio_net_ctrl_hdr ctrl;
13476e790746SPaolo Bonzini     virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
134851b19ebeSPaolo Bonzini     VirtQueueElement *elem;
13496e790746SPaolo Bonzini     size_t s;
1350771b6ed3SJason Wang     struct iovec *iov, *iov2;
13516e790746SPaolo Bonzini     unsigned int iov_cnt;
13526e790746SPaolo Bonzini 
135351b19ebeSPaolo Bonzini     for (;;) {
135451b19ebeSPaolo Bonzini         elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
135551b19ebeSPaolo Bonzini         if (!elem) {
135651b19ebeSPaolo Bonzini             break;
135751b19ebeSPaolo Bonzini         }
135851b19ebeSPaolo Bonzini         if (iov_size(elem->in_sg, elem->in_num) < sizeof(status) ||
135951b19ebeSPaolo Bonzini             iov_size(elem->out_sg, elem->out_num) < sizeof(ctrl)) {
1360ba7eadb5SGreg Kurz             virtio_error(vdev, "virtio-net ctrl missing headers");
1361ba7eadb5SGreg Kurz             virtqueue_detach_element(vq, elem, 0);
1362ba7eadb5SGreg Kurz             g_free(elem);
1363ba7eadb5SGreg Kurz             break;
13646e790746SPaolo Bonzini         }
13656e790746SPaolo Bonzini 
136651b19ebeSPaolo Bonzini         iov_cnt = elem->out_num;
136751b19ebeSPaolo Bonzini         iov2 = iov = g_memdup(elem->out_sg, sizeof(struct iovec) * elem->out_num);
13686e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl));
13696e790746SPaolo Bonzini         iov_discard_front(&iov, &iov_cnt, sizeof(ctrl));
13706e790746SPaolo Bonzini         if (s != sizeof(ctrl)) {
13716e790746SPaolo Bonzini             status = VIRTIO_NET_ERR;
13726e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
13736e790746SPaolo Bonzini             status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt);
13746e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
13756e790746SPaolo Bonzini             status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt);
13766e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
13776e790746SPaolo Bonzini             status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt);
1378f57fcf70SJason Wang         } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) {
1379f57fcf70SJason Wang             status = virtio_net_handle_announce(n, ctrl.cmd, iov, iov_cnt);
13806e790746SPaolo Bonzini         } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
13816e790746SPaolo Bonzini             status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt);
1382644c9858SDmitry Fleytman         } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
1383644c9858SDmitry Fleytman             status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt);
13846e790746SPaolo Bonzini         }
13856e790746SPaolo Bonzini 
138651b19ebeSPaolo Bonzini         s = iov_from_buf(elem->in_sg, elem->in_num, 0, &status, sizeof(status));
13876e790746SPaolo Bonzini         assert(s == sizeof(status));
13886e790746SPaolo Bonzini 
138951b19ebeSPaolo Bonzini         virtqueue_push(vq, elem, sizeof(status));
13906e790746SPaolo Bonzini         virtio_notify(vdev, vq);
1391771b6ed3SJason Wang         g_free(iov2);
139251b19ebeSPaolo Bonzini         g_free(elem);
13936e790746SPaolo Bonzini     }
13946e790746SPaolo Bonzini }
13956e790746SPaolo Bonzini 
13966e790746SPaolo Bonzini /* RX */
13976e790746SPaolo Bonzini 
13986e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
13996e790746SPaolo Bonzini {
140017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
14016e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(vq));
14026e790746SPaolo Bonzini 
14036e790746SPaolo Bonzini     qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
14046e790746SPaolo Bonzini }
14056e790746SPaolo Bonzini 
1406b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc)
14076e790746SPaolo Bonzini {
14086e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
140917a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
14106e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
14116e790746SPaolo Bonzini 
141217a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
1413b8c4b67eSPhilippe Mathieu-Daudé         return false;
14146e790746SPaolo Bonzini     }
14156e790746SPaolo Bonzini 
14166e790746SPaolo Bonzini     if (nc->queue_index >= n->curr_queues) {
1417b8c4b67eSPhilippe Mathieu-Daudé         return false;
14186e790746SPaolo Bonzini     }
14196e790746SPaolo Bonzini 
14206e790746SPaolo Bonzini     if (!virtio_queue_ready(q->rx_vq) ||
142117a0ca55SKONRAD Frederic         !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
1422b8c4b67eSPhilippe Mathieu-Daudé         return false;
14236e790746SPaolo Bonzini     }
14246e790746SPaolo Bonzini 
1425b8c4b67eSPhilippe Mathieu-Daudé     return true;
14266e790746SPaolo Bonzini }
14276e790746SPaolo Bonzini 
14286e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
14296e790746SPaolo Bonzini {
14306e790746SPaolo Bonzini     VirtIONet *n = q->n;
14316e790746SPaolo Bonzini     if (virtio_queue_empty(q->rx_vq) ||
14326e790746SPaolo Bonzini         (n->mergeable_rx_bufs &&
14336e790746SPaolo Bonzini          !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
14346e790746SPaolo Bonzini         virtio_queue_set_notification(q->rx_vq, 1);
14356e790746SPaolo Bonzini 
14366e790746SPaolo Bonzini         /* To avoid a race condition where the guest has made some buffers
14376e790746SPaolo Bonzini          * available after the above check but before notification was
14386e790746SPaolo Bonzini          * enabled, check for available buffers again.
14396e790746SPaolo Bonzini          */
14406e790746SPaolo Bonzini         if (virtio_queue_empty(q->rx_vq) ||
14416e790746SPaolo Bonzini             (n->mergeable_rx_bufs &&
14426e790746SPaolo Bonzini              !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
14436e790746SPaolo Bonzini             return 0;
14446e790746SPaolo Bonzini         }
14456e790746SPaolo Bonzini     }
14466e790746SPaolo Bonzini 
14476e790746SPaolo Bonzini     virtio_queue_set_notification(q->rx_vq, 0);
14486e790746SPaolo Bonzini     return 1;
14496e790746SPaolo Bonzini }
14506e790746SPaolo Bonzini 
14511399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr)
1452032a74a1SCédric Le Goater {
14531399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->hdr_len);
14541399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->gso_size);
14551399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_start);
14561399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_offset);
1457032a74a1SCédric Le Goater }
1458032a74a1SCédric Le Goater 
14596e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
14606e790746SPaolo Bonzini  * it never finds out that the packets don't have valid checksums.  This
14616e790746SPaolo Bonzini  * causes dhclient to get upset.  Fedora's carried a patch for ages to
14626e790746SPaolo Bonzini  * fix this with Xen but it hasn't appeared in an upstream release of
14636e790746SPaolo Bonzini  * dhclient yet.
14646e790746SPaolo Bonzini  *
14656e790746SPaolo Bonzini  * To avoid breaking existing guests, we catch udp packets and add
14666e790746SPaolo Bonzini  * checksums.  This is terrible but it's better than hacking the guest
14676e790746SPaolo Bonzini  * kernels.
14686e790746SPaolo Bonzini  *
14696e790746SPaolo Bonzini  * N.B. if we introduce a zero-copy API, this operation is no longer free so
14706e790746SPaolo Bonzini  * we should provide a mechanism to disable it to avoid polluting the host
14716e790746SPaolo Bonzini  * cache.
14726e790746SPaolo Bonzini  */
14736e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
14746e790746SPaolo Bonzini                                         uint8_t *buf, size_t size)
14756e790746SPaolo Bonzini {
14766e790746SPaolo Bonzini     if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
14776e790746SPaolo Bonzini         (size > 27 && size < 1500) && /* normal sized MTU */
14786e790746SPaolo Bonzini         (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
14796e790746SPaolo Bonzini         (buf[23] == 17) && /* ip.protocol == UDP */
14806e790746SPaolo Bonzini         (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
14816e790746SPaolo Bonzini         net_checksum_calculate(buf, size);
14826e790746SPaolo Bonzini         hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
14836e790746SPaolo Bonzini     }
14846e790746SPaolo Bonzini }
14856e790746SPaolo Bonzini 
14866e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
14876e790746SPaolo Bonzini                            const void *buf, size_t size)
14886e790746SPaolo Bonzini {
14896e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
14906e790746SPaolo Bonzini         /* FIXME this cast is evil */
14916e790746SPaolo Bonzini         void *wbuf = (void *)buf;
14926e790746SPaolo Bonzini         work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
14936e790746SPaolo Bonzini                                     size - n->host_hdr_len);
14941bfa316cSGreg Kurz 
14951bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
14961399c60dSRusty Russell             virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf);
14971bfa316cSGreg Kurz         }
14986e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
14996e790746SPaolo Bonzini     } else {
15006e790746SPaolo Bonzini         struct virtio_net_hdr hdr = {
15016e790746SPaolo Bonzini             .flags = 0,
15026e790746SPaolo Bonzini             .gso_type = VIRTIO_NET_HDR_GSO_NONE
15036e790746SPaolo Bonzini         };
15046e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
15056e790746SPaolo Bonzini     }
15066e790746SPaolo Bonzini }
15076e790746SPaolo Bonzini 
15086e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
15096e790746SPaolo Bonzini {
15106e790746SPaolo Bonzini     static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
15116e790746SPaolo Bonzini     static const uint8_t vlan[] = {0x81, 0x00};
15126e790746SPaolo Bonzini     uint8_t *ptr = (uint8_t *)buf;
15136e790746SPaolo Bonzini     int i;
15146e790746SPaolo Bonzini 
15156e790746SPaolo Bonzini     if (n->promisc)
15166e790746SPaolo Bonzini         return 1;
15176e790746SPaolo Bonzini 
15186e790746SPaolo Bonzini     ptr += n->host_hdr_len;
15196e790746SPaolo Bonzini 
15206e790746SPaolo Bonzini     if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
15217542d3e7SPeter Maydell         int vid = lduw_be_p(ptr + 14) & 0xfff;
15226e790746SPaolo Bonzini         if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
15236e790746SPaolo Bonzini             return 0;
15246e790746SPaolo Bonzini     }
15256e790746SPaolo Bonzini 
15266e790746SPaolo Bonzini     if (ptr[0] & 1) { // multicast
15276e790746SPaolo Bonzini         if (!memcmp(ptr, bcast, sizeof(bcast))) {
15286e790746SPaolo Bonzini             return !n->nobcast;
15296e790746SPaolo Bonzini         } else if (n->nomulti) {
15306e790746SPaolo Bonzini             return 0;
15316e790746SPaolo Bonzini         } else if (n->allmulti || n->mac_table.multi_overflow) {
15326e790746SPaolo Bonzini             return 1;
15336e790746SPaolo Bonzini         }
15346e790746SPaolo Bonzini 
15356e790746SPaolo Bonzini         for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
15366e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
15376e790746SPaolo Bonzini                 return 1;
15386e790746SPaolo Bonzini             }
15396e790746SPaolo Bonzini         }
15406e790746SPaolo Bonzini     } else { // unicast
15416e790746SPaolo Bonzini         if (n->nouni) {
15426e790746SPaolo Bonzini             return 0;
15436e790746SPaolo Bonzini         } else if (n->alluni || n->mac_table.uni_overflow) {
15446e790746SPaolo Bonzini             return 1;
15456e790746SPaolo Bonzini         } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
15466e790746SPaolo Bonzini             return 1;
15476e790746SPaolo Bonzini         }
15486e790746SPaolo Bonzini 
15496e790746SPaolo Bonzini         for (i = 0; i < n->mac_table.first_multi; i++) {
15506e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
15516e790746SPaolo Bonzini                 return 1;
15526e790746SPaolo Bonzini             }
15536e790746SPaolo Bonzini         }
15546e790746SPaolo Bonzini     }
15556e790746SPaolo Bonzini 
15566e790746SPaolo Bonzini     return 0;
15576e790746SPaolo Bonzini }
15586e790746SPaolo Bonzini 
15594474e37aSYuri Benditovich static uint8_t virtio_net_get_hash_type(bool isip4,
15604474e37aSYuri Benditovich                                         bool isip6,
15614474e37aSYuri Benditovich                                         bool isudp,
15624474e37aSYuri Benditovich                                         bool istcp,
15634474e37aSYuri Benditovich                                         uint32_t types)
15644474e37aSYuri Benditovich {
15654474e37aSYuri Benditovich     if (isip4) {
15664474e37aSYuri Benditovich         if (istcp && (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4)) {
15674474e37aSYuri Benditovich             return NetPktRssIpV4Tcp;
15684474e37aSYuri Benditovich         }
15694474e37aSYuri Benditovich         if (isudp && (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4)) {
15704474e37aSYuri Benditovich             return NetPktRssIpV4Udp;
15714474e37aSYuri Benditovich         }
15724474e37aSYuri Benditovich         if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) {
15734474e37aSYuri Benditovich             return NetPktRssIpV4;
15744474e37aSYuri Benditovich         }
15754474e37aSYuri Benditovich     } else if (isip6) {
15764474e37aSYuri Benditovich         uint32_t mask = VIRTIO_NET_RSS_HASH_TYPE_TCP_EX |
15774474e37aSYuri Benditovich                         VIRTIO_NET_RSS_HASH_TYPE_TCPv6;
15784474e37aSYuri Benditovich 
15794474e37aSYuri Benditovich         if (istcp && (types & mask)) {
15804474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) ?
15814474e37aSYuri Benditovich                 NetPktRssIpV6TcpEx : NetPktRssIpV6Tcp;
15824474e37aSYuri Benditovich         }
15834474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_UDP_EX | VIRTIO_NET_RSS_HASH_TYPE_UDPv6;
15844474e37aSYuri Benditovich         if (isudp && (types & mask)) {
15854474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) ?
15864474e37aSYuri Benditovich                 NetPktRssIpV6UdpEx : NetPktRssIpV6Udp;
15874474e37aSYuri Benditovich         }
15884474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_IP_EX | VIRTIO_NET_RSS_HASH_TYPE_IPv6;
15894474e37aSYuri Benditovich         if (types & mask) {
15904474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) ?
15914474e37aSYuri Benditovich                 NetPktRssIpV6Ex : NetPktRssIpV6;
15924474e37aSYuri Benditovich         }
15934474e37aSYuri Benditovich     }
15944474e37aSYuri Benditovich     return 0xff;
15954474e37aSYuri Benditovich }
15964474e37aSYuri Benditovich 
1597e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report,
1598e22f0603SYuri Benditovich                                    uint32_t hash)
1599e22f0603SYuri Benditovich {
1600e22f0603SYuri Benditovich     struct virtio_net_hdr_v1_hash *hdr = (void *)buf;
1601e22f0603SYuri Benditovich     hdr->hash_value = hash;
1602e22f0603SYuri Benditovich     hdr->hash_report = report;
1603e22f0603SYuri Benditovich }
1604e22f0603SYuri Benditovich 
16054474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf,
160697cd965cSPaolo Bonzini                                   size_t size)
16076e790746SPaolo Bonzini {
16086e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1609e22f0603SYuri Benditovich     unsigned int index = nc->queue_index, new_index = index;
16104474e37aSYuri Benditovich     struct NetRxPkt *pkt = n->rx_pkt;
16114474e37aSYuri Benditovich     uint8_t net_hash_type;
16124474e37aSYuri Benditovich     uint32_t hash;
16134474e37aSYuri Benditovich     bool isip4, isip6, isudp, istcp;
1614e22f0603SYuri Benditovich     static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = {
1615e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv4,
1616e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv4,
1617e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6,
1618e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6,
1619e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6_EX,
1620e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6_EX,
1621e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv4,
1622e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6,
1623e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6_EX
1624e22f0603SYuri Benditovich     };
16254474e37aSYuri Benditovich 
16264474e37aSYuri Benditovich     net_rx_pkt_set_protocols(pkt, buf + n->host_hdr_len,
16274474e37aSYuri Benditovich                              size - n->host_hdr_len);
16284474e37aSYuri Benditovich     net_rx_pkt_get_protocols(pkt, &isip4, &isip6, &isudp, &istcp);
16294474e37aSYuri Benditovich     if (isip4 && (net_rx_pkt_get_ip4_info(pkt)->fragment)) {
16304474e37aSYuri Benditovich         istcp = isudp = false;
16314474e37aSYuri Benditovich     }
16324474e37aSYuri Benditovich     if (isip6 && (net_rx_pkt_get_ip6_info(pkt)->fragment)) {
16334474e37aSYuri Benditovich         istcp = isudp = false;
16344474e37aSYuri Benditovich     }
16354474e37aSYuri Benditovich     net_hash_type = virtio_net_get_hash_type(isip4, isip6, isudp, istcp,
16364474e37aSYuri Benditovich                                              n->rss_data.hash_types);
16374474e37aSYuri Benditovich     if (net_hash_type > NetPktRssIpV6UdpEx) {
1638e22f0603SYuri Benditovich         if (n->rss_data.populate_hash) {
1639e22f0603SYuri Benditovich             virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0);
1640e22f0603SYuri Benditovich         }
1641e22f0603SYuri Benditovich         return n->rss_data.redirect ? n->rss_data.default_queue : -1;
16424474e37aSYuri Benditovich     }
16434474e37aSYuri Benditovich 
16444474e37aSYuri Benditovich     hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key);
1645e22f0603SYuri Benditovich 
1646e22f0603SYuri Benditovich     if (n->rss_data.populate_hash) {
1647e22f0603SYuri Benditovich         virtio_set_packet_hash(buf, reports[net_hash_type], hash);
1648e22f0603SYuri Benditovich     }
1649e22f0603SYuri Benditovich 
1650e22f0603SYuri Benditovich     if (n->rss_data.redirect) {
16514474e37aSYuri Benditovich         new_index = hash & (n->rss_data.indirections_len - 1);
16524474e37aSYuri Benditovich         new_index = n->rss_data.indirections_table[new_index];
16534474e37aSYuri Benditovich     }
1654e22f0603SYuri Benditovich 
1655e22f0603SYuri Benditovich     return (index == new_index) ? -1 : new_index;
16564474e37aSYuri Benditovich }
16574474e37aSYuri Benditovich 
16584474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf,
16594474e37aSYuri Benditovich                                       size_t size, bool no_rss)
16604474e37aSYuri Benditovich {
16614474e37aSYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
16626e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
166317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
16646e790746SPaolo Bonzini     struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
16656e790746SPaolo Bonzini     struct virtio_net_hdr_mrg_rxbuf mhdr;
16666e790746SPaolo Bonzini     unsigned mhdr_cnt = 0;
16676e790746SPaolo Bonzini     size_t offset, i, guest_offset;
16686e790746SPaolo Bonzini 
16696e790746SPaolo Bonzini     if (!virtio_net_can_receive(nc)) {
16706e790746SPaolo Bonzini         return -1;
16716e790746SPaolo Bonzini     }
16726e790746SPaolo Bonzini 
16734474e37aSYuri Benditovich     if (!no_rss && n->rss_data.enabled) {
16744474e37aSYuri Benditovich         int index = virtio_net_process_rss(nc, buf, size);
16754474e37aSYuri Benditovich         if (index >= 0) {
16764474e37aSYuri Benditovich             NetClientState *nc2 = qemu_get_subqueue(n->nic, index);
16774474e37aSYuri Benditovich             return virtio_net_receive_rcu(nc2, buf, size, true);
16784474e37aSYuri Benditovich         }
16794474e37aSYuri Benditovich     }
16804474e37aSYuri Benditovich 
16816e790746SPaolo Bonzini     /* hdr_len refers to the header we supply to the guest */
16826e790746SPaolo Bonzini     if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
16836e790746SPaolo Bonzini         return 0;
16846e790746SPaolo Bonzini     }
16856e790746SPaolo Bonzini 
16866e790746SPaolo Bonzini     if (!receive_filter(n, buf, size))
16876e790746SPaolo Bonzini         return size;
16886e790746SPaolo Bonzini 
16896e790746SPaolo Bonzini     offset = i = 0;
16906e790746SPaolo Bonzini 
16916e790746SPaolo Bonzini     while (offset < size) {
169251b19ebeSPaolo Bonzini         VirtQueueElement *elem;
16936e790746SPaolo Bonzini         int len, total;
169451b19ebeSPaolo Bonzini         const struct iovec *sg;
16956e790746SPaolo Bonzini 
16966e790746SPaolo Bonzini         total = 0;
16976e790746SPaolo Bonzini 
169851b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement));
169951b19ebeSPaolo Bonzini         if (!elem) {
1700ba10b9c0SGreg Kurz             if (i) {
1701ba10b9c0SGreg Kurz                 virtio_error(vdev, "virtio-net unexpected empty queue: "
17026e790746SPaolo Bonzini                              "i %zd mergeable %d offset %zd, size %zd, "
1703019a3edbSGerd Hoffmann                              "guest hdr len %zd, host hdr len %zd "
1704019a3edbSGerd Hoffmann                              "guest features 0x%" PRIx64,
17056e790746SPaolo Bonzini                              i, n->mergeable_rx_bufs, offset, size,
1706019a3edbSGerd Hoffmann                              n->guest_hdr_len, n->host_hdr_len,
1707019a3edbSGerd Hoffmann                              vdev->guest_features);
1708ba10b9c0SGreg Kurz             }
1709ba10b9c0SGreg Kurz             return -1;
17106e790746SPaolo Bonzini         }
17116e790746SPaolo Bonzini 
171251b19ebeSPaolo Bonzini         if (elem->in_num < 1) {
1713ba10b9c0SGreg Kurz             virtio_error(vdev,
1714ba10b9c0SGreg Kurz                          "virtio-net receive queue contains no in buffers");
1715ba10b9c0SGreg Kurz             virtqueue_detach_element(q->rx_vq, elem, 0);
1716ba10b9c0SGreg Kurz             g_free(elem);
1717ba10b9c0SGreg Kurz             return -1;
17186e790746SPaolo Bonzini         }
17196e790746SPaolo Bonzini 
172051b19ebeSPaolo Bonzini         sg = elem->in_sg;
17216e790746SPaolo Bonzini         if (i == 0) {
17226e790746SPaolo Bonzini             assert(offset == 0);
17236e790746SPaolo Bonzini             if (n->mergeable_rx_bufs) {
17246e790746SPaolo Bonzini                 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
172551b19ebeSPaolo Bonzini                                     sg, elem->in_num,
17266e790746SPaolo Bonzini                                     offsetof(typeof(mhdr), num_buffers),
17276e790746SPaolo Bonzini                                     sizeof(mhdr.num_buffers));
17286e790746SPaolo Bonzini             }
17296e790746SPaolo Bonzini 
173051b19ebeSPaolo Bonzini             receive_header(n, sg, elem->in_num, buf, size);
1731e22f0603SYuri Benditovich             if (n->rss_data.populate_hash) {
1732e22f0603SYuri Benditovich                 offset = sizeof(mhdr);
1733e22f0603SYuri Benditovich                 iov_from_buf(sg, elem->in_num, offset,
1734e22f0603SYuri Benditovich                              buf + offset, n->host_hdr_len - sizeof(mhdr));
1735e22f0603SYuri Benditovich             }
17366e790746SPaolo Bonzini             offset = n->host_hdr_len;
17376e790746SPaolo Bonzini             total += n->guest_hdr_len;
17386e790746SPaolo Bonzini             guest_offset = n->guest_hdr_len;
17396e790746SPaolo Bonzini         } else {
17406e790746SPaolo Bonzini             guest_offset = 0;
17416e790746SPaolo Bonzini         }
17426e790746SPaolo Bonzini 
17436e790746SPaolo Bonzini         /* copy in packet.  ugh */
174451b19ebeSPaolo Bonzini         len = iov_from_buf(sg, elem->in_num, guest_offset,
17456e790746SPaolo Bonzini                            buf + offset, size - offset);
17466e790746SPaolo Bonzini         total += len;
17476e790746SPaolo Bonzini         offset += len;
17486e790746SPaolo Bonzini         /* If buffers can't be merged, at this point we
17496e790746SPaolo Bonzini          * must have consumed the complete packet.
17506e790746SPaolo Bonzini          * Otherwise, drop it. */
17516e790746SPaolo Bonzini         if (!n->mergeable_rx_bufs && offset < size) {
175227e57efeSLadi Prosek             virtqueue_unpop(q->rx_vq, elem, total);
175351b19ebeSPaolo Bonzini             g_free(elem);
17546e790746SPaolo Bonzini             return size;
17556e790746SPaolo Bonzini         }
17566e790746SPaolo Bonzini 
17576e790746SPaolo Bonzini         /* signal other side */
175851b19ebeSPaolo Bonzini         virtqueue_fill(q->rx_vq, elem, total, i++);
175951b19ebeSPaolo Bonzini         g_free(elem);
17606e790746SPaolo Bonzini     }
17616e790746SPaolo Bonzini 
17626e790746SPaolo Bonzini     if (mhdr_cnt) {
17631399c60dSRusty Russell         virtio_stw_p(vdev, &mhdr.num_buffers, i);
17646e790746SPaolo Bonzini         iov_from_buf(mhdr_sg, mhdr_cnt,
17656e790746SPaolo Bonzini                      0,
17666e790746SPaolo Bonzini                      &mhdr.num_buffers, sizeof mhdr.num_buffers);
17676e790746SPaolo Bonzini     }
17686e790746SPaolo Bonzini 
17696e790746SPaolo Bonzini     virtqueue_flush(q->rx_vq, i);
177017a0ca55SKONRAD Frederic     virtio_notify(vdev, q->rx_vq);
17716e790746SPaolo Bonzini 
17726e790746SPaolo Bonzini     return size;
17736e790746SPaolo Bonzini }
17746e790746SPaolo Bonzini 
17752974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf,
177697cd965cSPaolo Bonzini                                   size_t size)
177797cd965cSPaolo Bonzini {
1778068ddfa9SDr. David Alan Gilbert     RCU_READ_LOCK_GUARD();
177997cd965cSPaolo Bonzini 
17804474e37aSYuri Benditovich     return virtio_net_receive_rcu(nc, buf, size, false);
178197cd965cSPaolo Bonzini }
178297cd965cSPaolo Bonzini 
17832974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain,
17842974e916SYuri Benditovich                                          const uint8_t *buf,
17852974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
17862974e916SYuri Benditovich {
17872974e916SYuri Benditovich     uint16_t ip_hdrlen;
17882974e916SYuri Benditovich     struct ip_header *ip;
17892974e916SYuri Benditovich 
17902974e916SYuri Benditovich     ip = (struct ip_header *)(buf + chain->n->guest_hdr_len
17912974e916SYuri Benditovich                               + sizeof(struct eth_header));
17922974e916SYuri Benditovich     unit->ip = (void *)ip;
17932974e916SYuri Benditovich     ip_hdrlen = (ip->ip_ver_len & 0xF) << 2;
17942974e916SYuri Benditovich     unit->ip_plen = &ip->ip_len;
17952974e916SYuri Benditovich     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen);
17962974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
17972974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen;
17982974e916SYuri Benditovich }
17992974e916SYuri Benditovich 
18002974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain,
18012974e916SYuri Benditovich                                          const uint8_t *buf,
18022974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
18032974e916SYuri Benditovich {
18042974e916SYuri Benditovich     struct ip6_header *ip6;
18052974e916SYuri Benditovich 
18062974e916SYuri Benditovich     ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len
18072974e916SYuri Benditovich                                  + sizeof(struct eth_header));
18082974e916SYuri Benditovich     unit->ip = ip6;
18092974e916SYuri Benditovich     unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
181078ee6bd0SPhilippe Mathieu-Daudé     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip)
18112974e916SYuri Benditovich                                         + sizeof(struct ip6_header));
18122974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
18132974e916SYuri Benditovich 
18142974e916SYuri Benditovich     /* There is a difference between payload lenght in ipv4 and v6,
18152974e916SYuri Benditovich        ip header is excluded in ipv6 */
18162974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen;
18172974e916SYuri Benditovich }
18182974e916SYuri Benditovich 
18192974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain,
18202974e916SYuri Benditovich                                        VirtioNetRscSeg *seg)
18212974e916SYuri Benditovich {
18222974e916SYuri Benditovich     int ret;
1823dd3d85e8SYuri Benditovich     struct virtio_net_hdr_v1 *h;
18242974e916SYuri Benditovich 
1825dd3d85e8SYuri Benditovich     h = (struct virtio_net_hdr_v1 *)seg->buf;
18262974e916SYuri Benditovich     h->flags = 0;
18272974e916SYuri Benditovich     h->gso_type = VIRTIO_NET_HDR_GSO_NONE;
18282974e916SYuri Benditovich 
18292974e916SYuri Benditovich     if (seg->is_coalesced) {
1830dd3d85e8SYuri Benditovich         h->rsc.segments = seg->packets;
1831dd3d85e8SYuri Benditovich         h->rsc.dup_acks = seg->dup_ack;
18322974e916SYuri Benditovich         h->flags = VIRTIO_NET_HDR_F_RSC_INFO;
18332974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
18342974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
18352974e916SYuri Benditovich         } else {
18362974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
18372974e916SYuri Benditovich         }
18382974e916SYuri Benditovich     }
18392974e916SYuri Benditovich 
18402974e916SYuri Benditovich     ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size);
18412974e916SYuri Benditovich     QTAILQ_REMOVE(&chain->buffers, seg, next);
18422974e916SYuri Benditovich     g_free(seg->buf);
18432974e916SYuri Benditovich     g_free(seg);
18442974e916SYuri Benditovich 
18452974e916SYuri Benditovich     return ret;
18462974e916SYuri Benditovich }
18472974e916SYuri Benditovich 
18482974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq)
18492974e916SYuri Benditovich {
18502974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn;
18512974e916SYuri Benditovich     VirtioNetRscChain *chain = (VirtioNetRscChain *)opq;
18522974e916SYuri Benditovich 
18532974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) {
18542974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
18552974e916SYuri Benditovich             chain->stat.purge_failed++;
18562974e916SYuri Benditovich             continue;
18572974e916SYuri Benditovich         }
18582974e916SYuri Benditovich     }
18592974e916SYuri Benditovich 
18602974e916SYuri Benditovich     chain->stat.timer++;
18612974e916SYuri Benditovich     if (!QTAILQ_EMPTY(&chain->buffers)) {
18622974e916SYuri Benditovich         timer_mod(chain->drain_timer,
18632974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
18642974e916SYuri Benditovich     }
18652974e916SYuri Benditovich }
18662974e916SYuri Benditovich 
18672974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n)
18682974e916SYuri Benditovich {
18692974e916SYuri Benditovich     VirtioNetRscChain *chain, *rn_chain;
18702974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn_seg;
18712974e916SYuri Benditovich 
18722974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) {
18732974e916SYuri Benditovich         QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) {
18742974e916SYuri Benditovich             QTAILQ_REMOVE(&chain->buffers, seg, next);
18752974e916SYuri Benditovich             g_free(seg->buf);
18762974e916SYuri Benditovich             g_free(seg);
18772974e916SYuri Benditovich         }
18782974e916SYuri Benditovich 
18792974e916SYuri Benditovich         timer_del(chain->drain_timer);
18802974e916SYuri Benditovich         timer_free(chain->drain_timer);
18812974e916SYuri Benditovich         QTAILQ_REMOVE(&n->rsc_chains, chain, next);
18822974e916SYuri Benditovich         g_free(chain);
18832974e916SYuri Benditovich     }
18842974e916SYuri Benditovich }
18852974e916SYuri Benditovich 
18862974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain,
18872974e916SYuri Benditovich                                      NetClientState *nc,
18882974e916SYuri Benditovich                                      const uint8_t *buf, size_t size)
18892974e916SYuri Benditovich {
18902974e916SYuri Benditovich     uint16_t hdr_len;
18912974e916SYuri Benditovich     VirtioNetRscSeg *seg;
18922974e916SYuri Benditovich 
18932974e916SYuri Benditovich     hdr_len = chain->n->guest_hdr_len;
18942974e916SYuri Benditovich     seg = g_malloc(sizeof(VirtioNetRscSeg));
18952974e916SYuri Benditovich     seg->buf = g_malloc(hdr_len + sizeof(struct eth_header)
18962974e916SYuri Benditovich         + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD);
18972974e916SYuri Benditovich     memcpy(seg->buf, buf, size);
18982974e916SYuri Benditovich     seg->size = size;
18992974e916SYuri Benditovich     seg->packets = 1;
19002974e916SYuri Benditovich     seg->dup_ack = 0;
19012974e916SYuri Benditovich     seg->is_coalesced = 0;
19022974e916SYuri Benditovich     seg->nc = nc;
19032974e916SYuri Benditovich 
19042974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&chain->buffers, seg, next);
19052974e916SYuri Benditovich     chain->stat.cache++;
19062974e916SYuri Benditovich 
19072974e916SYuri Benditovich     switch (chain->proto) {
19082974e916SYuri Benditovich     case ETH_P_IP:
19092974e916SYuri Benditovich         virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit);
19102974e916SYuri Benditovich         break;
19112974e916SYuri Benditovich     case ETH_P_IPV6:
19122974e916SYuri Benditovich         virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit);
19132974e916SYuri Benditovich         break;
19142974e916SYuri Benditovich     default:
19152974e916SYuri Benditovich         g_assert_not_reached();
19162974e916SYuri Benditovich     }
19172974e916SYuri Benditovich }
19182974e916SYuri Benditovich 
19192974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain,
19202974e916SYuri Benditovich                                          VirtioNetRscSeg *seg,
19212974e916SYuri Benditovich                                          const uint8_t *buf,
19222974e916SYuri Benditovich                                          struct tcp_header *n_tcp,
19232974e916SYuri Benditovich                                          struct tcp_header *o_tcp)
19242974e916SYuri Benditovich {
19252974e916SYuri Benditovich     uint32_t nack, oack;
19262974e916SYuri Benditovich     uint16_t nwin, owin;
19272974e916SYuri Benditovich 
19282974e916SYuri Benditovich     nack = htonl(n_tcp->th_ack);
19292974e916SYuri Benditovich     nwin = htons(n_tcp->th_win);
19302974e916SYuri Benditovich     oack = htonl(o_tcp->th_ack);
19312974e916SYuri Benditovich     owin = htons(o_tcp->th_win);
19322974e916SYuri Benditovich 
19332974e916SYuri Benditovich     if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) {
19342974e916SYuri Benditovich         chain->stat.ack_out_of_win++;
19352974e916SYuri Benditovich         return RSC_FINAL;
19362974e916SYuri Benditovich     } else if (nack == oack) {
19372974e916SYuri Benditovich         /* duplicated ack or window probe */
19382974e916SYuri Benditovich         if (nwin == owin) {
19392974e916SYuri Benditovich             /* duplicated ack, add dup ack count due to whql test up to 1 */
19402974e916SYuri Benditovich             chain->stat.dup_ack++;
19412974e916SYuri Benditovich             return RSC_FINAL;
19422974e916SYuri Benditovich         } else {
19432974e916SYuri Benditovich             /* Coalesce window update */
19442974e916SYuri Benditovich             o_tcp->th_win = n_tcp->th_win;
19452974e916SYuri Benditovich             chain->stat.win_update++;
19462974e916SYuri Benditovich             return RSC_COALESCE;
19472974e916SYuri Benditovich         }
19482974e916SYuri Benditovich     } else {
19492974e916SYuri Benditovich         /* pure ack, go to 'C', finalize*/
19502974e916SYuri Benditovich         chain->stat.pure_ack++;
19512974e916SYuri Benditovich         return RSC_FINAL;
19522974e916SYuri Benditovich     }
19532974e916SYuri Benditovich }
19542974e916SYuri Benditovich 
19552974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain,
19562974e916SYuri Benditovich                                             VirtioNetRscSeg *seg,
19572974e916SYuri Benditovich                                             const uint8_t *buf,
19582974e916SYuri Benditovich                                             VirtioNetRscUnit *n_unit)
19592974e916SYuri Benditovich {
19602974e916SYuri Benditovich     void *data;
19612974e916SYuri Benditovich     uint16_t o_ip_len;
19622974e916SYuri Benditovich     uint32_t nseq, oseq;
19632974e916SYuri Benditovich     VirtioNetRscUnit *o_unit;
19642974e916SYuri Benditovich 
19652974e916SYuri Benditovich     o_unit = &seg->unit;
19662974e916SYuri Benditovich     o_ip_len = htons(*o_unit->ip_plen);
19672974e916SYuri Benditovich     nseq = htonl(n_unit->tcp->th_seq);
19682974e916SYuri Benditovich     oseq = htonl(o_unit->tcp->th_seq);
19692974e916SYuri Benditovich 
19702974e916SYuri Benditovich     /* out of order or retransmitted. */
19712974e916SYuri Benditovich     if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) {
19722974e916SYuri Benditovich         chain->stat.data_out_of_win++;
19732974e916SYuri Benditovich         return RSC_FINAL;
19742974e916SYuri Benditovich     }
19752974e916SYuri Benditovich 
19762974e916SYuri Benditovich     data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen;
19772974e916SYuri Benditovich     if (nseq == oseq) {
19782974e916SYuri Benditovich         if ((o_unit->payload == 0) && n_unit->payload) {
19792974e916SYuri Benditovich             /* From no payload to payload, normal case, not a dup ack or etc */
19802974e916SYuri Benditovich             chain->stat.data_after_pure_ack++;
19812974e916SYuri Benditovich             goto coalesce;
19822974e916SYuri Benditovich         } else {
19832974e916SYuri Benditovich             return virtio_net_rsc_handle_ack(chain, seg, buf,
19842974e916SYuri Benditovich                                              n_unit->tcp, o_unit->tcp);
19852974e916SYuri Benditovich         }
19862974e916SYuri Benditovich     } else if ((nseq - oseq) != o_unit->payload) {
19872974e916SYuri Benditovich         /* Not a consistent packet, out of order */
19882974e916SYuri Benditovich         chain->stat.data_out_of_order++;
19892974e916SYuri Benditovich         return RSC_FINAL;
19902974e916SYuri Benditovich     } else {
19912974e916SYuri Benditovich coalesce:
19922974e916SYuri Benditovich         if ((o_ip_len + n_unit->payload) > chain->max_payload) {
19932974e916SYuri Benditovich             chain->stat.over_size++;
19942974e916SYuri Benditovich             return RSC_FINAL;
19952974e916SYuri Benditovich         }
19962974e916SYuri Benditovich 
19972974e916SYuri Benditovich         /* Here comes the right data, the payload length in v4/v6 is different,
19982974e916SYuri Benditovich            so use the field value to update and record the new data len */
19992974e916SYuri Benditovich         o_unit->payload += n_unit->payload; /* update new data len */
20002974e916SYuri Benditovich 
20012974e916SYuri Benditovich         /* update field in ip header */
20022974e916SYuri Benditovich         *o_unit->ip_plen = htons(o_ip_len + n_unit->payload);
20032974e916SYuri Benditovich 
20042974e916SYuri Benditovich         /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced
20052974e916SYuri Benditovich            for windows guest, while this may change the behavior for linux
20062974e916SYuri Benditovich            guest (only if it uses RSC feature). */
20072974e916SYuri Benditovich         o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags;
20082974e916SYuri Benditovich 
20092974e916SYuri Benditovich         o_unit->tcp->th_ack = n_unit->tcp->th_ack;
20102974e916SYuri Benditovich         o_unit->tcp->th_win = n_unit->tcp->th_win;
20112974e916SYuri Benditovich 
20122974e916SYuri Benditovich         memmove(seg->buf + seg->size, data, n_unit->payload);
20132974e916SYuri Benditovich         seg->size += n_unit->payload;
20142974e916SYuri Benditovich         seg->packets++;
20152974e916SYuri Benditovich         chain->stat.coalesced++;
20162974e916SYuri Benditovich         return RSC_COALESCE;
20172974e916SYuri Benditovich     }
20182974e916SYuri Benditovich }
20192974e916SYuri Benditovich 
20202974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain,
20212974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
20222974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
20232974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
20242974e916SYuri Benditovich {
20252974e916SYuri Benditovich     struct ip_header *ip1, *ip2;
20262974e916SYuri Benditovich 
20272974e916SYuri Benditovich     ip1 = (struct ip_header *)(unit->ip);
20282974e916SYuri Benditovich     ip2 = (struct ip_header *)(seg->unit.ip);
20292974e916SYuri Benditovich     if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst)
20302974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
20312974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
20322974e916SYuri Benditovich         chain->stat.no_match++;
20332974e916SYuri Benditovich         return RSC_NO_MATCH;
20342974e916SYuri Benditovich     }
20352974e916SYuri Benditovich 
20362974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
20372974e916SYuri Benditovich }
20382974e916SYuri Benditovich 
20392974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain,
20402974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
20412974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
20422974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
20432974e916SYuri Benditovich {
20442974e916SYuri Benditovich     struct ip6_header *ip1, *ip2;
20452974e916SYuri Benditovich 
20462974e916SYuri Benditovich     ip1 = (struct ip6_header *)(unit->ip);
20472974e916SYuri Benditovich     ip2 = (struct ip6_header *)(seg->unit.ip);
20482974e916SYuri Benditovich     if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address))
20492974e916SYuri Benditovich         || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address))
20502974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
20512974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
20522974e916SYuri Benditovich             chain->stat.no_match++;
20532974e916SYuri Benditovich             return RSC_NO_MATCH;
20542974e916SYuri Benditovich     }
20552974e916SYuri Benditovich 
20562974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
20572974e916SYuri Benditovich }
20582974e916SYuri Benditovich 
20592974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain
20602974e916SYuri Benditovich  * to prevent out of order */
20612974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain,
20622974e916SYuri Benditovich                                          struct tcp_header *tcp)
20632974e916SYuri Benditovich {
20642974e916SYuri Benditovich     uint16_t tcp_hdr;
20652974e916SYuri Benditovich     uint16_t tcp_flag;
20662974e916SYuri Benditovich 
20672974e916SYuri Benditovich     tcp_flag = htons(tcp->th_offset_flags);
20682974e916SYuri Benditovich     tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10;
20692974e916SYuri Benditovich     tcp_flag &= VIRTIO_NET_TCP_FLAG;
20702974e916SYuri Benditovich     tcp_flag = htons(tcp->th_offset_flags) & 0x3F;
20712974e916SYuri Benditovich     if (tcp_flag & TH_SYN) {
20722974e916SYuri Benditovich         chain->stat.tcp_syn++;
20732974e916SYuri Benditovich         return RSC_BYPASS;
20742974e916SYuri Benditovich     }
20752974e916SYuri Benditovich 
20762974e916SYuri Benditovich     if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) {
20772974e916SYuri Benditovich         chain->stat.tcp_ctrl_drain++;
20782974e916SYuri Benditovich         return RSC_FINAL;
20792974e916SYuri Benditovich     }
20802974e916SYuri Benditovich 
20812974e916SYuri Benditovich     if (tcp_hdr > sizeof(struct tcp_header)) {
20822974e916SYuri Benditovich         chain->stat.tcp_all_opt++;
20832974e916SYuri Benditovich         return RSC_FINAL;
20842974e916SYuri Benditovich     }
20852974e916SYuri Benditovich 
20862974e916SYuri Benditovich     return RSC_CANDIDATE;
20872974e916SYuri Benditovich }
20882974e916SYuri Benditovich 
20892974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain,
20902974e916SYuri Benditovich                                          NetClientState *nc,
20912974e916SYuri Benditovich                                          const uint8_t *buf, size_t size,
20922974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
20932974e916SYuri Benditovich {
20942974e916SYuri Benditovich     int ret;
20952974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
20962974e916SYuri Benditovich 
20972974e916SYuri Benditovich     if (QTAILQ_EMPTY(&chain->buffers)) {
20982974e916SYuri Benditovich         chain->stat.empty_cache++;
20992974e916SYuri Benditovich         virtio_net_rsc_cache_buf(chain, nc, buf, size);
21002974e916SYuri Benditovich         timer_mod(chain->drain_timer,
21012974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
21022974e916SYuri Benditovich         return size;
21032974e916SYuri Benditovich     }
21042974e916SYuri Benditovich 
21052974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
21062974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
21072974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit);
21082974e916SYuri Benditovich         } else {
21092974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit);
21102974e916SYuri Benditovich         }
21112974e916SYuri Benditovich 
21122974e916SYuri Benditovich         if (ret == RSC_FINAL) {
21132974e916SYuri Benditovich             if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
21142974e916SYuri Benditovich                 /* Send failed */
21152974e916SYuri Benditovich                 chain->stat.final_failed++;
21162974e916SYuri Benditovich                 return 0;
21172974e916SYuri Benditovich             }
21182974e916SYuri Benditovich 
21192974e916SYuri Benditovich             /* Send current packet */
21202974e916SYuri Benditovich             return virtio_net_do_receive(nc, buf, size);
21212974e916SYuri Benditovich         } else if (ret == RSC_NO_MATCH) {
21222974e916SYuri Benditovich             continue;
21232974e916SYuri Benditovich         } else {
21242974e916SYuri Benditovich             /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */
21252974e916SYuri Benditovich             seg->is_coalesced = 1;
21262974e916SYuri Benditovich             return size;
21272974e916SYuri Benditovich         }
21282974e916SYuri Benditovich     }
21292974e916SYuri Benditovich 
21302974e916SYuri Benditovich     chain->stat.no_match_cache++;
21312974e916SYuri Benditovich     virtio_net_rsc_cache_buf(chain, nc, buf, size);
21322974e916SYuri Benditovich     return size;
21332974e916SYuri Benditovich }
21342974e916SYuri Benditovich 
21352974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */
21362974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain,
21372974e916SYuri Benditovich                                         NetClientState *nc,
21382974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
21392974e916SYuri Benditovich                                         uint16_t ip_start, uint16_t ip_size,
21402974e916SYuri Benditovich                                         uint16_t tcp_port)
21412974e916SYuri Benditovich {
21422974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
21432974e916SYuri Benditovich     uint32_t ppair1, ppair2;
21442974e916SYuri Benditovich 
21452974e916SYuri Benditovich     ppair1 = *(uint32_t *)(buf + tcp_port);
21462974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
21472974e916SYuri Benditovich         ppair2 = *(uint32_t *)(seg->buf + tcp_port);
21482974e916SYuri Benditovich         if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size)
21492974e916SYuri Benditovich             || (ppair1 != ppair2)) {
21502974e916SYuri Benditovich             continue;
21512974e916SYuri Benditovich         }
21522974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
21532974e916SYuri Benditovich             chain->stat.drain_failed++;
21542974e916SYuri Benditovich         }
21552974e916SYuri Benditovich 
21562974e916SYuri Benditovich         break;
21572974e916SYuri Benditovich     }
21582974e916SYuri Benditovich 
21592974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
21602974e916SYuri Benditovich }
21612974e916SYuri Benditovich 
21622974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain,
21632974e916SYuri Benditovich                                             struct ip_header *ip,
21642974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
21652974e916SYuri Benditovich {
21662974e916SYuri Benditovich     uint16_t ip_len;
21672974e916SYuri Benditovich 
21682974e916SYuri Benditovich     /* Not an ipv4 packet */
21692974e916SYuri Benditovich     if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) {
21702974e916SYuri Benditovich         chain->stat.ip_option++;
21712974e916SYuri Benditovich         return RSC_BYPASS;
21722974e916SYuri Benditovich     }
21732974e916SYuri Benditovich 
21742974e916SYuri Benditovich     /* Don't handle packets with ip option */
21752974e916SYuri Benditovich     if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) {
21762974e916SYuri Benditovich         chain->stat.ip_option++;
21772974e916SYuri Benditovich         return RSC_BYPASS;
21782974e916SYuri Benditovich     }
21792974e916SYuri Benditovich 
21802974e916SYuri Benditovich     if (ip->ip_p != IPPROTO_TCP) {
21812974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
21822974e916SYuri Benditovich         return RSC_BYPASS;
21832974e916SYuri Benditovich     }
21842974e916SYuri Benditovich 
21852974e916SYuri Benditovich     /* Don't handle packets with ip fragment */
21862974e916SYuri Benditovich     if (!(htons(ip->ip_off) & IP_DF)) {
21872974e916SYuri Benditovich         chain->stat.ip_frag++;
21882974e916SYuri Benditovich         return RSC_BYPASS;
21892974e916SYuri Benditovich     }
21902974e916SYuri Benditovich 
21912974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
21922974e916SYuri Benditovich     if (IPTOS_ECN(ip->ip_tos)) {
21932974e916SYuri Benditovich         chain->stat.ip_ecn++;
21942974e916SYuri Benditovich         return RSC_BYPASS;
21952974e916SYuri Benditovich     }
21962974e916SYuri Benditovich 
21972974e916SYuri Benditovich     ip_len = htons(ip->ip_len);
21982974e916SYuri Benditovich     if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header))
21992974e916SYuri Benditovich         || ip_len > (size - chain->n->guest_hdr_len -
22002974e916SYuri Benditovich                      sizeof(struct eth_header))) {
22012974e916SYuri Benditovich         chain->stat.ip_hacked++;
22022974e916SYuri Benditovich         return RSC_BYPASS;
22032974e916SYuri Benditovich     }
22042974e916SYuri Benditovich 
22052974e916SYuri Benditovich     return RSC_CANDIDATE;
22062974e916SYuri Benditovich }
22072974e916SYuri Benditovich 
22082974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain,
22092974e916SYuri Benditovich                                       NetClientState *nc,
22102974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
22112974e916SYuri Benditovich {
22122974e916SYuri Benditovich     int32_t ret;
22132974e916SYuri Benditovich     uint16_t hdr_len;
22142974e916SYuri Benditovich     VirtioNetRscUnit unit;
22152974e916SYuri Benditovich 
22162974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
22172974e916SYuri Benditovich 
22182974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)
22192974e916SYuri Benditovich         + sizeof(struct tcp_header))) {
22202974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
22212974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22222974e916SYuri Benditovich     }
22232974e916SYuri Benditovich 
22242974e916SYuri Benditovich     virtio_net_rsc_extract_unit4(chain, buf, &unit);
22252974e916SYuri Benditovich     if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size)
22262974e916SYuri Benditovich         != RSC_CANDIDATE) {
22272974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22282974e916SYuri Benditovich     }
22292974e916SYuri Benditovich 
22302974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
22312974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
22322974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22332974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
22342974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
22352974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 12),
22362974e916SYuri Benditovich                 VIRTIO_NET_IP4_ADDR_SIZE,
22372974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header));
22382974e916SYuri Benditovich     }
22392974e916SYuri Benditovich 
22402974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
22412974e916SYuri Benditovich }
22422974e916SYuri Benditovich 
22432974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain,
22442974e916SYuri Benditovich                                             struct ip6_header *ip6,
22452974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
22462974e916SYuri Benditovich {
22472974e916SYuri Benditovich     uint16_t ip_len;
22482974e916SYuri Benditovich 
22492974e916SYuri Benditovich     if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4)
22502974e916SYuri Benditovich         != IP_HEADER_VERSION_6) {
22512974e916SYuri Benditovich         return RSC_BYPASS;
22522974e916SYuri Benditovich     }
22532974e916SYuri Benditovich 
22542974e916SYuri Benditovich     /* Both option and protocol is checked in this */
22552974e916SYuri Benditovich     if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) {
22562974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
22572974e916SYuri Benditovich         return RSC_BYPASS;
22582974e916SYuri Benditovich     }
22592974e916SYuri Benditovich 
22602974e916SYuri Benditovich     ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
22612974e916SYuri Benditovich     if (ip_len < sizeof(struct tcp_header) ||
22622974e916SYuri Benditovich         ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header)
22632974e916SYuri Benditovich                   - sizeof(struct ip6_header))) {
22642974e916SYuri Benditovich         chain->stat.ip_hacked++;
22652974e916SYuri Benditovich         return RSC_BYPASS;
22662974e916SYuri Benditovich     }
22672974e916SYuri Benditovich 
22682974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
22692974e916SYuri Benditovich     if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) {
22702974e916SYuri Benditovich         chain->stat.ip_ecn++;
22712974e916SYuri Benditovich         return RSC_BYPASS;
22722974e916SYuri Benditovich     }
22732974e916SYuri Benditovich 
22742974e916SYuri Benditovich     return RSC_CANDIDATE;
22752974e916SYuri Benditovich }
22762974e916SYuri Benditovich 
22772974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc,
22782974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
22792974e916SYuri Benditovich {
22802974e916SYuri Benditovich     int32_t ret;
22812974e916SYuri Benditovich     uint16_t hdr_len;
22822974e916SYuri Benditovich     VirtioNetRscChain *chain;
22832974e916SYuri Benditovich     VirtioNetRscUnit unit;
22842974e916SYuri Benditovich 
22852974e916SYuri Benditovich     chain = (VirtioNetRscChain *)opq;
22862974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
22872974e916SYuri Benditovich 
22882974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header)
22892974e916SYuri Benditovich         + sizeof(tcp_header))) {
22902974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22912974e916SYuri Benditovich     }
22922974e916SYuri Benditovich 
22932974e916SYuri Benditovich     virtio_net_rsc_extract_unit6(chain, buf, &unit);
22942974e916SYuri Benditovich     if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain,
22952974e916SYuri Benditovich                                                  unit.ip, buf, size)) {
22962974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
22972974e916SYuri Benditovich     }
22982974e916SYuri Benditovich 
22992974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
23002974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
23012974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23022974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
23032974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
23042974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 8),
23052974e916SYuri Benditovich                 VIRTIO_NET_IP6_ADDR_SIZE,
23062974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header)
23072974e916SYuri Benditovich                 + sizeof(struct ip6_header));
23082974e916SYuri Benditovich     }
23092974e916SYuri Benditovich 
23102974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
23112974e916SYuri Benditovich }
23122974e916SYuri Benditovich 
23132974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n,
23142974e916SYuri Benditovich                                                       NetClientState *nc,
23152974e916SYuri Benditovich                                                       uint16_t proto)
23162974e916SYuri Benditovich {
23172974e916SYuri Benditovich     VirtioNetRscChain *chain;
23182974e916SYuri Benditovich 
23192974e916SYuri Benditovich     if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) {
23202974e916SYuri Benditovich         return NULL;
23212974e916SYuri Benditovich     }
23222974e916SYuri Benditovich 
23232974e916SYuri Benditovich     QTAILQ_FOREACH(chain, &n->rsc_chains, next) {
23242974e916SYuri Benditovich         if (chain->proto == proto) {
23252974e916SYuri Benditovich             return chain;
23262974e916SYuri Benditovich         }
23272974e916SYuri Benditovich     }
23282974e916SYuri Benditovich 
23292974e916SYuri Benditovich     chain = g_malloc(sizeof(*chain));
23302974e916SYuri Benditovich     chain->n = n;
23312974e916SYuri Benditovich     chain->proto = proto;
23322974e916SYuri Benditovich     if (proto == (uint16_t)ETH_P_IP) {
23332974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD;
23342974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
23352974e916SYuri Benditovich     } else {
23362974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD;
23372974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
23382974e916SYuri Benditovich     }
23392974e916SYuri Benditovich     chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST,
23402974e916SYuri Benditovich                                       virtio_net_rsc_purge, chain);
23412974e916SYuri Benditovich     memset(&chain->stat, 0, sizeof(chain->stat));
23422974e916SYuri Benditovich 
23432974e916SYuri Benditovich     QTAILQ_INIT(&chain->buffers);
23442974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next);
23452974e916SYuri Benditovich 
23462974e916SYuri Benditovich     return chain;
23472974e916SYuri Benditovich }
23482974e916SYuri Benditovich 
23492974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc,
23502974e916SYuri Benditovich                                       const uint8_t *buf,
23512974e916SYuri Benditovich                                       size_t size)
23522974e916SYuri Benditovich {
23532974e916SYuri Benditovich     uint16_t proto;
23542974e916SYuri Benditovich     VirtioNetRscChain *chain;
23552974e916SYuri Benditovich     struct eth_header *eth;
23562974e916SYuri Benditovich     VirtIONet *n;
23572974e916SYuri Benditovich 
23582974e916SYuri Benditovich     n = qemu_get_nic_opaque(nc);
23592974e916SYuri Benditovich     if (size < (n->host_hdr_len + sizeof(struct eth_header))) {
23602974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23612974e916SYuri Benditovich     }
23622974e916SYuri Benditovich 
23632974e916SYuri Benditovich     eth = (struct eth_header *)(buf + n->guest_hdr_len);
23642974e916SYuri Benditovich     proto = htons(eth->h_proto);
23652974e916SYuri Benditovich 
23662974e916SYuri Benditovich     chain = virtio_net_rsc_lookup_chain(n, nc, proto);
23672974e916SYuri Benditovich     if (chain) {
23682974e916SYuri Benditovich         chain->stat.received++;
23692974e916SYuri Benditovich         if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) {
23702974e916SYuri Benditovich             return virtio_net_rsc_receive4(chain, nc, buf, size);
23712974e916SYuri Benditovich         } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) {
23722974e916SYuri Benditovich             return virtio_net_rsc_receive6(chain, nc, buf, size);
23732974e916SYuri Benditovich         }
23742974e916SYuri Benditovich     }
23752974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
23762974e916SYuri Benditovich }
23772974e916SYuri Benditovich 
23782974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf,
23792974e916SYuri Benditovich                                   size_t size)
23802974e916SYuri Benditovich {
23812974e916SYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
23822974e916SYuri Benditovich     if ((n->rsc4_enabled || n->rsc6_enabled)) {
23832974e916SYuri Benditovich         return virtio_net_rsc_receive(nc, buf, size);
23842974e916SYuri Benditovich     } else {
23852974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23862974e916SYuri Benditovich     }
23872974e916SYuri Benditovich }
23882974e916SYuri Benditovich 
23896e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
23906e790746SPaolo Bonzini 
23916e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
23926e790746SPaolo Bonzini {
23936e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
23946e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
239517a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
23966e790746SPaolo Bonzini 
239751b19ebeSPaolo Bonzini     virtqueue_push(q->tx_vq, q->async_tx.elem, 0);
239817a0ca55SKONRAD Frederic     virtio_notify(vdev, q->tx_vq);
23996e790746SPaolo Bonzini 
240051b19ebeSPaolo Bonzini     g_free(q->async_tx.elem);
240151b19ebeSPaolo Bonzini     q->async_tx.elem = NULL;
24026e790746SPaolo Bonzini 
24036e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
24046e790746SPaolo Bonzini     virtio_net_flush_tx(q);
24056e790746SPaolo Bonzini }
24066e790746SPaolo Bonzini 
24076e790746SPaolo Bonzini /* TX */
24086e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
24096e790746SPaolo Bonzini {
24106e790746SPaolo Bonzini     VirtIONet *n = q->n;
241117a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
241251b19ebeSPaolo Bonzini     VirtQueueElement *elem;
24136e790746SPaolo Bonzini     int32_t num_packets = 0;
24146e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
241517a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
24166e790746SPaolo Bonzini         return num_packets;
24176e790746SPaolo Bonzini     }
24186e790746SPaolo Bonzini 
241951b19ebeSPaolo Bonzini     if (q->async_tx.elem) {
24206e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
24216e790746SPaolo Bonzini         return num_packets;
24226e790746SPaolo Bonzini     }
24236e790746SPaolo Bonzini 
242451b19ebeSPaolo Bonzini     for (;;) {
2425bd89dd98SJason Wang         ssize_t ret;
242651b19ebeSPaolo Bonzini         unsigned int out_num;
242751b19ebeSPaolo Bonzini         struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg;
2428feb93f36SJason Wang         struct virtio_net_hdr_mrg_rxbuf mhdr;
24296e790746SPaolo Bonzini 
243051b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement));
243151b19ebeSPaolo Bonzini         if (!elem) {
243251b19ebeSPaolo Bonzini             break;
243351b19ebeSPaolo Bonzini         }
243451b19ebeSPaolo Bonzini 
243551b19ebeSPaolo Bonzini         out_num = elem->out_num;
243651b19ebeSPaolo Bonzini         out_sg = elem->out_sg;
24376e790746SPaolo Bonzini         if (out_num < 1) {
2438fa5e56c2SGreg Kurz             virtio_error(vdev, "virtio-net header not in first element");
2439fa5e56c2SGreg Kurz             virtqueue_detach_element(q->tx_vq, elem, 0);
2440fa5e56c2SGreg Kurz             g_free(elem);
2441fa5e56c2SGreg Kurz             return -EINVAL;
24426e790746SPaolo Bonzini         }
24436e790746SPaolo Bonzini 
2444032a74a1SCédric Le Goater         if (n->has_vnet_hdr) {
2445feb93f36SJason Wang             if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) <
2446feb93f36SJason Wang                 n->guest_hdr_len) {
2447fa5e56c2SGreg Kurz                 virtio_error(vdev, "virtio-net header incorrect");
2448fa5e56c2SGreg Kurz                 virtqueue_detach_element(q->tx_vq, elem, 0);
2449fa5e56c2SGreg Kurz                 g_free(elem);
2450fa5e56c2SGreg Kurz                 return -EINVAL;
2451032a74a1SCédric Le Goater             }
24521bfa316cSGreg Kurz             if (n->needs_vnet_hdr_swap) {
2453feb93f36SJason Wang                 virtio_net_hdr_swap(vdev, (void *) &mhdr);
2454feb93f36SJason Wang                 sg2[0].iov_base = &mhdr;
2455feb93f36SJason Wang                 sg2[0].iov_len = n->guest_hdr_len;
2456feb93f36SJason Wang                 out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1,
2457feb93f36SJason Wang                                    out_sg, out_num,
2458feb93f36SJason Wang                                    n->guest_hdr_len, -1);
2459feb93f36SJason Wang                 if (out_num == VIRTQUEUE_MAX_SIZE) {
2460feb93f36SJason Wang                     goto drop;
2461032a74a1SCédric Le Goater                 }
2462feb93f36SJason Wang                 out_num += 1;
2463feb93f36SJason Wang                 out_sg = sg2;
2464feb93f36SJason Wang             }
2465feb93f36SJason Wang         }
24666e790746SPaolo Bonzini         /*
24676e790746SPaolo Bonzini          * If host wants to see the guest header as is, we can
24686e790746SPaolo Bonzini          * pass it on unchanged. Otherwise, copy just the parts
24696e790746SPaolo Bonzini          * that host is interested in.
24706e790746SPaolo Bonzini          */
24716e790746SPaolo Bonzini         assert(n->host_hdr_len <= n->guest_hdr_len);
24726e790746SPaolo Bonzini         if (n->host_hdr_len != n->guest_hdr_len) {
24736e790746SPaolo Bonzini             unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
24746e790746SPaolo Bonzini                                        out_sg, out_num,
24756e790746SPaolo Bonzini                                        0, n->host_hdr_len);
24766e790746SPaolo Bonzini             sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
24776e790746SPaolo Bonzini                              out_sg, out_num,
24786e790746SPaolo Bonzini                              n->guest_hdr_len, -1);
24796e790746SPaolo Bonzini             out_num = sg_num;
24806e790746SPaolo Bonzini             out_sg = sg;
24816e790746SPaolo Bonzini         }
24826e790746SPaolo Bonzini 
24836e790746SPaolo Bonzini         ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
24846e790746SPaolo Bonzini                                       out_sg, out_num, virtio_net_tx_complete);
24856e790746SPaolo Bonzini         if (ret == 0) {
24866e790746SPaolo Bonzini             virtio_queue_set_notification(q->tx_vq, 0);
24876e790746SPaolo Bonzini             q->async_tx.elem = elem;
24886e790746SPaolo Bonzini             return -EBUSY;
24896e790746SPaolo Bonzini         }
24906e790746SPaolo Bonzini 
2491feb93f36SJason Wang drop:
249251b19ebeSPaolo Bonzini         virtqueue_push(q->tx_vq, elem, 0);
249317a0ca55SKONRAD Frederic         virtio_notify(vdev, q->tx_vq);
249451b19ebeSPaolo Bonzini         g_free(elem);
24956e790746SPaolo Bonzini 
24966e790746SPaolo Bonzini         if (++num_packets >= n->tx_burst) {
24976e790746SPaolo Bonzini             break;
24986e790746SPaolo Bonzini         }
24996e790746SPaolo Bonzini     }
25006e790746SPaolo Bonzini     return num_packets;
25016e790746SPaolo Bonzini }
25026e790746SPaolo Bonzini 
25036e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
25046e790746SPaolo Bonzini {
250517a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
25066e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
25076e790746SPaolo Bonzini 
2508283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2509283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2510283e2c2aSYuri Benditovich         return;
2511283e2c2aSYuri Benditovich     }
2512283e2c2aSYuri Benditovich 
25136e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
251417a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
25156e790746SPaolo Bonzini         q->tx_waiting = 1;
25166e790746SPaolo Bonzini         return;
25176e790746SPaolo Bonzini     }
25186e790746SPaolo Bonzini 
25196e790746SPaolo Bonzini     if (q->tx_waiting) {
25206e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 1);
2521bc72ad67SAlex Bligh         timer_del(q->tx_timer);
25226e790746SPaolo Bonzini         q->tx_waiting = 0;
2523fa5e56c2SGreg Kurz         if (virtio_net_flush_tx(q) == -EINVAL) {
2524fa5e56c2SGreg Kurz             return;
2525fa5e56c2SGreg Kurz         }
25266e790746SPaolo Bonzini     } else {
2527bc72ad67SAlex Bligh         timer_mod(q->tx_timer,
2528bc72ad67SAlex Bligh                        qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
25296e790746SPaolo Bonzini         q->tx_waiting = 1;
25306e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 0);
25316e790746SPaolo Bonzini     }
25326e790746SPaolo Bonzini }
25336e790746SPaolo Bonzini 
25346e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
25356e790746SPaolo Bonzini {
253617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
25376e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
25386e790746SPaolo Bonzini 
2539283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2540283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2541283e2c2aSYuri Benditovich         return;
2542283e2c2aSYuri Benditovich     }
2543283e2c2aSYuri Benditovich 
25446e790746SPaolo Bonzini     if (unlikely(q->tx_waiting)) {
25456e790746SPaolo Bonzini         return;
25466e790746SPaolo Bonzini     }
25476e790746SPaolo Bonzini     q->tx_waiting = 1;
25486e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
254917a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
25506e790746SPaolo Bonzini         return;
25516e790746SPaolo Bonzini     }
25526e790746SPaolo Bonzini     virtio_queue_set_notification(vq, 0);
25536e790746SPaolo Bonzini     qemu_bh_schedule(q->tx_bh);
25546e790746SPaolo Bonzini }
25556e790746SPaolo Bonzini 
25566e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque)
25576e790746SPaolo Bonzini {
25586e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
25596e790746SPaolo Bonzini     VirtIONet *n = q->n;
256017a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2561e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2562e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2563e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2564e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2565e8bcf842SMichael S. Tsirkin         return;
2566e8bcf842SMichael S. Tsirkin     }
25676e790746SPaolo Bonzini 
25686e790746SPaolo Bonzini     q->tx_waiting = 0;
25696e790746SPaolo Bonzini 
25706e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
257117a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
25726e790746SPaolo Bonzini         return;
257317a0ca55SKONRAD Frederic     }
25746e790746SPaolo Bonzini 
25756e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
25766e790746SPaolo Bonzini     virtio_net_flush_tx(q);
25776e790746SPaolo Bonzini }
25786e790746SPaolo Bonzini 
25796e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque)
25806e790746SPaolo Bonzini {
25816e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
25826e790746SPaolo Bonzini     VirtIONet *n = q->n;
258317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
25846e790746SPaolo Bonzini     int32_t ret;
25856e790746SPaolo Bonzini 
2586e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2587e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2588e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2589e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2590e8bcf842SMichael S. Tsirkin         return;
2591e8bcf842SMichael S. Tsirkin     }
25926e790746SPaolo Bonzini 
25936e790746SPaolo Bonzini     q->tx_waiting = 0;
25946e790746SPaolo Bonzini 
25956e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
259617a0ca55SKONRAD Frederic     if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
25976e790746SPaolo Bonzini         return;
259817a0ca55SKONRAD Frederic     }
25996e790746SPaolo Bonzini 
26006e790746SPaolo Bonzini     ret = virtio_net_flush_tx(q);
2601fa5e56c2SGreg Kurz     if (ret == -EBUSY || ret == -EINVAL) {
2602fa5e56c2SGreg Kurz         return; /* Notification re-enable handled by tx_complete or device
2603fa5e56c2SGreg Kurz                  * broken */
26046e790746SPaolo Bonzini     }
26056e790746SPaolo Bonzini 
26066e790746SPaolo Bonzini     /* If we flush a full burst of packets, assume there are
26076e790746SPaolo Bonzini      * more coming and immediately reschedule */
26086e790746SPaolo Bonzini     if (ret >= n->tx_burst) {
26096e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
26106e790746SPaolo Bonzini         q->tx_waiting = 1;
26116e790746SPaolo Bonzini         return;
26126e790746SPaolo Bonzini     }
26136e790746SPaolo Bonzini 
26146e790746SPaolo Bonzini     /* If less than a full burst, re-enable notification and flush
26156e790746SPaolo Bonzini      * anything that may have come in while we weren't looking.  If
26166e790746SPaolo Bonzini      * we find something, assume the guest is still active and reschedule */
26176e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2618fa5e56c2SGreg Kurz     ret = virtio_net_flush_tx(q);
2619fa5e56c2SGreg Kurz     if (ret == -EINVAL) {
2620fa5e56c2SGreg Kurz         return;
2621fa5e56c2SGreg Kurz     } else if (ret > 0) {
26226e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
26236e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
26246e790746SPaolo Bonzini         q->tx_waiting = 1;
26256e790746SPaolo Bonzini     }
26266e790746SPaolo Bonzini }
26276e790746SPaolo Bonzini 
2628f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index)
2629f9d6dbf0SWen Congyang {
2630f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2631f9d6dbf0SWen Congyang 
26321c0fbfa3SMichael S. Tsirkin     n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size,
26331c0fbfa3SMichael S. Tsirkin                                            virtio_net_handle_rx);
26349b02e161SWei Wang 
2635f9d6dbf0SWen Congyang     if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
2636f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
26379b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
26389b02e161SWei Wang                              virtio_net_handle_tx_timer);
2639f9d6dbf0SWen Congyang         n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
2640f9d6dbf0SWen Congyang                                               virtio_net_tx_timer,
2641f9d6dbf0SWen Congyang                                               &n->vqs[index]);
2642f9d6dbf0SWen Congyang     } else {
2643f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
26449b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
26459b02e161SWei Wang                              virtio_net_handle_tx_bh);
2646f9d6dbf0SWen Congyang         n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]);
2647f9d6dbf0SWen Congyang     }
2648f9d6dbf0SWen Congyang 
2649f9d6dbf0SWen Congyang     n->vqs[index].tx_waiting = 0;
2650f9d6dbf0SWen Congyang     n->vqs[index].n = n;
2651f9d6dbf0SWen Congyang }
2652f9d6dbf0SWen Congyang 
2653f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index)
2654f9d6dbf0SWen Congyang {
2655f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2656f9d6dbf0SWen Congyang     VirtIONetQueue *q = &n->vqs[index];
2657f9d6dbf0SWen Congyang     NetClientState *nc = qemu_get_subqueue(n->nic, index);
2658f9d6dbf0SWen Congyang 
2659f9d6dbf0SWen Congyang     qemu_purge_queued_packets(nc);
2660f9d6dbf0SWen Congyang 
2661f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2);
2662f9d6dbf0SWen Congyang     if (q->tx_timer) {
2663f9d6dbf0SWen Congyang         timer_del(q->tx_timer);
2664f9d6dbf0SWen Congyang         timer_free(q->tx_timer);
2665f989c30cSYunjian Wang         q->tx_timer = NULL;
2666f9d6dbf0SWen Congyang     } else {
2667f9d6dbf0SWen Congyang         qemu_bh_delete(q->tx_bh);
2668f989c30cSYunjian Wang         q->tx_bh = NULL;
2669f9d6dbf0SWen Congyang     }
2670f989c30cSYunjian Wang     q->tx_waiting = 0;
2671f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2 + 1);
2672f9d6dbf0SWen Congyang }
2673f9d6dbf0SWen Congyang 
2674f9d6dbf0SWen Congyang static void virtio_net_change_num_queues(VirtIONet *n, int new_max_queues)
2675f9d6dbf0SWen Congyang {
2676f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2677f9d6dbf0SWen Congyang     int old_num_queues = virtio_get_num_queues(vdev);
2678f9d6dbf0SWen Congyang     int new_num_queues = new_max_queues * 2 + 1;
2679f9d6dbf0SWen Congyang     int i;
2680f9d6dbf0SWen Congyang 
2681f9d6dbf0SWen Congyang     assert(old_num_queues >= 3);
2682f9d6dbf0SWen Congyang     assert(old_num_queues % 2 == 1);
2683f9d6dbf0SWen Congyang 
2684f9d6dbf0SWen Congyang     if (old_num_queues == new_num_queues) {
2685f9d6dbf0SWen Congyang         return;
2686f9d6dbf0SWen Congyang     }
2687f9d6dbf0SWen Congyang 
2688f9d6dbf0SWen Congyang     /*
2689f9d6dbf0SWen Congyang      * We always need to remove and add ctrl vq if
2690f9d6dbf0SWen Congyang      * old_num_queues != new_num_queues. Remove ctrl_vq first,
269120f86a75SYuval Shaia      * and then we only enter one of the following two loops.
2692f9d6dbf0SWen Congyang      */
2693f9d6dbf0SWen Congyang     virtio_del_queue(vdev, old_num_queues - 1);
2694f9d6dbf0SWen Congyang 
2695f9d6dbf0SWen Congyang     for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) {
2696f9d6dbf0SWen Congyang         /* new_num_queues < old_num_queues */
2697f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i / 2);
2698f9d6dbf0SWen Congyang     }
2699f9d6dbf0SWen Congyang 
2700f9d6dbf0SWen Congyang     for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) {
2701f9d6dbf0SWen Congyang         /* new_num_queues > old_num_queues */
2702f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i / 2);
2703f9d6dbf0SWen Congyang     }
2704f9d6dbf0SWen Congyang 
2705f9d6dbf0SWen Congyang     /* add ctrl_vq last */
2706f9d6dbf0SWen Congyang     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
2707f9d6dbf0SWen Congyang }
2708f9d6dbf0SWen Congyang 
2709ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
27106e790746SPaolo Bonzini {
2711f9d6dbf0SWen Congyang     int max = multiqueue ? n->max_queues : 1;
2712f9d6dbf0SWen Congyang 
27136e790746SPaolo Bonzini     n->multiqueue = multiqueue;
2714f9d6dbf0SWen Congyang     virtio_net_change_num_queues(n, max);
27156e790746SPaolo Bonzini 
27166e790746SPaolo Bonzini     virtio_net_set_queues(n);
27176e790746SPaolo Bonzini }
27186e790746SPaolo Bonzini 
2719982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id)
2720037dab2fSGreg Kurz {
2721982b78c5SDr. David Alan Gilbert     VirtIONet *n = opaque;
2722982b78c5SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2723037dab2fSGreg Kurz     int i, link_down;
2724037dab2fSGreg Kurz 
27259d8c6a25SDr. David Alan Gilbert     trace_virtio_net_post_load_device();
2726982b78c5SDr. David Alan Gilbert     virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs,
272795129d6fSCornelia Huck                                virtio_vdev_has_feature(vdev,
2728e22f0603SYuri Benditovich                                                        VIRTIO_F_VERSION_1),
2729e22f0603SYuri Benditovich                                virtio_vdev_has_feature(vdev,
2730e22f0603SYuri Benditovich                                                        VIRTIO_NET_F_HASH_REPORT));
27316e790746SPaolo Bonzini 
27326e790746SPaolo Bonzini     /* MAC_TABLE_ENTRIES may be different from the saved image */
2733982b78c5SDr. David Alan Gilbert     if (n->mac_table.in_use > MAC_TABLE_ENTRIES) {
27346e790746SPaolo Bonzini         n->mac_table.in_use = 0;
27356e790746SPaolo Bonzini     }
27366e790746SPaolo Bonzini 
2737982b78c5SDr. David Alan Gilbert     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
27386c666823SMichael S. Tsirkin         n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
27396c666823SMichael S. Tsirkin     }
27406c666823SMichael S. Tsirkin 
27417788c3f2SMikhail Sennikovsky     /*
27427788c3f2SMikhail Sennikovsky      * curr_guest_offloads will be later overwritten by the
27437788c3f2SMikhail Sennikovsky      * virtio_set_features_nocheck call done from the virtio_load.
27447788c3f2SMikhail Sennikovsky      * Here we make sure it is preserved and restored accordingly
27457788c3f2SMikhail Sennikovsky      * in the virtio_net_post_load_virtio callback.
27467788c3f2SMikhail Sennikovsky      */
27477788c3f2SMikhail Sennikovsky     n->saved_guest_offloads = n->curr_guest_offloads;
27486c666823SMichael S. Tsirkin 
27496e790746SPaolo Bonzini     virtio_net_set_queues(n);
27506e790746SPaolo Bonzini 
27516e790746SPaolo Bonzini     /* Find the first multicast entry in the saved MAC filter */
27526e790746SPaolo Bonzini     for (i = 0; i < n->mac_table.in_use; i++) {
27536e790746SPaolo Bonzini         if (n->mac_table.macs[i * ETH_ALEN] & 1) {
27546e790746SPaolo Bonzini             break;
27556e790746SPaolo Bonzini         }
27566e790746SPaolo Bonzini     }
27576e790746SPaolo Bonzini     n->mac_table.first_multi = i;
27586e790746SPaolo Bonzini 
27596e790746SPaolo Bonzini     /* nc.link_down can't be migrated, so infer link_down according
27606e790746SPaolo Bonzini      * to link status bit in n->status */
27616e790746SPaolo Bonzini     link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
27626e790746SPaolo Bonzini     for (i = 0; i < n->max_queues; i++) {
27636e790746SPaolo Bonzini         qemu_get_subqueue(n->nic, i)->link_down = link_down;
27646e790746SPaolo Bonzini     }
27656e790746SPaolo Bonzini 
27666c666823SMichael S. Tsirkin     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
27676c666823SMichael S. Tsirkin         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
27689d8c6a25SDr. David Alan Gilbert         qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
27699d8c6a25SDr. David Alan Gilbert                                   QEMU_CLOCK_VIRTUAL,
27709d8c6a25SDr. David Alan Gilbert                                   virtio_net_announce_timer, n);
27719d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
27729d8c6a25SDr. David Alan Gilbert             timer_mod(n->announce_timer.tm,
27739d8c6a25SDr. David Alan Gilbert                       qemu_clock_get_ms(n->announce_timer.type));
27749d8c6a25SDr. David Alan Gilbert         } else {
2775944458b6SDr. David Alan Gilbert             qemu_announce_timer_del(&n->announce_timer, false);
27769d8c6a25SDr. David Alan Gilbert         }
27776c666823SMichael S. Tsirkin     }
27786c666823SMichael S. Tsirkin 
2779e41b7114SYuri Benditovich     if (n->rss_data.enabled) {
2780e41b7114SYuri Benditovich         trace_virtio_net_rss_enable(n->rss_data.hash_types,
2781e41b7114SYuri Benditovich                                     n->rss_data.indirections_len,
2782e41b7114SYuri Benditovich                                     sizeof(n->rss_data.key));
2783e41b7114SYuri Benditovich     } else {
2784e41b7114SYuri Benditovich         trace_virtio_net_rss_disable();
2785e41b7114SYuri Benditovich     }
27866e790746SPaolo Bonzini     return 0;
27876e790746SPaolo Bonzini }
27886e790746SPaolo Bonzini 
27897788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev)
27907788c3f2SMikhail Sennikovsky {
27917788c3f2SMikhail Sennikovsky     VirtIONet *n = VIRTIO_NET(vdev);
27927788c3f2SMikhail Sennikovsky     /*
27937788c3f2SMikhail Sennikovsky      * The actual needed state is now in saved_guest_offloads,
27947788c3f2SMikhail Sennikovsky      * see virtio_net_post_load_device for detail.
27957788c3f2SMikhail Sennikovsky      * Restore it back and apply the desired offloads.
27967788c3f2SMikhail Sennikovsky      */
27977788c3f2SMikhail Sennikovsky     n->curr_guest_offloads = n->saved_guest_offloads;
27987788c3f2SMikhail Sennikovsky     if (peer_has_vnet_hdr(n)) {
27997788c3f2SMikhail Sennikovsky         virtio_net_apply_guest_offloads(n);
28007788c3f2SMikhail Sennikovsky     }
28017788c3f2SMikhail Sennikovsky 
28027788c3f2SMikhail Sennikovsky     return 0;
28037788c3f2SMikhail Sennikovsky }
28047788c3f2SMikhail Sennikovsky 
2805982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */
2806982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = {
2807982b78c5SDr. David Alan Gilbert     .name = "virtio-net-queue-tx_waiting",
2808982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
2809982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(tx_waiting, VirtIONetQueue),
2810982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2811982b78c5SDr. David Alan Gilbert    },
2812982b78c5SDr. David Alan Gilbert };
2813982b78c5SDr. David Alan Gilbert 
2814982b78c5SDr. David Alan Gilbert static bool max_queues_gt_1(void *opaque, int version_id)
2815982b78c5SDr. David Alan Gilbert {
2816982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->max_queues > 1;
2817982b78c5SDr. David Alan Gilbert }
2818982b78c5SDr. David Alan Gilbert 
2819982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id)
2820982b78c5SDr. David Alan Gilbert {
2821982b78c5SDr. David Alan Gilbert     return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque),
2822982b78c5SDr. David Alan Gilbert                                    VIRTIO_NET_F_CTRL_GUEST_OFFLOADS);
2823982b78c5SDr. David Alan Gilbert }
2824982b78c5SDr. David Alan Gilbert 
2825982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id)
2826982b78c5SDr. David Alan Gilbert {
2827982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES;
2828982b78c5SDr. David Alan Gilbert }
2829982b78c5SDr. David Alan Gilbert 
2830982b78c5SDr. David Alan Gilbert static bool mac_table_doesnt_fit(void *opaque, int version_id)
2831982b78c5SDr. David Alan Gilbert {
2832982b78c5SDr. David Alan Gilbert     return !mac_table_fits(opaque, version_id);
2833982b78c5SDr. David Alan Gilbert }
2834982b78c5SDr. David Alan Gilbert 
2835982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods
2836982b78c5SDr. David Alan Gilbert  * although only some fields are used by each.
2837982b78c5SDr. David Alan Gilbert  */
2838982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp {
2839982b78c5SDr. David Alan Gilbert     VirtIONet      *parent;
2840982b78c5SDr. David Alan Gilbert     VirtIONetQueue *vqs_1;
2841982b78c5SDr. David Alan Gilbert     uint16_t        curr_queues_1;
2842982b78c5SDr. David Alan Gilbert     uint8_t         has_ufo;
2843982b78c5SDr. David Alan Gilbert     uint32_t        has_vnet_hdr;
2844982b78c5SDr. David Alan Gilbert };
2845982b78c5SDr. David Alan Gilbert 
2846982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than
2847982b78c5SDr. David Alan Gilbert  * the 1st entry in the queues and only if there's more than one
2848982b78c5SDr. David Alan Gilbert  * entry.  We use the tmp mechanism to calculate a temporary
2849982b78c5SDr. David Alan Gilbert  * pointer and count and also validate the count.
2850982b78c5SDr. David Alan Gilbert  */
2851982b78c5SDr. David Alan Gilbert 
285244b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque)
2853982b78c5SDr. David Alan Gilbert {
2854982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2855982b78c5SDr. David Alan Gilbert 
2856982b78c5SDr. David Alan Gilbert     tmp->vqs_1 = tmp->parent->vqs + 1;
2857982b78c5SDr. David Alan Gilbert     tmp->curr_queues_1 = tmp->parent->curr_queues - 1;
2858982b78c5SDr. David Alan Gilbert     if (tmp->parent->curr_queues == 0) {
2859982b78c5SDr. David Alan Gilbert         tmp->curr_queues_1 = 0;
2860982b78c5SDr. David Alan Gilbert     }
286144b1ff31SDr. David Alan Gilbert 
286244b1ff31SDr. David Alan Gilbert     return 0;
2863982b78c5SDr. David Alan Gilbert }
2864982b78c5SDr. David Alan Gilbert 
2865982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque)
2866982b78c5SDr. David Alan Gilbert {
2867982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2868982b78c5SDr. David Alan Gilbert 
2869982b78c5SDr. David Alan Gilbert     /* Reuse the pointer setup from save */
2870982b78c5SDr. David Alan Gilbert     virtio_net_tx_waiting_pre_save(opaque);
2871982b78c5SDr. David Alan Gilbert 
2872982b78c5SDr. David Alan Gilbert     if (tmp->parent->curr_queues > tmp->parent->max_queues) {
2873982b78c5SDr. David Alan Gilbert         error_report("virtio-net: curr_queues %x > max_queues %x",
2874982b78c5SDr. David Alan Gilbert             tmp->parent->curr_queues, tmp->parent->max_queues);
2875982b78c5SDr. David Alan Gilbert 
2876982b78c5SDr. David Alan Gilbert         return -EINVAL;
2877982b78c5SDr. David Alan Gilbert     }
2878982b78c5SDr. David Alan Gilbert 
2879982b78c5SDr. David Alan Gilbert     return 0; /* all good */
2880982b78c5SDr. David Alan Gilbert }
2881982b78c5SDr. David Alan Gilbert 
2882982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = {
2883982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-tx_waiting",
2884982b78c5SDr. David Alan Gilbert     .pre_load  = virtio_net_tx_waiting_pre_load,
2885982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_tx_waiting_pre_save,
2886982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2887982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp,
2888982b78c5SDr. David Alan Gilbert                                      curr_queues_1,
2889982b78c5SDr. David Alan Gilbert                                      vmstate_virtio_net_queue_tx_waiting,
2890982b78c5SDr. David Alan Gilbert                                      struct VirtIONetQueue),
2891982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2892982b78c5SDr. David Alan Gilbert     },
2893982b78c5SDr. David Alan Gilbert };
2894982b78c5SDr. David Alan Gilbert 
2895982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the
2896982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
2897982b78c5SDr. David Alan Gilbert  */
2898982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id)
2899982b78c5SDr. David Alan Gilbert {
2900982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2901982b78c5SDr. David Alan Gilbert 
2902982b78c5SDr. David Alan Gilbert     if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) {
2903982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires TUN_F_UFO support");
2904982b78c5SDr. David Alan Gilbert         return -EINVAL;
2905982b78c5SDr. David Alan Gilbert     }
2906982b78c5SDr. David Alan Gilbert 
2907982b78c5SDr. David Alan Gilbert     return 0;
2908982b78c5SDr. David Alan Gilbert }
2909982b78c5SDr. David Alan Gilbert 
291044b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque)
2911982b78c5SDr. David Alan Gilbert {
2912982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2913982b78c5SDr. David Alan Gilbert 
2914982b78c5SDr. David Alan Gilbert     tmp->has_ufo = tmp->parent->has_ufo;
291544b1ff31SDr. David Alan Gilbert 
291644b1ff31SDr. David Alan Gilbert     return 0;
2917982b78c5SDr. David Alan Gilbert }
2918982b78c5SDr. David Alan Gilbert 
2919982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = {
2920982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-ufo",
2921982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_ufo_post_load,
2922982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_ufo_pre_save,
2923982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2924982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp),
2925982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2926982b78c5SDr. David Alan Gilbert     },
2927982b78c5SDr. David Alan Gilbert };
2928982b78c5SDr. David Alan Gilbert 
2929982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the
2930982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
2931982b78c5SDr. David Alan Gilbert  */
2932982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id)
2933982b78c5SDr. David Alan Gilbert {
2934982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2935982b78c5SDr. David Alan Gilbert 
2936982b78c5SDr. David Alan Gilbert     if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) {
2937982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires vnet_hdr=on");
2938982b78c5SDr. David Alan Gilbert         return -EINVAL;
2939982b78c5SDr. David Alan Gilbert     }
2940982b78c5SDr. David Alan Gilbert 
2941982b78c5SDr. David Alan Gilbert     return 0;
2942982b78c5SDr. David Alan Gilbert }
2943982b78c5SDr. David Alan Gilbert 
294444b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque)
2945982b78c5SDr. David Alan Gilbert {
2946982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
2947982b78c5SDr. David Alan Gilbert 
2948982b78c5SDr. David Alan Gilbert     tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr;
294944b1ff31SDr. David Alan Gilbert 
295044b1ff31SDr. David Alan Gilbert     return 0;
2951982b78c5SDr. David Alan Gilbert }
2952982b78c5SDr. David Alan Gilbert 
2953982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = {
2954982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-vnet",
2955982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_vnet_post_load,
2956982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_vnet_pre_save,
2957982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
2958982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp),
2959982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2960982b78c5SDr. David Alan Gilbert     },
2961982b78c5SDr. David Alan Gilbert };
2962982b78c5SDr. David Alan Gilbert 
2963e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque)
2964e41b7114SYuri Benditovich {
2965e41b7114SYuri Benditovich     return VIRTIO_NET(opaque)->rss_data.enabled;
2966e41b7114SYuri Benditovich }
2967e41b7114SYuri Benditovich 
2968e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = {
2969e41b7114SYuri Benditovich     .name      = "virtio-net-device/rss",
2970e41b7114SYuri Benditovich     .version_id = 1,
2971e41b7114SYuri Benditovich     .minimum_version_id = 1,
2972e41b7114SYuri Benditovich     .needed = virtio_net_rss_needed,
2973e41b7114SYuri Benditovich     .fields = (VMStateField[]) {
2974e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.enabled, VirtIONet),
2975e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.redirect, VirtIONet),
2976e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.populate_hash, VirtIONet),
2977e41b7114SYuri Benditovich         VMSTATE_UINT32(rss_data.hash_types, VirtIONet),
2978e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.indirections_len, VirtIONet),
2979e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.default_queue, VirtIONet),
2980e41b7114SYuri Benditovich         VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet,
2981e41b7114SYuri Benditovich                             VIRTIO_NET_RSS_MAX_KEY_SIZE),
2982e41b7114SYuri Benditovich         VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet,
2983e41b7114SYuri Benditovich                                     rss_data.indirections_len, 0,
2984e41b7114SYuri Benditovich                                     vmstate_info_uint16, uint16_t),
2985e41b7114SYuri Benditovich         VMSTATE_END_OF_LIST()
2986e41b7114SYuri Benditovich     },
2987e41b7114SYuri Benditovich };
2988e41b7114SYuri Benditovich 
2989982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = {
2990982b78c5SDr. David Alan Gilbert     .name = "virtio-net-device",
2991982b78c5SDr. David Alan Gilbert     .version_id = VIRTIO_NET_VM_VERSION,
2992982b78c5SDr. David Alan Gilbert     .minimum_version_id = VIRTIO_NET_VM_VERSION,
2993982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_post_load_device,
2994982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
2995982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN),
2996982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_POINTER(vqs, VirtIONet,
2997982b78c5SDr. David Alan Gilbert                                vmstate_virtio_net_queue_tx_waiting,
2998982b78c5SDr. David Alan Gilbert                                VirtIONetQueue),
2999982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet),
3000982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16(status, VirtIONet),
3001982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(promisc, VirtIONet),
3002982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(allmulti, VirtIONet),
3003982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mac_table.in_use, VirtIONet),
3004982b78c5SDr. David Alan Gilbert 
3005982b78c5SDr. David Alan Gilbert         /* Guarded pair: If it fits we load it, else we throw it away
3006982b78c5SDr. David Alan Gilbert          * - can happen if source has a larger MAC table.; post-load
3007982b78c5SDr. David Alan Gilbert          *  sets flags in this case.
3008982b78c5SDr. David Alan Gilbert          */
3009982b78c5SDr. David Alan Gilbert         VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet,
3010982b78c5SDr. David Alan Gilbert                                 0, mac_table_fits, mac_table.in_use,
3011982b78c5SDr. David Alan Gilbert                                  ETH_ALEN),
3012982b78c5SDr. David Alan Gilbert         VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0,
3013982b78c5SDr. David Alan Gilbert                                      mac_table.in_use, ETH_ALEN),
3014982b78c5SDr. David Alan Gilbert 
3015982b78c5SDr. David Alan Gilbert         /* Note: This is an array of uint32's that's always been saved as a
3016982b78c5SDr. David Alan Gilbert          * buffer; hold onto your endiannesses; it's actually used as a bitmap
3017982b78c5SDr. David Alan Gilbert          * but based on the uint.
3018982b78c5SDr. David Alan Gilbert          */
3019982b78c5SDr. David Alan Gilbert         VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3),
3020982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3021982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_vnet),
3022982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet),
3023982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet),
3024982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(alluni, VirtIONet),
3025982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nomulti, VirtIONet),
3026982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nouni, VirtIONet),
3027982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nobcast, VirtIONet),
3028982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3029982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_ufo),
3030982b78c5SDr. David Alan Gilbert         VMSTATE_SINGLE_TEST(max_queues, VirtIONet, max_queues_gt_1, 0,
3031982b78c5SDr. David Alan Gilbert                             vmstate_info_uint16_equal, uint16_t),
3032982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16_TEST(curr_queues, VirtIONet, max_queues_gt_1),
3033982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3034982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_tx_waiting),
3035982b78c5SDr. David Alan Gilbert         VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet,
3036982b78c5SDr. David Alan Gilbert                             has_ctrl_guest_offloads),
3037982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3038982b78c5SDr. David Alan Gilbert    },
3039e41b7114SYuri Benditovich     .subsections = (const VMStateDescription * []) {
3040e41b7114SYuri Benditovich         &vmstate_virtio_net_rss,
3041e41b7114SYuri Benditovich         NULL
3042e41b7114SYuri Benditovich     }
3043982b78c5SDr. David Alan Gilbert };
3044982b78c5SDr. David Alan Gilbert 
30456e790746SPaolo Bonzini static NetClientInfo net_virtio_info = {
3046f394b2e2SEric Blake     .type = NET_CLIENT_DRIVER_NIC,
30476e790746SPaolo Bonzini     .size = sizeof(NICState),
30486e790746SPaolo Bonzini     .can_receive = virtio_net_can_receive,
30496e790746SPaolo Bonzini     .receive = virtio_net_receive,
30506e790746SPaolo Bonzini     .link_status_changed = virtio_net_set_link_status,
3051b1be4280SAmos Kong     .query_rx_filter = virtio_net_query_rxfilter,
3052b2c929f0SDr. David Alan Gilbert     .announce = virtio_net_announce,
30536e790746SPaolo Bonzini };
30546e790746SPaolo Bonzini 
30556e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
30566e790746SPaolo Bonzini {
305717a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
30586e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
30596e790746SPaolo Bonzini     assert(n->vhost_started);
3060ed8b4afeSNikolay Nikolaev     return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx);
30616e790746SPaolo Bonzini }
30626e790746SPaolo Bonzini 
30636e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
30646e790746SPaolo Bonzini                                            bool mask)
30656e790746SPaolo Bonzini {
306617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
30676e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
30686e790746SPaolo Bonzini     assert(n->vhost_started);
3069ed8b4afeSNikolay Nikolaev     vhost_net_virtqueue_mask(get_vhost_net(nc->peer),
30706e790746SPaolo Bonzini                              vdev, idx, mask);
30716e790746SPaolo Bonzini }
30726e790746SPaolo Bonzini 
3073019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features)
30746e790746SPaolo Bonzini {
30750cd09c3aSCornelia Huck     virtio_add_feature(&host_features, VIRTIO_NET_F_MAC);
3076a93e599dSMaxime Coquelin 
3077ba550851SStefano Garzarella     n->config_size = virtio_feature_get_config_size(feature_sizes,
3078ba550851SStefano Garzarella                                                     host_features);
307917ec5a86SKONRAD Frederic }
30806e790746SPaolo Bonzini 
30818a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
30828a253ec2SKONRAD Frederic                                    const char *type)
30838a253ec2SKONRAD Frederic {
30848a253ec2SKONRAD Frederic     /*
30858a253ec2SKONRAD Frederic      * The name can be NULL, the netclient name will be type.x.
30868a253ec2SKONRAD Frederic      */
30878a253ec2SKONRAD Frederic     assert(type != NULL);
30888a253ec2SKONRAD Frederic 
30898a253ec2SKONRAD Frederic     g_free(n->netclient_name);
30908a253ec2SKONRAD Frederic     g_free(n->netclient_type);
30918a253ec2SKONRAD Frederic     n->netclient_name = g_strdup(name);
30928a253ec2SKONRAD Frederic     n->netclient_type = g_strdup(type);
30938a253ec2SKONRAD Frederic }
30948a253ec2SKONRAD Frederic 
30959711cd0dSJens Freimann static bool failover_unplug_primary(VirtIONet *n)
30969711cd0dSJens Freimann {
30979711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
30989711cd0dSJens Freimann     PCIDevice *pci_dev;
30999711cd0dSJens Freimann     Error *err = NULL;
31009711cd0dSJens Freimann 
31019711cd0dSJens Freimann     hotplug_ctrl = qdev_get_hotplug_handler(n->primary_dev);
31029711cd0dSJens Freimann     if (hotplug_ctrl) {
31039711cd0dSJens Freimann         pci_dev = PCI_DEVICE(n->primary_dev);
31049711cd0dSJens Freimann         pci_dev->partially_hotplugged = true;
31059711cd0dSJens Freimann         hotplug_handler_unplug_request(hotplug_ctrl, n->primary_dev, &err);
31069711cd0dSJens Freimann         if (err) {
31079711cd0dSJens Freimann             error_report_err(err);
31089711cd0dSJens Freimann             return false;
31099711cd0dSJens Freimann         }
31109711cd0dSJens Freimann     } else {
31119711cd0dSJens Freimann         return false;
31129711cd0dSJens Freimann     }
31139711cd0dSJens Freimann     return true;
31149711cd0dSJens Freimann }
31159711cd0dSJens Freimann 
31169711cd0dSJens Freimann static bool failover_replug_primary(VirtIONet *n, Error **errp)
31179711cd0dSJens Freimann {
31185a0948d3SMarkus Armbruster     Error *err = NULL;
31199711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
31209711cd0dSJens Freimann     PCIDevice *pdev = PCI_DEVICE(n->primary_dev);
31219711cd0dSJens Freimann 
31229711cd0dSJens Freimann     if (!pdev->partially_hotplugged) {
31239711cd0dSJens Freimann         return true;
31249711cd0dSJens Freimann     }
31259711cd0dSJens Freimann     if (!n->primary_device_opts) {
31269711cd0dSJens Freimann         n->primary_device_opts = qemu_opts_from_qdict(
31279711cd0dSJens Freimann                 qemu_find_opts("device"),
31289711cd0dSJens Freimann                 n->primary_device_dict, errp);
3129150ab54aSJens Freimann         if (!n->primary_device_opts) {
31305a0948d3SMarkus Armbruster             return false;
31319711cd0dSJens Freimann         }
3132150ab54aSJens Freimann     }
31339711cd0dSJens Freimann     n->primary_bus = n->primary_dev->parent_bus;
3134150ab54aSJens Freimann     if (!n->primary_bus) {
3135150ab54aSJens Freimann         error_setg(errp, "virtio_net: couldn't find primary bus");
31365a0948d3SMarkus Armbruster         return false;
31379711cd0dSJens Freimann     }
31389711cd0dSJens Freimann     qdev_set_parent_bus(n->primary_dev, n->primary_bus);
31399711cd0dSJens Freimann     n->primary_should_be_hidden = false;
31409711cd0dSJens Freimann     qemu_opt_set_bool(n->primary_device_opts,
31415a0948d3SMarkus Armbruster                       "partially_hotplugged", true, &err);
31425a0948d3SMarkus Armbruster     if (err) {
31435a0948d3SMarkus Armbruster         goto out;
31445a0948d3SMarkus Armbruster     }
31459711cd0dSJens Freimann     hotplug_ctrl = qdev_get_hotplug_handler(n->primary_dev);
31469711cd0dSJens Freimann     if (hotplug_ctrl) {
31475a0948d3SMarkus Armbruster         hotplug_handler_pre_plug(hotplug_ctrl, n->primary_dev, &err);
31485a0948d3SMarkus Armbruster         if (err) {
31495a0948d3SMarkus Armbruster             goto out;
31505a0948d3SMarkus Armbruster         }
31519711cd0dSJens Freimann         hotplug_handler_plug(hotplug_ctrl, n->primary_dev, errp);
31529711cd0dSJens Freimann     }
3153150ab54aSJens Freimann 
3154150ab54aSJens Freimann out:
31555a0948d3SMarkus Armbruster     error_propagate(errp, err);
31565a0948d3SMarkus Armbruster     return !err;
31579711cd0dSJens Freimann }
31589711cd0dSJens Freimann 
31599711cd0dSJens Freimann static void virtio_net_handle_migration_primary(VirtIONet *n,
31609711cd0dSJens Freimann                                                 MigrationState *s)
31619711cd0dSJens Freimann {
31629711cd0dSJens Freimann     bool should_be_hidden;
31639711cd0dSJens Freimann     Error *err = NULL;
31649711cd0dSJens Freimann 
31659711cd0dSJens Freimann     should_be_hidden = atomic_read(&n->primary_should_be_hidden);
31669711cd0dSJens Freimann 
31679711cd0dSJens Freimann     if (!n->primary_dev) {
31689711cd0dSJens Freimann         n->primary_dev = virtio_connect_failover_devices(n, n->qdev, &err);
31699711cd0dSJens Freimann         if (!n->primary_dev) {
31709711cd0dSJens Freimann             return;
31719711cd0dSJens Freimann         }
31729711cd0dSJens Freimann     }
31739711cd0dSJens Freimann 
31744dbac1aeSMarkus Armbruster     if (migration_in_setup(s) && !should_be_hidden) {
31759711cd0dSJens Freimann         if (failover_unplug_primary(n)) {
31763cad405bSMarc-André Lureau             vmstate_unregister(VMSTATE_IF(n->primary_dev),
31773cad405bSMarc-André Lureau                     qdev_get_vmsd(n->primary_dev),
31789711cd0dSJens Freimann                     n->primary_dev);
31799711cd0dSJens Freimann             qapi_event_send_unplug_primary(n->primary_device_id);
31809711cd0dSJens Freimann             atomic_set(&n->primary_should_be_hidden, true);
31819711cd0dSJens Freimann         } else {
31829711cd0dSJens Freimann             warn_report("couldn't unplug primary device");
31839711cd0dSJens Freimann         }
31849711cd0dSJens Freimann     } else if (migration_has_failed(s)) {
3185150ab54aSJens Freimann         /* We already unplugged the device let's plug it back */
31869711cd0dSJens Freimann         if (!failover_replug_primary(n, &err)) {
31879711cd0dSJens Freimann             if (err) {
31889711cd0dSJens Freimann                 error_report_err(err);
31899711cd0dSJens Freimann             }
31909711cd0dSJens Freimann         }
31919711cd0dSJens Freimann     }
31929711cd0dSJens Freimann }
31939711cd0dSJens Freimann 
31949711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data)
31959711cd0dSJens Freimann {
31969711cd0dSJens Freimann     MigrationState *s = data;
31979711cd0dSJens Freimann     VirtIONet *n = container_of(notifier, VirtIONet, migration_state);
31989711cd0dSJens Freimann     virtio_net_handle_migration_primary(n, s);
31999711cd0dSJens Freimann }
32009711cd0dSJens Freimann 
32019711cd0dSJens Freimann static int virtio_net_primary_should_be_hidden(DeviceListener *listener,
32029711cd0dSJens Freimann             QemuOpts *device_opts)
32039711cd0dSJens Freimann {
32049711cd0dSJens Freimann     VirtIONet *n = container_of(listener, VirtIONet, primary_listener);
32054d0e59acSJens Freimann     bool match_found = false;
32064d0e59acSJens Freimann     bool hide = false;
32079711cd0dSJens Freimann 
32084d0e59acSJens Freimann     if (!device_opts) {
32094d0e59acSJens Freimann         return -1;
32104d0e59acSJens Freimann     }
32119711cd0dSJens Freimann     n->primary_device_dict = qemu_opts_to_qdict(device_opts,
32129711cd0dSJens Freimann             n->primary_device_dict);
32139711cd0dSJens Freimann     if (n->primary_device_dict) {
32149711cd0dSJens Freimann         g_free(n->standby_id);
32159711cd0dSJens Freimann         n->standby_id = g_strdup(qdict_get_try_str(n->primary_device_dict,
32169711cd0dSJens Freimann                     "failover_pair_id"));
32179711cd0dSJens Freimann     }
32184d0e59acSJens Freimann     if (g_strcmp0(n->standby_id, n->netclient_name) == 0) {
32199711cd0dSJens Freimann         match_found = true;
32209711cd0dSJens Freimann     } else {
32219711cd0dSJens Freimann         match_found = false;
32229711cd0dSJens Freimann         hide = false;
32239711cd0dSJens Freimann         g_free(n->standby_id);
32249711cd0dSJens Freimann         n->primary_device_dict = NULL;
32259711cd0dSJens Freimann         goto out;
32269711cd0dSJens Freimann     }
32279711cd0dSJens Freimann 
32289711cd0dSJens Freimann     n->primary_device_opts = device_opts;
32299711cd0dSJens Freimann 
32309711cd0dSJens Freimann     /* primary_should_be_hidden is set during feature negotiation */
32319711cd0dSJens Freimann     hide = atomic_read(&n->primary_should_be_hidden);
32329711cd0dSJens Freimann 
32339711cd0dSJens Freimann     if (n->primary_device_dict) {
32349711cd0dSJens Freimann         g_free(n->primary_device_id);
32359711cd0dSJens Freimann         n->primary_device_id = g_strdup(qdict_get_try_str(
32369711cd0dSJens Freimann                     n->primary_device_dict, "id"));
32379711cd0dSJens Freimann         if (!n->primary_device_id) {
32389711cd0dSJens Freimann             warn_report("primary_device_id not set");
32399711cd0dSJens Freimann         }
32409711cd0dSJens Freimann     }
32419711cd0dSJens Freimann 
32429711cd0dSJens Freimann out:
32439711cd0dSJens Freimann     if (match_found && hide) {
32449711cd0dSJens Freimann         return 1;
32459711cd0dSJens Freimann     } else if (match_found && !hide) {
32469711cd0dSJens Freimann         return 0;
32479711cd0dSJens Freimann     } else {
32489711cd0dSJens Freimann         return -1;
32499711cd0dSJens Freimann     }
32509711cd0dSJens Freimann }
32519711cd0dSJens Freimann 
3252e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp)
325317ec5a86SKONRAD Frederic {
3254e6f746b3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3255284a32f0SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3256284a32f0SAndreas Färber     NetClientState *nc;
32571773d9eeSKONRAD Frederic     int i;
325817ec5a86SKONRAD Frederic 
3259a93e599dSMaxime Coquelin     if (n->net_conf.mtu) {
3260127833eeSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_MTU);
3261a93e599dSMaxime Coquelin     }
3262a93e599dSMaxime Coquelin 
32639473939eSJason Baron     if (n->net_conf.duplex_str) {
32649473939eSJason Baron         if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) {
32659473939eSJason Baron             n->net_conf.duplex = DUPLEX_HALF;
32669473939eSJason Baron         } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) {
32679473939eSJason Baron             n->net_conf.duplex = DUPLEX_FULL;
32689473939eSJason Baron         } else {
32699473939eSJason Baron             error_setg(errp, "'duplex' must be 'half' or 'full'");
3270843c4cfcSMarkus Armbruster             return;
32719473939eSJason Baron         }
32729473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
32739473939eSJason Baron     } else {
32749473939eSJason Baron         n->net_conf.duplex = DUPLEX_UNKNOWN;
32759473939eSJason Baron     }
32769473939eSJason Baron 
32779473939eSJason Baron     if (n->net_conf.speed < SPEED_UNKNOWN) {
32789473939eSJason Baron         error_setg(errp, "'speed' must be between 0 and INT_MAX");
3279843c4cfcSMarkus Armbruster         return;
3280843c4cfcSMarkus Armbruster     }
3281843c4cfcSMarkus Armbruster     if (n->net_conf.speed >= 0) {
32829473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
32839473939eSJason Baron     }
32849473939eSJason Baron 
32859711cd0dSJens Freimann     if (n->failover) {
32869711cd0dSJens Freimann         n->primary_listener.should_be_hidden =
32879711cd0dSJens Freimann             virtio_net_primary_should_be_hidden;
32889711cd0dSJens Freimann         atomic_set(&n->primary_should_be_hidden, true);
32899711cd0dSJens Freimann         device_listener_register(&n->primary_listener);
32909711cd0dSJens Freimann         n->migration_state.notify = virtio_net_migration_state_notifier;
32919711cd0dSJens Freimann         add_migration_state_change_notifier(&n->migration_state);
32929711cd0dSJens Freimann         n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY);
32939711cd0dSJens Freimann     }
32949711cd0dSJens Freimann 
3295da3e8a23SShannon Zhao     virtio_net_set_config_size(n, n->host_features);
3296284a32f0SAndreas Färber     virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size);
329717ec5a86SKONRAD Frederic 
32981c0fbfa3SMichael S. Tsirkin     /*
32991c0fbfa3SMichael S. Tsirkin      * We set a lower limit on RX queue size to what it always was.
33001c0fbfa3SMichael S. Tsirkin      * Guests that want a smaller ring can always resize it without
33011c0fbfa3SMichael S. Tsirkin      * help from us (using virtio 1 and up).
33021c0fbfa3SMichael S. Tsirkin      */
33031c0fbfa3SMichael S. Tsirkin     if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE ||
33041c0fbfa3SMichael S. Tsirkin         n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE ||
33055f997fd1SMichal Privoznik         !is_power_of_2(n->net_conf.rx_queue_size)) {
33061c0fbfa3SMichael S. Tsirkin         error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), "
33071c0fbfa3SMichael S. Tsirkin                    "must be a power of 2 between %d and %d.",
33081c0fbfa3SMichael S. Tsirkin                    n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE,
33091c0fbfa3SMichael S. Tsirkin                    VIRTQUEUE_MAX_SIZE);
33101c0fbfa3SMichael S. Tsirkin         virtio_cleanup(vdev);
33111c0fbfa3SMichael S. Tsirkin         return;
33121c0fbfa3SMichael S. Tsirkin     }
33131c0fbfa3SMichael S. Tsirkin 
33149b02e161SWei Wang     if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE ||
33159b02e161SWei Wang         n->net_conf.tx_queue_size > VIRTQUEUE_MAX_SIZE ||
33169b02e161SWei Wang         !is_power_of_2(n->net_conf.tx_queue_size)) {
33179b02e161SWei Wang         error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), "
33189b02e161SWei Wang                    "must be a power of 2 between %d and %d",
33199b02e161SWei Wang                    n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE,
33209b02e161SWei Wang                    VIRTQUEUE_MAX_SIZE);
33219b02e161SWei Wang         virtio_cleanup(vdev);
33229b02e161SWei Wang         return;
33239b02e161SWei Wang     }
33249b02e161SWei Wang 
3325575a1c0eSJiri Pirko     n->max_queues = MAX(n->nic_conf.peers.queues, 1);
332687b3bd1cSJason Wang     if (n->max_queues * 2 + 1 > VIRTIO_QUEUE_MAX) {
33277e0e736eSJason Wang         error_setg(errp, "Invalid number of queues (= %" PRIu32 "), "
3328631b22eaSStefan Weil                    "must be a positive integer less than %d.",
332987b3bd1cSJason Wang                    n->max_queues, (VIRTIO_QUEUE_MAX - 1) / 2);
33307e0e736eSJason Wang         virtio_cleanup(vdev);
33317e0e736eSJason Wang         return;
33327e0e736eSJason Wang     }
33336e790746SPaolo Bonzini     n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queues);
33346e790746SPaolo Bonzini     n->curr_queues = 1;
33351773d9eeSKONRAD Frederic     n->tx_timeout = n->net_conf.txtimer;
33366e790746SPaolo Bonzini 
33371773d9eeSKONRAD Frederic     if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
33381773d9eeSKONRAD Frederic                        && strcmp(n->net_conf.tx, "bh")) {
33390765691eSMarkus Armbruster         warn_report("virtio-net: "
33406e790746SPaolo Bonzini                     "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
33411773d9eeSKONRAD Frederic                     n->net_conf.tx);
33420765691eSMarkus Armbruster         error_printf("Defaulting to \"bh\"");
33436e790746SPaolo Bonzini     }
33446e790746SPaolo Bonzini 
33452eef278bSMichael S. Tsirkin     n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n),
33462eef278bSMichael S. Tsirkin                                     n->net_conf.tx_queue_size);
33479b02e161SWei Wang 
3348da51a335SJason Wang     for (i = 0; i < n->max_queues; i++) {
3349f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i);
3350da51a335SJason Wang     }
3351da51a335SJason Wang 
335217a0ca55SKONRAD Frederic     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
33531773d9eeSKONRAD Frederic     qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
33541773d9eeSKONRAD Frederic     memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
33556e790746SPaolo Bonzini     n->status = VIRTIO_NET_S_LINK_UP;
33569d8c6a25SDr. David Alan Gilbert     qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
33579d8c6a25SDr. David Alan Gilbert                               QEMU_CLOCK_VIRTUAL,
3358f57fcf70SJason Wang                               virtio_net_announce_timer, n);
3359b2c929f0SDr. David Alan Gilbert     n->announce_timer.round = 0;
33606e790746SPaolo Bonzini 
33618a253ec2SKONRAD Frederic     if (n->netclient_type) {
33628a253ec2SKONRAD Frederic         /*
33638a253ec2SKONRAD Frederic          * Happen when virtio_net_set_netclient_name has been called.
33648a253ec2SKONRAD Frederic          */
33658a253ec2SKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
33668a253ec2SKONRAD Frederic                               n->netclient_type, n->netclient_name, n);
33678a253ec2SKONRAD Frederic     } else {
33681773d9eeSKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
3369284a32f0SAndreas Färber                               object_get_typename(OBJECT(dev)), dev->id, n);
33708a253ec2SKONRAD Frederic     }
33718a253ec2SKONRAD Frederic 
33726e790746SPaolo Bonzini     peer_test_vnet_hdr(n);
33736e790746SPaolo Bonzini     if (peer_has_vnet_hdr(n)) {
33746e790746SPaolo Bonzini         for (i = 0; i < n->max_queues; i++) {
3375d6085e3aSStefan Hajnoczi             qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
33766e790746SPaolo Bonzini         }
33776e790746SPaolo Bonzini         n->host_hdr_len = sizeof(struct virtio_net_hdr);
33786e790746SPaolo Bonzini     } else {
33796e790746SPaolo Bonzini         n->host_hdr_len = 0;
33806e790746SPaolo Bonzini     }
33816e790746SPaolo Bonzini 
33821773d9eeSKONRAD Frederic     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
33836e790746SPaolo Bonzini 
33846e790746SPaolo Bonzini     n->vqs[0].tx_waiting = 0;
33851773d9eeSKONRAD Frederic     n->tx_burst = n->net_conf.txburst;
3386e22f0603SYuri Benditovich     virtio_net_set_mrg_rx_bufs(n, 0, 0, 0);
33876e790746SPaolo Bonzini     n->promisc = 1; /* for compatibility */
33886e790746SPaolo Bonzini 
33896e790746SPaolo Bonzini     n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
33906e790746SPaolo Bonzini 
33916e790746SPaolo Bonzini     n->vlans = g_malloc0(MAX_VLAN >> 3);
33926e790746SPaolo Bonzini 
3393b1be4280SAmos Kong     nc = qemu_get_queue(n->nic);
3394b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
3395b1be4280SAmos Kong 
33962974e916SYuri Benditovich     QTAILQ_INIT(&n->rsc_chains);
3397284a32f0SAndreas Färber     n->qdev = dev;
33984474e37aSYuri Benditovich 
33994474e37aSYuri Benditovich     net_rx_pkt_init(&n->rx_pkt, false);
340017ec5a86SKONRAD Frederic }
340117ec5a86SKONRAD Frederic 
3402b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev)
340317ec5a86SKONRAD Frederic {
3404306ec6c3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3405306ec6c3SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3406f9d6dbf0SWen Congyang     int i, max_queues;
340717ec5a86SKONRAD Frederic 
340817ec5a86SKONRAD Frederic     /* This will stop vhost backend if appropriate. */
340917ec5a86SKONRAD Frederic     virtio_net_set_status(vdev, 0);
341017ec5a86SKONRAD Frederic 
34118a253ec2SKONRAD Frederic     g_free(n->netclient_name);
34128a253ec2SKONRAD Frederic     n->netclient_name = NULL;
34138a253ec2SKONRAD Frederic     g_free(n->netclient_type);
34148a253ec2SKONRAD Frederic     n->netclient_type = NULL;
34158a253ec2SKONRAD Frederic 
341617ec5a86SKONRAD Frederic     g_free(n->mac_table.macs);
341717ec5a86SKONRAD Frederic     g_free(n->vlans);
341817ec5a86SKONRAD Frederic 
34199711cd0dSJens Freimann     if (n->failover) {
34209711cd0dSJens Freimann         g_free(n->primary_device_id);
34219711cd0dSJens Freimann         g_free(n->standby_id);
34229711cd0dSJens Freimann         qobject_unref(n->primary_device_dict);
34239711cd0dSJens Freimann         n->primary_device_dict = NULL;
34249711cd0dSJens Freimann     }
34259711cd0dSJens Freimann 
3426f9d6dbf0SWen Congyang     max_queues = n->multiqueue ? n->max_queues : 1;
3427f9d6dbf0SWen Congyang     for (i = 0; i < max_queues; i++) {
3428f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i);
342917ec5a86SKONRAD Frederic     }
3430d945d9f1SYuri Benditovich     /* delete also control vq */
3431d945d9f1SYuri Benditovich     virtio_del_queue(vdev, max_queues * 2);
3432944458b6SDr. David Alan Gilbert     qemu_announce_timer_del(&n->announce_timer, false);
343317ec5a86SKONRAD Frederic     g_free(n->vqs);
343417ec5a86SKONRAD Frederic     qemu_del_nic(n->nic);
34352974e916SYuri Benditovich     virtio_net_rsc_cleanup(n);
343659079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
34374474e37aSYuri Benditovich     net_rx_pkt_uninit(n->rx_pkt);
34386a1a8cc7SKONRAD Frederic     virtio_cleanup(vdev);
343917ec5a86SKONRAD Frederic }
344017ec5a86SKONRAD Frederic 
344117ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj)
344217ec5a86SKONRAD Frederic {
344317ec5a86SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(obj);
344417ec5a86SKONRAD Frederic 
344517ec5a86SKONRAD Frederic     /*
344617ec5a86SKONRAD Frederic      * The default config_size is sizeof(struct virtio_net_config).
344717ec5a86SKONRAD Frederic      * Can be overriden with virtio_net_set_config_size.
344817ec5a86SKONRAD Frederic      */
344917ec5a86SKONRAD Frederic     n->config_size = sizeof(struct virtio_net_config);
3450aa4197c3SGonglei     device_add_bootindex_property(obj, &n->nic_conf.bootindex,
3451aa4197c3SGonglei                                   "bootindex", "/ethernet-phy@0",
345240c2281cSMarkus Armbruster                                   DEVICE(n));
345317ec5a86SKONRAD Frederic }
345417ec5a86SKONRAD Frederic 
345544b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque)
34564d45dcfbSHalil Pasic {
34574d45dcfbSHalil Pasic     VirtIONet *n = opaque;
34584d45dcfbSHalil Pasic 
34594d45dcfbSHalil Pasic     /* At this point, backend must be stopped, otherwise
34604d45dcfbSHalil Pasic      * it might keep writing to memory. */
34614d45dcfbSHalil Pasic     assert(!n->vhost_started);
346244b1ff31SDr. David Alan Gilbert 
346344b1ff31SDr. David Alan Gilbert     return 0;
34644d45dcfbSHalil Pasic }
34654d45dcfbSHalil Pasic 
34669711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque)
34679711cd0dSJens Freimann {
34689711cd0dSJens Freimann     DeviceState *dev = opaque;
34699711cd0dSJens Freimann     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
34709711cd0dSJens Freimann     VirtIONet *n = VIRTIO_NET(vdev);
34719711cd0dSJens Freimann 
3472284f42a5SJens Freimann     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) {
3473284f42a5SJens Freimann         return false;
3474284f42a5SJens Freimann     }
34759711cd0dSJens Freimann     return n->primary_dev ? n->primary_dev->pending_deleted_event : false;
34769711cd0dSJens Freimann }
34779711cd0dSJens Freimann 
34789711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque)
34799711cd0dSJens Freimann {
34809711cd0dSJens Freimann     DeviceState *dev = opaque;
34819711cd0dSJens Freimann     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
34829711cd0dSJens Freimann 
34839711cd0dSJens Freimann     return vdc->primary_unplug_pending(dev);
34849711cd0dSJens Freimann }
34859711cd0dSJens Freimann 
34864d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = {
34874d45dcfbSHalil Pasic     .name = "virtio-net",
34884d45dcfbSHalil Pasic     .minimum_version_id = VIRTIO_NET_VM_VERSION,
34894d45dcfbSHalil Pasic     .version_id = VIRTIO_NET_VM_VERSION,
34904d45dcfbSHalil Pasic     .fields = (VMStateField[]) {
34914d45dcfbSHalil Pasic         VMSTATE_VIRTIO_DEVICE,
34924d45dcfbSHalil Pasic         VMSTATE_END_OF_LIST()
34934d45dcfbSHalil Pasic     },
34944d45dcfbSHalil Pasic     .pre_save = virtio_net_pre_save,
34959711cd0dSJens Freimann     .dev_unplug_pending = dev_unplug_pending,
34964d45dcfbSHalil Pasic };
3497290c2428SDr. David Alan Gilbert 
349817ec5a86SKONRAD Frederic static Property virtio_net_properties[] = {
3499127833eeSJason Baron     DEFINE_PROP_BIT64("csum", VirtIONet, host_features,
3500127833eeSJason Baron                     VIRTIO_NET_F_CSUM, true),
3501127833eeSJason Baron     DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features,
350287108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_CSUM, true),
3503127833eeSJason Baron     DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true),
3504127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features,
350587108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO4, true),
3506127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features,
350787108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO6, true),
3508127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features,
350987108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ECN, true),
3510127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features,
351187108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_UFO, true),
3512127833eeSJason Baron     DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features,
351387108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ANNOUNCE, true),
3514127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features,
351587108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO4, true),
3516127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features,
351787108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO6, true),
3518127833eeSJason Baron     DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features,
351987108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_ECN, true),
3520127833eeSJason Baron     DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features,
352187108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_UFO, true),
3522127833eeSJason Baron     DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features,
352387108bb2SShannon Zhao                     VIRTIO_NET_F_MRG_RXBUF, true),
3524127833eeSJason Baron     DEFINE_PROP_BIT64("status", VirtIONet, host_features,
352587108bb2SShannon Zhao                     VIRTIO_NET_F_STATUS, true),
3526127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features,
352787108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VQ, true),
3528127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features,
352987108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX, true),
3530127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features,
353187108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VLAN, true),
3532127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features,
353387108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX_EXTRA, true),
3534127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features,
353587108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_MAC_ADDR, true),
3536127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features,
353787108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true),
3538127833eeSJason Baron     DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false),
353959079029SYuri Benditovich     DEFINE_PROP_BIT64("rss", VirtIONet, host_features,
354059079029SYuri Benditovich                     VIRTIO_NET_F_RSS, false),
3541e22f0603SYuri Benditovich     DEFINE_PROP_BIT64("hash", VirtIONet, host_features,
3542e22f0603SYuri Benditovich                     VIRTIO_NET_F_HASH_REPORT, false),
35432974e916SYuri Benditovich     DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features,
35442974e916SYuri Benditovich                     VIRTIO_NET_F_RSC_EXT, false),
35452974e916SYuri Benditovich     DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout,
35462974e916SYuri Benditovich                        VIRTIO_NET_RSC_DEFAULT_INTERVAL),
354717ec5a86SKONRAD Frederic     DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
354817ec5a86SKONRAD Frederic     DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
354917ec5a86SKONRAD Frederic                        TX_TIMER_INTERVAL),
355017ec5a86SKONRAD Frederic     DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
355117ec5a86SKONRAD Frederic     DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
35521c0fbfa3SMichael S. Tsirkin     DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size,
35531c0fbfa3SMichael S. Tsirkin                        VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE),
35549b02e161SWei Wang     DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size,
35559b02e161SWei Wang                        VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE),
3556a93e599dSMaxime Coquelin     DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0),
355775ebec11SMaxime Coquelin     DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend,
355875ebec11SMaxime Coquelin                      true),
35599473939eSJason Baron     DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN),
35609473939eSJason Baron     DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str),
35619711cd0dSJens Freimann     DEFINE_PROP_BOOL("failover", VirtIONet, failover, false),
356217ec5a86SKONRAD Frederic     DEFINE_PROP_END_OF_LIST(),
356317ec5a86SKONRAD Frederic };
356417ec5a86SKONRAD Frederic 
356517ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data)
356617ec5a86SKONRAD Frederic {
356717ec5a86SKONRAD Frederic     DeviceClass *dc = DEVICE_CLASS(klass);
356817ec5a86SKONRAD Frederic     VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
3569e6f746b3SAndreas Färber 
35704f67d30bSMarc-André Lureau     device_class_set_props(dc, virtio_net_properties);
3571290c2428SDr. David Alan Gilbert     dc->vmsd = &vmstate_virtio_net;
3572125ee0edSMarcel Apfelbaum     set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
3573e6f746b3SAndreas Färber     vdc->realize = virtio_net_device_realize;
3574306ec6c3SAndreas Färber     vdc->unrealize = virtio_net_device_unrealize;
357517ec5a86SKONRAD Frederic     vdc->get_config = virtio_net_get_config;
357617ec5a86SKONRAD Frederic     vdc->set_config = virtio_net_set_config;
357717ec5a86SKONRAD Frederic     vdc->get_features = virtio_net_get_features;
357817ec5a86SKONRAD Frederic     vdc->set_features = virtio_net_set_features;
357917ec5a86SKONRAD Frederic     vdc->bad_features = virtio_net_bad_features;
358017ec5a86SKONRAD Frederic     vdc->reset = virtio_net_reset;
358117ec5a86SKONRAD Frederic     vdc->set_status = virtio_net_set_status;
358217ec5a86SKONRAD Frederic     vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
358317ec5a86SKONRAD Frederic     vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
35842a083ffdSMichael S. Tsirkin     vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO);
35857788c3f2SMikhail Sennikovsky     vdc->post_load = virtio_net_post_load_virtio;
3586982b78c5SDr. David Alan Gilbert     vdc->vmsd = &vmstate_virtio_net_device;
35879711cd0dSJens Freimann     vdc->primary_unplug_pending = primary_unplug_pending;
358817ec5a86SKONRAD Frederic }
358917ec5a86SKONRAD Frederic 
359017ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = {
359117ec5a86SKONRAD Frederic     .name = TYPE_VIRTIO_NET,
359217ec5a86SKONRAD Frederic     .parent = TYPE_VIRTIO_DEVICE,
359317ec5a86SKONRAD Frederic     .instance_size = sizeof(VirtIONet),
359417ec5a86SKONRAD Frederic     .instance_init = virtio_net_instance_init,
359517ec5a86SKONRAD Frederic     .class_init = virtio_net_class_init,
359617ec5a86SKONRAD Frederic };
359717ec5a86SKONRAD Frederic 
359817ec5a86SKONRAD Frederic static void virtio_register_types(void)
359917ec5a86SKONRAD Frederic {
360017ec5a86SKONRAD Frederic     type_register_static(&virtio_net_info);
360117ec5a86SKONRAD Frederic }
360217ec5a86SKONRAD Frederic 
360317ec5a86SKONRAD Frederic type_init(virtio_register_types)
3604