xref: /openbmc/qemu/hw/net/virtio-net.c (revision df8d07081718c29d04d106583d9c300128686cda)
16e790746SPaolo Bonzini /*
26e790746SPaolo Bonzini  * Virtio Network Device
36e790746SPaolo Bonzini  *
46e790746SPaolo Bonzini  * Copyright IBM, Corp. 2007
56e790746SPaolo Bonzini  *
66e790746SPaolo Bonzini  * Authors:
76e790746SPaolo Bonzini  *  Anthony Liguori   <aliguori@us.ibm.com>
86e790746SPaolo Bonzini  *
96e790746SPaolo Bonzini  * This work is licensed under the terms of the GNU GPL, version 2.  See
106e790746SPaolo Bonzini  * the COPYING file in the top-level directory.
116e790746SPaolo Bonzini  *
126e790746SPaolo Bonzini  */
136e790746SPaolo Bonzini 
149b8bfe21SPeter Maydell #include "qemu/osdep.h"
159711cd0dSJens Freimann #include "qemu/atomic.h"
166e790746SPaolo Bonzini #include "qemu/iov.h"
1768b0a639SSi-Wei Liu #include "qemu/log.h"
18db725815SMarkus Armbruster #include "qemu/main-loop.h"
190b8fa32fSMarkus Armbruster #include "qemu/module.h"
206e790746SPaolo Bonzini #include "hw/virtio/virtio.h"
216e790746SPaolo Bonzini #include "net/net.h"
226e790746SPaolo Bonzini #include "net/checksum.h"
236e790746SPaolo Bonzini #include "net/tap.h"
246e790746SPaolo Bonzini #include "qemu/error-report.h"
256e790746SPaolo Bonzini #include "qemu/timer.h"
269711cd0dSJens Freimann #include "qemu/option.h"
279711cd0dSJens Freimann #include "qemu/option_int.h"
289711cd0dSJens Freimann #include "qemu/config-file.h"
299711cd0dSJens Freimann #include "qapi/qmp/qdict.h"
306e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h"
316e790746SPaolo Bonzini #include "net/vhost_net.h"
329d8c6a25SDr. David Alan Gilbert #include "net/announce.h"
3317ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h"
34e688df6bSMarkus Armbruster #include "qapi/error.h"
359af23989SMarkus Armbruster #include "qapi/qapi-events-net.h"
36a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h"
379711cd0dSJens Freimann #include "qapi/qapi-types-migration.h"
389711cd0dSJens Freimann #include "qapi/qapi-events-migration.h"
391399c60dSRusty Russell #include "hw/virtio/virtio-access.h"
40f8d806c9SJuan Quintela #include "migration/misc.h"
419473939eSJason Baron #include "standard-headers/linux/ethtool.h"
422f780b6aSMarkus Armbruster #include "sysemu/sysemu.h"
439d8c6a25SDr. David Alan Gilbert #include "trace.h"
449711cd0dSJens Freimann #include "monitor/qdev.h"
459711cd0dSJens Freimann #include "hw/pci/pci.h"
464474e37aSYuri Benditovich #include "net_rx_pkt.h"
47108a6481SCindy Lu #include "hw/virtio/vhost.h"
481b529d90SLaurent Vivier #include "sysemu/qtest.h"
496e790746SPaolo Bonzini 
506e790746SPaolo Bonzini #define VIRTIO_NET_VM_VERSION    11
516e790746SPaolo Bonzini 
526e790746SPaolo Bonzini #define MAX_VLAN    (1 << 12)   /* Per 802.1Q definition */
536e790746SPaolo Bonzini 
541c0fbfa3SMichael S. Tsirkin /* previously fixed value */
551c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256
569b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256
579b02e161SWei Wang 
58441537f1SJason Wang /* for now, only allow larger queue_pairs; with virtio-1, guest can downsize */
591c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
609b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE
611c0fbfa3SMichael S. Tsirkin 
622974e916SYuri Benditovich #define VIRTIO_NET_IP4_ADDR_SIZE   8        /* ipv4 saddr + daddr */
632974e916SYuri Benditovich 
642974e916SYuri Benditovich #define VIRTIO_NET_TCP_FLAG         0x3F
652974e916SYuri Benditovich #define VIRTIO_NET_TCP_HDR_LENGTH   0xF000
662974e916SYuri Benditovich 
672974e916SYuri Benditovich /* IPv4 max payload, 16 bits in the header */
682974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header))
692974e916SYuri Benditovich #define VIRTIO_NET_MAX_TCP_PAYLOAD 65535
702974e916SYuri Benditovich 
712974e916SYuri Benditovich /* header length value in ip header without option */
722974e916SYuri Benditovich #define VIRTIO_NET_IP4_HEADER_LENGTH 5
732974e916SYuri Benditovich 
742974e916SYuri Benditovich #define VIRTIO_NET_IP6_ADDR_SIZE   32      /* ipv6 saddr + daddr */
752974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD
762974e916SYuri Benditovich 
772974e916SYuri Benditovich /* Purge coalesced packets timer interval, This value affects the performance
782974e916SYuri Benditovich    a lot, and should be tuned carefully, '300000'(300us) is the recommended
792974e916SYuri Benditovich    value to pass the WHQL test, '50000' can gain 2x netperf throughput with
802974e916SYuri Benditovich    tso/gso/gro 'off'. */
812974e916SYuri Benditovich #define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000
822974e916SYuri Benditovich 
8359079029SYuri Benditovich #define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \
8459079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \
8559079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \
8659079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \
8759079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \
8859079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \
8959079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \
9059079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \
9159079029SYuri Benditovich                                          VIRTIO_NET_RSS_HASH_TYPE_UDP_EX)
9259079029SYuri Benditovich 
93ad6461adSPhilippe Mathieu-Daudé static const VirtIOFeature feature_sizes[] = {
94127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MAC,
955d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mac)},
96127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_STATUS,
975d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, status)},
98127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MQ,
995d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
100127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MTU,
1015d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mtu)},
1029473939eSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX,
1035d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, duplex)},
104e22f0603SYuri Benditovich     {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT),
10559079029SYuri Benditovich      .end = endof(struct virtio_net_config, supported_hash_types)},
1066e790746SPaolo Bonzini     {}
1076e790746SPaolo Bonzini };
1086e790746SPaolo Bonzini 
109d74c30c8SDaniil Tatianin static const VirtIOConfigSizeParams cfg_size_params = {
110d74c30c8SDaniil Tatianin     .min_size = endof(struct virtio_net_config, mac),
111d74c30c8SDaniil Tatianin     .max_size = sizeof(struct virtio_net_config),
112d74c30c8SDaniil Tatianin     .feature_sizes = feature_sizes
113d74c30c8SDaniil Tatianin };
114d74c30c8SDaniil Tatianin 
1156e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
1166e790746SPaolo Bonzini {
1176e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1186e790746SPaolo Bonzini 
1196e790746SPaolo Bonzini     return &n->vqs[nc->queue_index];
1206e790746SPaolo Bonzini }
1216e790746SPaolo Bonzini 
/*
 * Convert a virtqueue index into a queue-pair index by integer division
 * by two (presumably one RX and one TX virtqueue per pair -- confirm
 * against the queue setup code).
 */
static int vq2q(int queue_index)
{
    const int vqs_per_pair = 2;

    return queue_index / vqs_per_pair;
}
1266e790746SPaolo Bonzini 
1276e790746SPaolo Bonzini /* TODO
1286e790746SPaolo Bonzini  * - we could suppress RX interrupt if we were so inclined.
1296e790746SPaolo Bonzini  */
1306e790746SPaolo Bonzini 
1316e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
1326e790746SPaolo Bonzini {
13317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1346e790746SPaolo Bonzini     struct virtio_net_config netcfg;
135c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
136fb592882SCindy Lu     static const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } };
1376e790746SPaolo Bonzini 
138108a6481SCindy Lu     int ret = 0;
139108a6481SCindy Lu     memset(&netcfg, 0 , sizeof(struct virtio_net_config));
1401399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.status, n->status);
141441537f1SJason Wang     virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queue_pairs);
142a93e599dSMaxime Coquelin     virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu);
1436e790746SPaolo Bonzini     memcpy(netcfg.mac, n->mac, ETH_ALEN);
1449473939eSJason Baron     virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed);
1459473939eSJason Baron     netcfg.duplex = n->net_conf.duplex;
14659079029SYuri Benditovich     netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE;
14759079029SYuri Benditovich     virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length,
148e22f0603SYuri Benditovich                  virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ?
149e22f0603SYuri Benditovich                  VIRTIO_NET_RSS_MAX_TABLE_LEN : 1);
15059079029SYuri Benditovich     virtio_stl_p(vdev, &netcfg.supported_hash_types,
15159079029SYuri Benditovich                  VIRTIO_NET_RSS_SUPPORTED_HASHES);
1526e790746SPaolo Bonzini     memcpy(config, &netcfg, n->config_size);
153108a6481SCindy Lu 
154c546ecf2SJason Wang     /*
155c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
156c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
157c546ecf2SJason Wang      */
158c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
159108a6481SCindy Lu         ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg,
160108a6481SCindy Lu                                    n->config_size);
161108a6481SCindy Lu         if (ret != -1) {
162fb592882SCindy Lu             /*
163fb592882SCindy Lu              * Some NIC/kernel combinations present 0 as the mac address.  As
164fb592882SCindy Lu              * that is not a legal address, try to proceed with the
165fb592882SCindy Lu              * address from the QEMU command line in the hope that the
166fb592882SCindy Lu              * address has been configured correctly elsewhere - just not
167fb592882SCindy Lu              * reported by the device.
168fb592882SCindy Lu              */
169fb592882SCindy Lu             if (memcmp(&netcfg.mac, &zero, sizeof(zero)) == 0) {
170fb592882SCindy Lu                 info_report("Zero hardware mac address detected. Ignoring.");
171fb592882SCindy Lu                 memcpy(netcfg.mac, n->mac, ETH_ALEN);
172fb592882SCindy Lu             }
173108a6481SCindy Lu             memcpy(config, &netcfg, n->config_size);
174108a6481SCindy Lu         }
175108a6481SCindy Lu     }
1766e790746SPaolo Bonzini }
1776e790746SPaolo Bonzini 
1786e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
1796e790746SPaolo Bonzini {
18017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1816e790746SPaolo Bonzini     struct virtio_net_config netcfg = {};
182c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
1836e790746SPaolo Bonzini 
1846e790746SPaolo Bonzini     memcpy(&netcfg, config, n->config_size);
1856e790746SPaolo Bonzini 
18695129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) &&
18795129d6fSCornelia Huck         !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) &&
1886e790746SPaolo Bonzini         memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
1896e790746SPaolo Bonzini         memcpy(n->mac, netcfg.mac, ETH_ALEN);
1906e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1916e790746SPaolo Bonzini     }
192108a6481SCindy Lu 
193c546ecf2SJason Wang     /*
194c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
195c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
196c546ecf2SJason Wang      */
197c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
198c546ecf2SJason Wang         vhost_net_set_config(get_vhost_net(nc->peer),
199c546ecf2SJason Wang                              (uint8_t *)&netcfg, 0, n->config_size,
200108a6481SCindy Lu                              VHOST_SET_CONFIG_TYPE_MASTER);
201108a6481SCindy Lu       }
2026e790746SPaolo Bonzini }
2036e790746SPaolo Bonzini 
2046e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status)
2056e790746SPaolo Bonzini {
20617a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2076e790746SPaolo Bonzini     return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
20817a0ca55SKONRAD Frederic         (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
2096e790746SPaolo Bonzini }
2106e790746SPaolo Bonzini 
211b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net)
212b2c929f0SDr. David Alan Gilbert {
213b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(net);
214b2c929f0SDr. David Alan Gilbert     trace_virtio_net_announce_notify();
215b2c929f0SDr. David Alan Gilbert 
216b2c929f0SDr. David Alan Gilbert     net->status |= VIRTIO_NET_S_ANNOUNCE;
217b2c929f0SDr. David Alan Gilbert     virtio_notify_config(vdev);
218b2c929f0SDr. David Alan Gilbert }
219b2c929f0SDr. David Alan Gilbert 
220f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque)
221f57fcf70SJason Wang {
222f57fcf70SJason Wang     VirtIONet *n = opaque;
2239d8c6a25SDr. David Alan Gilbert     trace_virtio_net_announce_timer(n->announce_timer.round);
224f57fcf70SJason Wang 
2259d8c6a25SDr. David Alan Gilbert     n->announce_timer.round--;
226b2c929f0SDr. David Alan Gilbert     virtio_net_announce_notify(n);
227b2c929f0SDr. David Alan Gilbert }
228b2c929f0SDr. David Alan Gilbert 
229b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc)
230b2c929f0SDr. David Alan Gilbert {
231b2c929f0SDr. David Alan Gilbert     VirtIONet *n = qemu_get_nic_opaque(nc);
232b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
233b2c929f0SDr. David Alan Gilbert 
234b2c929f0SDr. David Alan Gilbert     /*
235b2c929f0SDr. David Alan Gilbert      * Make sure the virtio migration announcement timer isn't running
236b2c929f0SDr. David Alan Gilbert      * If it is, let it trigger announcement so that we do not cause
237b2c929f0SDr. David Alan Gilbert      * confusion.
238b2c929f0SDr. David Alan Gilbert      */
239b2c929f0SDr. David Alan Gilbert     if (n->announce_timer.round) {
240b2c929f0SDr. David Alan Gilbert         return;
241b2c929f0SDr. David Alan Gilbert     }
242b2c929f0SDr. David Alan Gilbert 
243b2c929f0SDr. David Alan Gilbert     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
244b2c929f0SDr. David Alan Gilbert         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
245b2c929f0SDr. David Alan Gilbert             virtio_net_announce_notify(n);
246b2c929f0SDr. David Alan Gilbert     }
247f57fcf70SJason Wang }
248f57fcf70SJason Wang 
2496e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
2506e790746SPaolo Bonzini {
25117a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2526e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
253441537f1SJason Wang     int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
254aa858194SSi-Wei Liu     int cvq = virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ) ?
255aa858194SSi-Wei Liu               n->max_ncs - n->max_queue_pairs : 0;
2566e790746SPaolo Bonzini 
257ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
2586e790746SPaolo Bonzini         return;
2596e790746SPaolo Bonzini     }
2606e790746SPaolo Bonzini 
2618c1ac475SRadim Krčmář     if ((virtio_net_started(n, status) && !nc->peer->link_down) ==
2628c1ac475SRadim Krčmář         !!n->vhost_started) {
2636e790746SPaolo Bonzini         return;
2646e790746SPaolo Bonzini     }
2656e790746SPaolo Bonzini     if (!n->vhost_started) {
266086abc1cSMichael S. Tsirkin         int r, i;
267086abc1cSMichael S. Tsirkin 
2681bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
2691bfa316cSGreg Kurz             error_report("backend does not support %s vnet headers; "
2701bfa316cSGreg Kurz                          "falling back on userspace virtio",
2711bfa316cSGreg Kurz                          virtio_is_big_endian(vdev) ? "BE" : "LE");
2721bfa316cSGreg Kurz             return;
2731bfa316cSGreg Kurz         }
2741bfa316cSGreg Kurz 
275086abc1cSMichael S. Tsirkin         /* Any packets outstanding? Purge them to avoid touching rings
276086abc1cSMichael S. Tsirkin          * when vhost is running.
277086abc1cSMichael S. Tsirkin          */
278441537f1SJason Wang         for (i = 0;  i < queue_pairs; i++) {
279086abc1cSMichael S. Tsirkin             NetClientState *qnc = qemu_get_subqueue(n->nic, i);
280086abc1cSMichael S. Tsirkin 
281086abc1cSMichael S. Tsirkin             /* Purge both directions: TX and RX. */
282086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->peer->incoming_queue, qnc);
283086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->incoming_queue, qnc->peer);
284086abc1cSMichael S. Tsirkin         }
285086abc1cSMichael S. Tsirkin 
286a93e599dSMaxime Coquelin         if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) {
287a93e599dSMaxime Coquelin             r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu);
288a93e599dSMaxime Coquelin             if (r < 0) {
289a93e599dSMaxime Coquelin                 error_report("%uBytes MTU not supported by the backend",
290a93e599dSMaxime Coquelin                              n->net_conf.mtu);
291a93e599dSMaxime Coquelin 
292a93e599dSMaxime Coquelin                 return;
293a93e599dSMaxime Coquelin             }
294a93e599dSMaxime Coquelin         }
295a93e599dSMaxime Coquelin 
2966e790746SPaolo Bonzini         n->vhost_started = 1;
29722288fe5SJason Wang         r = vhost_net_start(vdev, n->nic->ncs, queue_pairs, cvq);
2986e790746SPaolo Bonzini         if (r < 0) {
2996e790746SPaolo Bonzini             error_report("unable to start vhost net: %d: "
3006e790746SPaolo Bonzini                          "falling back on userspace virtio", -r);
3016e790746SPaolo Bonzini             n->vhost_started = 0;
3026e790746SPaolo Bonzini         }
3036e790746SPaolo Bonzini     } else {
30422288fe5SJason Wang         vhost_net_stop(vdev, n->nic->ncs, queue_pairs, cvq);
3056e790746SPaolo Bonzini         n->vhost_started = 0;
3066e790746SPaolo Bonzini     }
3076e790746SPaolo Bonzini }
3086e790746SPaolo Bonzini 
3091bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev,
3101bfa316cSGreg Kurz                                           NetClientState *peer,
3111bfa316cSGreg Kurz                                           bool enable)
3121bfa316cSGreg Kurz {
3131bfa316cSGreg Kurz     if (virtio_is_big_endian(vdev)) {
3141bfa316cSGreg Kurz         return qemu_set_vnet_be(peer, enable);
3151bfa316cSGreg Kurz     } else {
3161bfa316cSGreg Kurz         return qemu_set_vnet_le(peer, enable);
3171bfa316cSGreg Kurz     }
3181bfa316cSGreg Kurz }
3191bfa316cSGreg Kurz 
3201bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs,
321441537f1SJason Wang                                        int queue_pairs, bool enable)
3221bfa316cSGreg Kurz {
3231bfa316cSGreg Kurz     int i;
3241bfa316cSGreg Kurz 
325441537f1SJason Wang     for (i = 0; i < queue_pairs; i++) {
3261bfa316cSGreg Kurz         if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 &&
3271bfa316cSGreg Kurz             enable) {
3281bfa316cSGreg Kurz             while (--i >= 0) {
3291bfa316cSGreg Kurz                 virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false);
3301bfa316cSGreg Kurz             }
3311bfa316cSGreg Kurz 
3321bfa316cSGreg Kurz             return true;
3331bfa316cSGreg Kurz         }
3341bfa316cSGreg Kurz     }
3351bfa316cSGreg Kurz 
3361bfa316cSGreg Kurz     return false;
3371bfa316cSGreg Kurz }
3381bfa316cSGreg Kurz 
3391bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status)
3401bfa316cSGreg Kurz {
3411bfa316cSGreg Kurz     VirtIODevice *vdev = VIRTIO_DEVICE(n);
342441537f1SJason Wang     int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
3431bfa316cSGreg Kurz 
3441bfa316cSGreg Kurz     if (virtio_net_started(n, status)) {
3451bfa316cSGreg Kurz         /* Before using the device, we tell the network backend about the
3461bfa316cSGreg Kurz          * endianness to use when parsing vnet headers. If the backend
3471bfa316cSGreg Kurz          * can't do it, we fallback onto fixing the headers in the core
3481bfa316cSGreg Kurz          * virtio-net code.
3491bfa316cSGreg Kurz          */
3501bfa316cSGreg Kurz         n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs,
351441537f1SJason Wang                                                             queue_pairs, true);
3521bfa316cSGreg Kurz     } else if (virtio_net_started(n, vdev->status)) {
3531bfa316cSGreg Kurz         /* After using the device, we need to reset the network backend to
3541bfa316cSGreg Kurz          * the default (guest native endianness), otherwise the guest may
3551bfa316cSGreg Kurz          * lose network connectivity if it is rebooted into a different
3561bfa316cSGreg Kurz          * endianness.
3571bfa316cSGreg Kurz          */
358441537f1SJason Wang         virtio_net_set_vnet_endian(vdev, n->nic->ncs, queue_pairs, false);
3591bfa316cSGreg Kurz     }
3601bfa316cSGreg Kurz }
3611bfa316cSGreg Kurz 
362283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq)
363283e2c2aSYuri Benditovich {
364283e2c2aSYuri Benditovich     unsigned int dropped = virtqueue_drop_all(vq);
365283e2c2aSYuri Benditovich     if (dropped) {
366283e2c2aSYuri Benditovich         virtio_notify(vdev, vq);
367283e2c2aSYuri Benditovich     }
368283e2c2aSYuri Benditovich }
369283e2c2aSYuri Benditovich 
3706e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
3716e790746SPaolo Bonzini {
37217a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
3736e790746SPaolo Bonzini     VirtIONetQueue *q;
3746e790746SPaolo Bonzini     int i;
3756e790746SPaolo Bonzini     uint8_t queue_status;
3766e790746SPaolo Bonzini 
3771bfa316cSGreg Kurz     virtio_net_vnet_endian_status(n, status);
3786e790746SPaolo Bonzini     virtio_net_vhost_status(n, status);
3796e790746SPaolo Bonzini 
380441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
38138705bb5SFam Zheng         NetClientState *ncs = qemu_get_subqueue(n->nic, i);
38238705bb5SFam Zheng         bool queue_started;
3836e790746SPaolo Bonzini         q = &n->vqs[i];
3846e790746SPaolo Bonzini 
385441537f1SJason Wang         if ((!n->multiqueue && i != 0) || i >= n->curr_queue_pairs) {
3866e790746SPaolo Bonzini             queue_status = 0;
3876e790746SPaolo Bonzini         } else {
3886e790746SPaolo Bonzini             queue_status = status;
3896e790746SPaolo Bonzini         }
39038705bb5SFam Zheng         queue_started =
39138705bb5SFam Zheng             virtio_net_started(n, queue_status) && !n->vhost_started;
39238705bb5SFam Zheng 
39338705bb5SFam Zheng         if (queue_started) {
39438705bb5SFam Zheng             qemu_flush_queued_packets(ncs);
39538705bb5SFam Zheng         }
3966e790746SPaolo Bonzini 
3976e790746SPaolo Bonzini         if (!q->tx_waiting) {
3986e790746SPaolo Bonzini             continue;
3996e790746SPaolo Bonzini         }
4006e790746SPaolo Bonzini 
40138705bb5SFam Zheng         if (queue_started) {
4026e790746SPaolo Bonzini             if (q->tx_timer) {
403bc72ad67SAlex Bligh                 timer_mod(q->tx_timer,
404bc72ad67SAlex Bligh                                qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
4056e790746SPaolo Bonzini             } else {
4066e790746SPaolo Bonzini                 qemu_bh_schedule(q->tx_bh);
4076e790746SPaolo Bonzini             }
4086e790746SPaolo Bonzini         } else {
4096e790746SPaolo Bonzini             if (q->tx_timer) {
410bc72ad67SAlex Bligh                 timer_del(q->tx_timer);
4116e790746SPaolo Bonzini             } else {
4126e790746SPaolo Bonzini                 qemu_bh_cancel(q->tx_bh);
4136e790746SPaolo Bonzini             }
414283e2c2aSYuri Benditovich             if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 &&
41570e53e6eSJason Wang                 (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) &&
41670e53e6eSJason Wang                 vdev->vm_running) {
417283e2c2aSYuri Benditovich                 /* if tx is waiting we are likely have some packets in tx queue
418283e2c2aSYuri Benditovich                  * and disabled notification */
419283e2c2aSYuri Benditovich                 q->tx_waiting = 0;
420283e2c2aSYuri Benditovich                 virtio_queue_set_notification(q->tx_vq, 1);
421283e2c2aSYuri Benditovich                 virtio_net_drop_tx_queue_data(vdev, q->tx_vq);
422283e2c2aSYuri Benditovich             }
4236e790746SPaolo Bonzini         }
4246e790746SPaolo Bonzini     }
4256e790746SPaolo Bonzini }
4266e790746SPaolo Bonzini 
4276e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc)
4286e790746SPaolo Bonzini {
4296e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
43017a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
4316e790746SPaolo Bonzini     uint16_t old_status = n->status;
4326e790746SPaolo Bonzini 
4336e790746SPaolo Bonzini     if (nc->link_down)
4346e790746SPaolo Bonzini         n->status &= ~VIRTIO_NET_S_LINK_UP;
4356e790746SPaolo Bonzini     else
4366e790746SPaolo Bonzini         n->status |= VIRTIO_NET_S_LINK_UP;
4376e790746SPaolo Bonzini 
4386e790746SPaolo Bonzini     if (n->status != old_status)
43917a0ca55SKONRAD Frederic         virtio_notify_config(vdev);
4406e790746SPaolo Bonzini 
44117a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
4426e790746SPaolo Bonzini }
4436e790746SPaolo Bonzini 
444b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc)
445b1be4280SAmos Kong {
446b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
447b1be4280SAmos Kong 
448b1be4280SAmos Kong     if (nc->rxfilter_notify_enabled) {
449ddfb0baaSMarkus Armbruster         char *path = object_get_canonical_path(OBJECT(n->qdev));
45006150279SWenchao Xia         qapi_event_send_nic_rx_filter_changed(!!n->netclient_name,
4513ab72385SPeter Xu                                               n->netclient_name, path);
45296e35046SAmos Kong         g_free(path);
453b1be4280SAmos Kong 
454b1be4280SAmos Kong         /* disable event notification to avoid events flooding */
455b1be4280SAmos Kong         nc->rxfilter_notify_enabled = 0;
456b1be4280SAmos Kong     }
457b1be4280SAmos Kong }
458b1be4280SAmos Kong 
459f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n)
460f7bc8ef8SAmos Kong {
46154aa3de7SEric Blake     intList *list;
462f7bc8ef8SAmos Kong     int i, j;
463f7bc8ef8SAmos Kong 
464f7bc8ef8SAmos Kong     list = NULL;
465f7bc8ef8SAmos Kong     for (i = 0; i < MAX_VLAN >> 5; i++) {
466f7bc8ef8SAmos Kong         for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
467f7bc8ef8SAmos Kong             if (n->vlans[i] & (1U << j)) {
46854aa3de7SEric Blake                 QAPI_LIST_PREPEND(list, (i << 5) + j);
469f7bc8ef8SAmos Kong             }
470f7bc8ef8SAmos Kong         }
471f7bc8ef8SAmos Kong     }
472f7bc8ef8SAmos Kong 
473f7bc8ef8SAmos Kong     return list;
474f7bc8ef8SAmos Kong }
475f7bc8ef8SAmos Kong 
476b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
477b1be4280SAmos Kong {
478b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
479f7bc8ef8SAmos Kong     VirtIODevice *vdev = VIRTIO_DEVICE(n);
480b1be4280SAmos Kong     RxFilterInfo *info;
48154aa3de7SEric Blake     strList *str_list;
482f7bc8ef8SAmos Kong     int i;
483b1be4280SAmos Kong 
484b1be4280SAmos Kong     info = g_malloc0(sizeof(*info));
485b1be4280SAmos Kong     info->name = g_strdup(nc->name);
486b1be4280SAmos Kong     info->promiscuous = n->promisc;
487b1be4280SAmos Kong 
488b1be4280SAmos Kong     if (n->nouni) {
489b1be4280SAmos Kong         info->unicast = RX_STATE_NONE;
490b1be4280SAmos Kong     } else if (n->alluni) {
491b1be4280SAmos Kong         info->unicast = RX_STATE_ALL;
492b1be4280SAmos Kong     } else {
493b1be4280SAmos Kong         info->unicast = RX_STATE_NORMAL;
494b1be4280SAmos Kong     }
495b1be4280SAmos Kong 
496b1be4280SAmos Kong     if (n->nomulti) {
497b1be4280SAmos Kong         info->multicast = RX_STATE_NONE;
498b1be4280SAmos Kong     } else if (n->allmulti) {
499b1be4280SAmos Kong         info->multicast = RX_STATE_ALL;
500b1be4280SAmos Kong     } else {
501b1be4280SAmos Kong         info->multicast = RX_STATE_NORMAL;
502b1be4280SAmos Kong     }
503b1be4280SAmos Kong 
504b1be4280SAmos Kong     info->broadcast_allowed = n->nobcast;
505b1be4280SAmos Kong     info->multicast_overflow = n->mac_table.multi_overflow;
506b1be4280SAmos Kong     info->unicast_overflow = n->mac_table.uni_overflow;
507b1be4280SAmos Kong 
508b0575ba4SScott Feldman     info->main_mac = qemu_mac_strdup_printf(n->mac);
509b1be4280SAmos Kong 
510b1be4280SAmos Kong     str_list = NULL;
511b1be4280SAmos Kong     for (i = 0; i < n->mac_table.first_multi; i++) {
51254aa3de7SEric Blake         QAPI_LIST_PREPEND(str_list,
51354aa3de7SEric Blake                       qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN));
514b1be4280SAmos Kong     }
515b1be4280SAmos Kong     info->unicast_table = str_list;
516b1be4280SAmos Kong 
517b1be4280SAmos Kong     str_list = NULL;
518b1be4280SAmos Kong     for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
51954aa3de7SEric Blake         QAPI_LIST_PREPEND(str_list,
52054aa3de7SEric Blake                       qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN));
521b1be4280SAmos Kong     }
522b1be4280SAmos Kong     info->multicast_table = str_list;
523f7bc8ef8SAmos Kong     info->vlan_table = get_vlan_table(n);
524b1be4280SAmos Kong 
52595129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) {
526f7bc8ef8SAmos Kong         info->vlan = RX_STATE_ALL;
527f7bc8ef8SAmos Kong     } else if (!info->vlan_table) {
528f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NONE;
529f7bc8ef8SAmos Kong     } else {
530f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NORMAL;
531b1be4280SAmos Kong     }
532b1be4280SAmos Kong 
533b1be4280SAmos Kong     /* enable event notification after query */
534b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
535b1be4280SAmos Kong 
536b1be4280SAmos Kong     return info;
537b1be4280SAmos Kong }
538b1be4280SAmos Kong 
5396e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev)
5406e790746SPaolo Bonzini {
54117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
54294b52958SGreg Kurz     int i;
5436e790746SPaolo Bonzini 
5446e790746SPaolo Bonzini     /* Reset back to compatibility mode */
5456e790746SPaolo Bonzini     n->promisc = 1;
5466e790746SPaolo Bonzini     n->allmulti = 0;
5476e790746SPaolo Bonzini     n->alluni = 0;
5486e790746SPaolo Bonzini     n->nomulti = 0;
5496e790746SPaolo Bonzini     n->nouni = 0;
5506e790746SPaolo Bonzini     n->nobcast = 0;
5516e790746SPaolo Bonzini     /* multiqueue is disabled by default */
552441537f1SJason Wang     n->curr_queue_pairs = 1;
5539d8c6a25SDr. David Alan Gilbert     timer_del(n->announce_timer.tm);
5549d8c6a25SDr. David Alan Gilbert     n->announce_timer.round = 0;
555f57fcf70SJason Wang     n->status &= ~VIRTIO_NET_S_ANNOUNCE;
5566e790746SPaolo Bonzini 
5576e790746SPaolo Bonzini     /* Flush any MAC and VLAN filter table state */
5586e790746SPaolo Bonzini     n->mac_table.in_use = 0;
5596e790746SPaolo Bonzini     n->mac_table.first_multi = 0;
5606e790746SPaolo Bonzini     n->mac_table.multi_overflow = 0;
5616e790746SPaolo Bonzini     n->mac_table.uni_overflow = 0;
5626e790746SPaolo Bonzini     memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
5636e790746SPaolo Bonzini     memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
564702d66a8SMichael S. Tsirkin     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
5656e790746SPaolo Bonzini     memset(n->vlans, 0, MAX_VLAN >> 3);
56694b52958SGreg Kurz 
56794b52958SGreg Kurz     /* Flush any async TX */
568441537f1SJason Wang     for (i = 0;  i < n->max_queue_pairs; i++) {
56994b52958SGreg Kurz         NetClientState *nc = qemu_get_subqueue(n->nic, i);
57094b52958SGreg Kurz 
57194b52958SGreg Kurz         if (nc->peer) {
57294b52958SGreg Kurz             qemu_flush_or_purge_queued_packets(nc->peer, true);
57394b52958SGreg Kurz             assert(!virtio_net_get_subqueue(nc)->async_tx.elem);
57494b52958SGreg Kurz         }
57594b52958SGreg Kurz     }
5766e790746SPaolo Bonzini }
5776e790746SPaolo Bonzini 
5786e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n)
5796e790746SPaolo Bonzini {
5806e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
5816e790746SPaolo Bonzini     if (!nc->peer) {
5826e790746SPaolo Bonzini         return;
5836e790746SPaolo Bonzini     }
5846e790746SPaolo Bonzini 
585d6085e3aSStefan Hajnoczi     n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
5866e790746SPaolo Bonzini }
5876e790746SPaolo Bonzini 
/*
 * Return the cached n->has_vnet_hdr flag.  This only reads the stored value
 * (written by peer_test_vnet_hdr()); the peer itself is not queried here.
 */
static int peer_has_vnet_hdr(VirtIONet *n)
{
    return n->has_vnet_hdr;
}
5926e790746SPaolo Bonzini 
5936e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n)
5946e790746SPaolo Bonzini {
5956e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n))
5966e790746SPaolo Bonzini         return 0;
5976e790746SPaolo Bonzini 
598d6085e3aSStefan Hajnoczi     n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
5996e790746SPaolo Bonzini 
6006e790746SPaolo Bonzini     return n->has_ufo;
6016e790746SPaolo Bonzini }
6026e790746SPaolo Bonzini 
603bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs,
604e22f0603SYuri Benditovich                                        int version_1, int hash_report)
6056e790746SPaolo Bonzini {
6066e790746SPaolo Bonzini     int i;
6076e790746SPaolo Bonzini     NetClientState *nc;
6086e790746SPaolo Bonzini 
6096e790746SPaolo Bonzini     n->mergeable_rx_bufs = mergeable_rx_bufs;
6106e790746SPaolo Bonzini 
611bb9d17f8SCornelia Huck     if (version_1) {
612e22f0603SYuri Benditovich         n->guest_hdr_len = hash_report ?
613e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_v1_hash) :
614e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_mrg_rxbuf);
615e22f0603SYuri Benditovich         n->rss_data.populate_hash = !!hash_report;
616bb9d17f8SCornelia Huck     } else {
6176e790746SPaolo Bonzini         n->guest_hdr_len = n->mergeable_rx_bufs ?
618bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr_mrg_rxbuf) :
619bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr);
620bb9d17f8SCornelia Huck     }
6216e790746SPaolo Bonzini 
622441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
6236e790746SPaolo Bonzini         nc = qemu_get_subqueue(n->nic, i);
6246e790746SPaolo Bonzini 
6256e790746SPaolo Bonzini         if (peer_has_vnet_hdr(n) &&
626d6085e3aSStefan Hajnoczi             qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
627d6085e3aSStefan Hajnoczi             qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
6286e790746SPaolo Bonzini             n->host_hdr_len = n->guest_hdr_len;
6296e790746SPaolo Bonzini         }
6306e790746SPaolo Bonzini     }
6316e790746SPaolo Bonzini }
6326e790746SPaolo Bonzini 
6332eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n)
6342eef278bSMichael S. Tsirkin {
6352eef278bSMichael S. Tsirkin     NetClientState *peer = n->nic_conf.peers.ncs[0];
6362eef278bSMichael S. Tsirkin 
6372eef278bSMichael S. Tsirkin     /*
6380ea5778fSEugenio Pérez      * Backends other than vhost-user or vhost-vdpa don't support max queue
6390ea5778fSEugenio Pérez      * size.
6402eef278bSMichael S. Tsirkin      */
6412eef278bSMichael S. Tsirkin     if (!peer) {
6422eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6432eef278bSMichael S. Tsirkin     }
6442eef278bSMichael S. Tsirkin 
6450ea5778fSEugenio Pérez     switch(peer->info->type) {
6460ea5778fSEugenio Pérez     case NET_CLIENT_DRIVER_VHOST_USER:
6470ea5778fSEugenio Pérez     case NET_CLIENT_DRIVER_VHOST_VDPA:
6482eef278bSMichael S. Tsirkin         return VIRTQUEUE_MAX_SIZE;
6490ea5778fSEugenio Pérez     default:
6500ea5778fSEugenio Pérez         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6510ea5778fSEugenio Pérez     };
6522eef278bSMichael S. Tsirkin }
6532eef278bSMichael S. Tsirkin 
6546e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index)
6556e790746SPaolo Bonzini {
6566e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6576e790746SPaolo Bonzini 
6586e790746SPaolo Bonzini     if (!nc->peer) {
6596e790746SPaolo Bonzini         return 0;
6606e790746SPaolo Bonzini     }
6616e790746SPaolo Bonzini 
662f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6637263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 1);
6647263a0adSChangchun Ouyang     }
6657263a0adSChangchun Ouyang 
666f394b2e2SEric Blake     if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
6676e790746SPaolo Bonzini         return 0;
6686e790746SPaolo Bonzini     }
6696e790746SPaolo Bonzini 
670441537f1SJason Wang     if (n->max_queue_pairs == 1) {
6711074b879SJason Wang         return 0;
6721074b879SJason Wang     }
6731074b879SJason Wang 
6746e790746SPaolo Bonzini     return tap_enable(nc->peer);
6756e790746SPaolo Bonzini }
6766e790746SPaolo Bonzini 
6776e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index)
6786e790746SPaolo Bonzini {
6796e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6806e790746SPaolo Bonzini 
6816e790746SPaolo Bonzini     if (!nc->peer) {
6826e790746SPaolo Bonzini         return 0;
6836e790746SPaolo Bonzini     }
6846e790746SPaolo Bonzini 
685f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6867263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 0);
6877263a0adSChangchun Ouyang     }
6887263a0adSChangchun Ouyang 
689f394b2e2SEric Blake     if (nc->peer->info->type !=  NET_CLIENT_DRIVER_TAP) {
6906e790746SPaolo Bonzini         return 0;
6916e790746SPaolo Bonzini     }
6926e790746SPaolo Bonzini 
6936e790746SPaolo Bonzini     return tap_disable(nc->peer);
6946e790746SPaolo Bonzini }
6956e790746SPaolo Bonzini 
696441537f1SJason Wang static void virtio_net_set_queue_pairs(VirtIONet *n)
6976e790746SPaolo Bonzini {
6986e790746SPaolo Bonzini     int i;
699ddfa83eaSJoel Stanley     int r;
7006e790746SPaolo Bonzini 
70168b5f314SYuri Benditovich     if (n->nic->peer_deleted) {
70268b5f314SYuri Benditovich         return;
70368b5f314SYuri Benditovich     }
70468b5f314SYuri Benditovich 
705441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
706441537f1SJason Wang         if (i < n->curr_queue_pairs) {
707ddfa83eaSJoel Stanley             r = peer_attach(n, i);
708ddfa83eaSJoel Stanley             assert(!r);
7096e790746SPaolo Bonzini         } else {
710ddfa83eaSJoel Stanley             r = peer_detach(n, i);
711ddfa83eaSJoel Stanley             assert(!r);
7126e790746SPaolo Bonzini         }
7136e790746SPaolo Bonzini     }
7146e790746SPaolo Bonzini }
7156e790746SPaolo Bonzini 
716ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
7176e790746SPaolo Bonzini 
7189d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features,
7199d5b731dSJason Wang                                         Error **errp)
7206e790746SPaolo Bonzini {
72117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
7226e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
7236e790746SPaolo Bonzini 
724da3e8a23SShannon Zhao     /* Firstly sync all virtio-net possible supported features */
725da3e8a23SShannon Zhao     features |= n->host_features;
726da3e8a23SShannon Zhao 
7270cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7286e790746SPaolo Bonzini 
7296e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n)) {
7300cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_CSUM);
7310cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7320cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7330cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN);
7346e790746SPaolo Bonzini 
7350cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM);
7360cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4);
7370cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6);
7380cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN);
739e22f0603SYuri Benditovich 
740e22f0603SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
7416e790746SPaolo Bonzini     }
7426e790746SPaolo Bonzini 
7436e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
7440cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO);
7450cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO);
7466e790746SPaolo Bonzini     }
7476e790746SPaolo Bonzini 
748ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
7496e790746SPaolo Bonzini         return features;
7506e790746SPaolo Bonzini     }
7512974e916SYuri Benditovich 
7520145c393SAndrew Melnychenko     if (!ebpf_rss_is_loaded(&n->ebpf_rss)) {
75359079029SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_RSS);
7540145c393SAndrew Melnychenko     }
75575ebec11SMaxime Coquelin     features = vhost_net_get_features(get_vhost_net(nc->peer), features);
75675ebec11SMaxime Coquelin     vdev->backend_features = features;
75775ebec11SMaxime Coquelin 
75875ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
75975ebec11SMaxime Coquelin             (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) {
76075ebec11SMaxime Coquelin         features |= (1ULL << VIRTIO_NET_F_MTU);
76175ebec11SMaxime Coquelin     }
76275ebec11SMaxime Coquelin 
76375ebec11SMaxime Coquelin     return features;
7646e790746SPaolo Bonzini }
7656e790746SPaolo Bonzini 
766019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev)
7676e790746SPaolo Bonzini {
768019a3edbSGerd Hoffmann     uint64_t features = 0;
7696e790746SPaolo Bonzini 
7706e790746SPaolo Bonzini     /* Linux kernel 2.6.25.  It understood MAC (as everyone must),
7716e790746SPaolo Bonzini      * but also these: */
7720cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7730cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_CSUM);
7740cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7750cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7760cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN);
7776e790746SPaolo Bonzini 
7786e790746SPaolo Bonzini     return features;
7796e790746SPaolo Bonzini }
7806e790746SPaolo Bonzini 
781644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n)
782644c9858SDmitry Fleytman {
783ad37bb3bSStefan Hajnoczi     qemu_set_offload(qemu_get_queue(n->nic)->peer,
784644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
785644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
786644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
787644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
788644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
789644c9858SDmitry Fleytman }
790644c9858SDmitry Fleytman 
791644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
792644c9858SDmitry Fleytman {
793644c9858SDmitry Fleytman     static const uint64_t guest_offloads_mask =
794644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
795644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
796644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
797644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_ECN)  |
798644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_UFO);
799644c9858SDmitry Fleytman 
800644c9858SDmitry Fleytman     return guest_offloads_mask & features;
801644c9858SDmitry Fleytman }
802644c9858SDmitry Fleytman 
803644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
804644c9858SDmitry Fleytman {
805644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
806644c9858SDmitry Fleytman     return virtio_net_guest_offloads_by_features(vdev->guest_features);
807644c9858SDmitry Fleytman }
808644c9858SDmitry Fleytman 
/* Search state handed to failover_set_primary() through its opaque pointer */
typedef struct {
    VirtIONet *n;       /* device whose netclient_name is being matched */
    DeviceState *dev;   /* filled in with the matching device, if any */
} FailoverDevice;
813f5e1847bSJuan Quintela 
814f5e1847bSJuan Quintela /**
81512b2fad7SKevin Wolf  * Set the failover primary device
816f5e1847bSJuan Quintela  *
817f5e1847bSJuan Quintela  * @opaque: FailoverId to setup
818f5e1847bSJuan Quintela  * @opts: opts for device we are handling
819f5e1847bSJuan Quintela  * @errp: returns an error if this function fails
820f5e1847bSJuan Quintela  */
82112b2fad7SKevin Wolf static int failover_set_primary(DeviceState *dev, void *opaque)
822f5e1847bSJuan Quintela {
82312b2fad7SKevin Wolf     FailoverDevice *fdev = opaque;
82412b2fad7SKevin Wolf     PCIDevice *pci_dev = (PCIDevice *)
82512b2fad7SKevin Wolf         object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE);
826f5e1847bSJuan Quintela 
82712b2fad7SKevin Wolf     if (!pci_dev) {
82812b2fad7SKevin Wolf         return 0;
82912b2fad7SKevin Wolf     }
83012b2fad7SKevin Wolf 
83112b2fad7SKevin Wolf     if (!g_strcmp0(pci_dev->failover_pair_id, fdev->n->netclient_name)) {
83212b2fad7SKevin Wolf         fdev->dev = dev;
833f5e1847bSJuan Quintela         return 1;
834f5e1847bSJuan Quintela     }
835f5e1847bSJuan Quintela 
836f5e1847bSJuan Quintela     return 0;
837f5e1847bSJuan Quintela }
838f5e1847bSJuan Quintela 
839f5e1847bSJuan Quintela /**
84085d3b931SJuan Quintela  * Find the primary device for this failover virtio-net
84185d3b931SJuan Quintela  *
84285d3b931SJuan Quintela  * @n: VirtIONet device
84385d3b931SJuan Quintela  * @errp: returns an error if this function fails
84485d3b931SJuan Quintela  */
8450a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n)
8469711cd0dSJens Freimann {
84712b2fad7SKevin Wolf     FailoverDevice fdev = {
84812b2fad7SKevin Wolf         .n = n,
84912b2fad7SKevin Wolf     };
8509711cd0dSJens Freimann 
85112b2fad7SKevin Wolf     qbus_walk_children(sysbus_get_default(), failover_set_primary, NULL,
85212b2fad7SKevin Wolf                        NULL, NULL, &fdev);
85312b2fad7SKevin Wolf     return fdev.dev;
8549711cd0dSJens Freimann }
8559711cd0dSJens Freimann 
85621e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp)
85721e8709bSJuan Quintela {
85821e8709bSJuan Quintela     Error *err = NULL;
85921e8709bSJuan Quintela     DeviceState *dev = failover_find_primary_device(n);
86021e8709bSJuan Quintela 
86121e8709bSJuan Quintela     if (dev) {
86221e8709bSJuan Quintela         return;
86321e8709bSJuan Quintela     }
86421e8709bSJuan Quintela 
865259a10dbSKevin Wolf     if (!n->primary_opts) {
86697ca9c59SLaurent Vivier         error_setg(errp, "Primary device not found");
86797ca9c59SLaurent Vivier         error_append_hint(errp, "Virtio-net failover will not work. Make "
86897ca9c59SLaurent Vivier                           "sure primary device has parameter"
86997ca9c59SLaurent Vivier                           " failover_pair_id=%s\n", n->netclient_name);
87021e8709bSJuan Quintela         return;
87121e8709bSJuan Quintela     }
872259a10dbSKevin Wolf 
873f3558b1bSKevin Wolf     dev = qdev_device_add_from_qdict(n->primary_opts,
874f3558b1bSKevin Wolf                                      n->primary_opts_from_json,
875f3558b1bSKevin Wolf                                      &err);
87621e8709bSJuan Quintela     if (err) {
877f3558b1bSKevin Wolf         qobject_unref(n->primary_opts);
878259a10dbSKevin Wolf         n->primary_opts = NULL;
87900e7b129SLaurent Vivier     } else {
88000e7b129SLaurent Vivier         object_unref(OBJECT(dev));
88121e8709bSJuan Quintela     }
88221e8709bSJuan Quintela     error_propagate(errp, err);
88321e8709bSJuan Quintela }
88421e8709bSJuan Quintela 
885d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features)
8866e790746SPaolo Bonzini {
88717a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
8889711cd0dSJens Freimann     Error *err = NULL;
8896e790746SPaolo Bonzini     int i;
8906e790746SPaolo Bonzini 
89175ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
89275ebec11SMaxime Coquelin             !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) {
89375ebec11SMaxime Coquelin         features &= ~(1ULL << VIRTIO_NET_F_MTU);
89475ebec11SMaxime Coquelin     }
89575ebec11SMaxime Coquelin 
896ef546f12SCornelia Huck     virtio_net_set_multiqueue(n,
89759079029SYuri Benditovich                               virtio_has_feature(features, VIRTIO_NET_F_RSS) ||
89895129d6fSCornelia Huck                               virtio_has_feature(features, VIRTIO_NET_F_MQ));
8996e790746SPaolo Bonzini 
900ef546f12SCornelia Huck     virtio_net_set_mrg_rx_bufs(n,
90195129d6fSCornelia Huck                                virtio_has_feature(features,
902bb9d17f8SCornelia Huck                                                   VIRTIO_NET_F_MRG_RXBUF),
90395129d6fSCornelia Huck                                virtio_has_feature(features,
904e22f0603SYuri Benditovich                                                   VIRTIO_F_VERSION_1),
905e22f0603SYuri Benditovich                                virtio_has_feature(features,
906e22f0603SYuri Benditovich                                                   VIRTIO_NET_F_HASH_REPORT));
9076e790746SPaolo Bonzini 
9082974e916SYuri Benditovich     n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9092974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4);
9102974e916SYuri Benditovich     n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9112974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6);
912e22f0603SYuri Benditovich     n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS);
9132974e916SYuri Benditovich 
9146e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
915644c9858SDmitry Fleytman         n->curr_guest_offloads =
916644c9858SDmitry Fleytman             virtio_net_guest_offloads_by_features(features);
917644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
9186e790746SPaolo Bonzini     }
9196e790746SPaolo Bonzini 
920441537f1SJason Wang     for (i = 0;  i < n->max_queue_pairs; i++) {
9216e790746SPaolo Bonzini         NetClientState *nc = qemu_get_subqueue(n->nic, i);
9226e790746SPaolo Bonzini 
923ed8b4afeSNikolay Nikolaev         if (!get_vhost_net(nc->peer)) {
9246e790746SPaolo Bonzini             continue;
9256e790746SPaolo Bonzini         }
926ed8b4afeSNikolay Nikolaev         vhost_net_ack_features(get_vhost_net(nc->peer), features);
9276e790746SPaolo Bonzini     }
9280b1eaa88SStefan Fritsch 
92995129d6fSCornelia Huck     if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) {
9300b1eaa88SStefan Fritsch         memset(n->vlans, 0, MAX_VLAN >> 3);
9310b1eaa88SStefan Fritsch     } else {
9320b1eaa88SStefan Fritsch         memset(n->vlans, 0xff, MAX_VLAN >> 3);
9330b1eaa88SStefan Fritsch     }
9349711cd0dSJens Freimann 
9359711cd0dSJens Freimann     if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) {
9369711cd0dSJens Freimann         qapi_event_send_failover_negotiated(n->netclient_name);
937e2bde83eSJuan Quintela         qatomic_set(&n->failover_primary_hidden, false);
9389711cd0dSJens Freimann         failover_add_primary(n, &err);
9399711cd0dSJens Freimann         if (err) {
9401b529d90SLaurent Vivier             if (!qtest_enabled()) {
9419711cd0dSJens Freimann                 warn_report_err(err);
9421b529d90SLaurent Vivier             } else {
9431b529d90SLaurent Vivier                 error_free(err);
9441b529d90SLaurent Vivier             }
9459711cd0dSJens Freimann         }
9466e790746SPaolo Bonzini     }
94721e8709bSJuan Quintela }
9486e790746SPaolo Bonzini 
9496e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
9506e790746SPaolo Bonzini                                      struct iovec *iov, unsigned int iov_cnt)
9516e790746SPaolo Bonzini {
9526e790746SPaolo Bonzini     uint8_t on;
9536e790746SPaolo Bonzini     size_t s;
954b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
9556e790746SPaolo Bonzini 
9566e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
9576e790746SPaolo Bonzini     if (s != sizeof(on)) {
9586e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9596e790746SPaolo Bonzini     }
9606e790746SPaolo Bonzini 
9616e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
9626e790746SPaolo Bonzini         n->promisc = on;
9636e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
9646e790746SPaolo Bonzini         n->allmulti = on;
9656e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
9666e790746SPaolo Bonzini         n->alluni = on;
9676e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
9686e790746SPaolo Bonzini         n->nomulti = on;
9696e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
9706e790746SPaolo Bonzini         n->nouni = on;
9716e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
9726e790746SPaolo Bonzini         n->nobcast = on;
9736e790746SPaolo Bonzini     } else {
9746e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9756e790746SPaolo Bonzini     }
9766e790746SPaolo Bonzini 
977b1be4280SAmos Kong     rxfilter_notify(nc);
978b1be4280SAmos Kong 
9796e790746SPaolo Bonzini     return VIRTIO_NET_OK;
9806e790746SPaolo Bonzini }
9816e790746SPaolo Bonzini 
982644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
983644c9858SDmitry Fleytman                                      struct iovec *iov, unsigned int iov_cnt)
984644c9858SDmitry Fleytman {
985644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
986644c9858SDmitry Fleytman     uint64_t offloads;
987644c9858SDmitry Fleytman     size_t s;
988644c9858SDmitry Fleytman 
98995129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
990644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
991644c9858SDmitry Fleytman     }
992644c9858SDmitry Fleytman 
993644c9858SDmitry Fleytman     s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
994644c9858SDmitry Fleytman     if (s != sizeof(offloads)) {
995644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
996644c9858SDmitry Fleytman     }
997644c9858SDmitry Fleytman 
998644c9858SDmitry Fleytman     if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
999644c9858SDmitry Fleytman         uint64_t supported_offloads;
1000644c9858SDmitry Fleytman 
1001189ae6bbSJason Wang         offloads = virtio_ldq_p(vdev, &offloads);
1002189ae6bbSJason Wang 
1003644c9858SDmitry Fleytman         if (!n->has_vnet_hdr) {
1004644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1005644c9858SDmitry Fleytman         }
1006644c9858SDmitry Fleytman 
10072974e916SYuri Benditovich         n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10082974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4);
10092974e916SYuri Benditovich         n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10102974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6);
10112974e916SYuri Benditovich         virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT);
10122974e916SYuri Benditovich 
1013644c9858SDmitry Fleytman         supported_offloads = virtio_net_supported_guest_offloads(n);
1014644c9858SDmitry Fleytman         if (offloads & ~supported_offloads) {
1015644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1016644c9858SDmitry Fleytman         }
1017644c9858SDmitry Fleytman 
1018644c9858SDmitry Fleytman         n->curr_guest_offloads = offloads;
1019644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
1020644c9858SDmitry Fleytman 
1021644c9858SDmitry Fleytman         return VIRTIO_NET_OK;
1022644c9858SDmitry Fleytman     } else {
1023644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1024644c9858SDmitry Fleytman     }
1025644c9858SDmitry Fleytman }
1026644c9858SDmitry Fleytman 
10276e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
10286e790746SPaolo Bonzini                                  struct iovec *iov, unsigned int iov_cnt)
10296e790746SPaolo Bonzini {
10301399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
10316e790746SPaolo Bonzini     struct virtio_net_ctrl_mac mac_data;
10326e790746SPaolo Bonzini     size_t s;
1033b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
10346e790746SPaolo Bonzini 
10356e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
10366e790746SPaolo Bonzini         if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
10376e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
10386e790746SPaolo Bonzini         }
10396e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
10406e790746SPaolo Bonzini         assert(s == sizeof(n->mac));
10416e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1042b1be4280SAmos Kong         rxfilter_notify(nc);
1043b1be4280SAmos Kong 
10446e790746SPaolo Bonzini         return VIRTIO_NET_OK;
10456e790746SPaolo Bonzini     }
10466e790746SPaolo Bonzini 
10476e790746SPaolo Bonzini     if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
10486e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
10496e790746SPaolo Bonzini     }
10506e790746SPaolo Bonzini 
1051cae2e556SAmos Kong     int in_use = 0;
1052cae2e556SAmos Kong     int first_multi = 0;
1053cae2e556SAmos Kong     uint8_t uni_overflow = 0;
1054cae2e556SAmos Kong     uint8_t multi_overflow = 0;
1055cae2e556SAmos Kong     uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
10566e790746SPaolo Bonzini 
10576e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10586e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10591399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10606e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1061b1be4280SAmos Kong         goto error;
10626e790746SPaolo Bonzini     }
10636e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10646e790746SPaolo Bonzini 
10656e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
1066b1be4280SAmos Kong         goto error;
10676e790746SPaolo Bonzini     }
10686e790746SPaolo Bonzini 
10696e790746SPaolo Bonzini     if (mac_data.entries <= MAC_TABLE_ENTRIES) {
1070cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, macs,
10716e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
10726e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1073b1be4280SAmos Kong             goto error;
10746e790746SPaolo Bonzini         }
1075cae2e556SAmos Kong         in_use += mac_data.entries;
10766e790746SPaolo Bonzini     } else {
1077cae2e556SAmos Kong         uni_overflow = 1;
10786e790746SPaolo Bonzini     }
10796e790746SPaolo Bonzini 
10806e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
10816e790746SPaolo Bonzini 
1082cae2e556SAmos Kong     first_multi = in_use;
10836e790746SPaolo Bonzini 
10846e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10856e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10861399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10876e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1088b1be4280SAmos Kong         goto error;
10896e790746SPaolo Bonzini     }
10906e790746SPaolo Bonzini 
10916e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10926e790746SPaolo Bonzini 
10936e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
1094b1be4280SAmos Kong         goto error;
10956e790746SPaolo Bonzini     }
10966e790746SPaolo Bonzini 
1097edc24385SMichael S. Tsirkin     if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
1098cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
10996e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
11006e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1101b1be4280SAmos Kong             goto error;
11026e790746SPaolo Bonzini         }
1103cae2e556SAmos Kong         in_use += mac_data.entries;
11046e790746SPaolo Bonzini     } else {
1105cae2e556SAmos Kong         multi_overflow = 1;
11066e790746SPaolo Bonzini     }
11076e790746SPaolo Bonzini 
1108cae2e556SAmos Kong     n->mac_table.in_use = in_use;
1109cae2e556SAmos Kong     n->mac_table.first_multi = first_multi;
1110cae2e556SAmos Kong     n->mac_table.uni_overflow = uni_overflow;
1111cae2e556SAmos Kong     n->mac_table.multi_overflow = multi_overflow;
1112cae2e556SAmos Kong     memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
1113cae2e556SAmos Kong     g_free(macs);
1114b1be4280SAmos Kong     rxfilter_notify(nc);
1115b1be4280SAmos Kong 
11166e790746SPaolo Bonzini     return VIRTIO_NET_OK;
1117b1be4280SAmos Kong 
1118b1be4280SAmos Kong error:
1119cae2e556SAmos Kong     g_free(macs);
1120b1be4280SAmos Kong     return VIRTIO_NET_ERR;
11216e790746SPaolo Bonzini }
11226e790746SPaolo Bonzini 
11236e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
11246e790746SPaolo Bonzini                                         struct iovec *iov, unsigned int iov_cnt)
11256e790746SPaolo Bonzini {
11261399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
11276e790746SPaolo Bonzini     uint16_t vid;
11286e790746SPaolo Bonzini     size_t s;
1129b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
11306e790746SPaolo Bonzini 
11316e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
11321399c60dSRusty Russell     vid = virtio_lduw_p(vdev, &vid);
11336e790746SPaolo Bonzini     if (s != sizeof(vid)) {
11346e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11356e790746SPaolo Bonzini     }
11366e790746SPaolo Bonzini 
11376e790746SPaolo Bonzini     if (vid >= MAX_VLAN)
11386e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11396e790746SPaolo Bonzini 
11406e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
11416e790746SPaolo Bonzini         n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
11426e790746SPaolo Bonzini     else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
11436e790746SPaolo Bonzini         n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
11446e790746SPaolo Bonzini     else
11456e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11466e790746SPaolo Bonzini 
1147b1be4280SAmos Kong     rxfilter_notify(nc);
1148b1be4280SAmos Kong 
11496e790746SPaolo Bonzini     return VIRTIO_NET_OK;
11506e790746SPaolo Bonzini }
11516e790746SPaolo Bonzini 
1152f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd,
1153f57fcf70SJason Wang                                       struct iovec *iov, unsigned int iov_cnt)
1154f57fcf70SJason Wang {
11559d8c6a25SDr. David Alan Gilbert     trace_virtio_net_handle_announce(n->announce_timer.round);
1156f57fcf70SJason Wang     if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK &&
1157f57fcf70SJason Wang         n->status & VIRTIO_NET_S_ANNOUNCE) {
1158f57fcf70SJason Wang         n->status &= ~VIRTIO_NET_S_ANNOUNCE;
11599d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
11609d8c6a25SDr. David Alan Gilbert             qemu_announce_timer_step(&n->announce_timer);
1161f57fcf70SJason Wang         }
1162f57fcf70SJason Wang         return VIRTIO_NET_OK;
1163f57fcf70SJason Wang     } else {
1164f57fcf70SJason Wang         return VIRTIO_NET_ERR;
1165f57fcf70SJason Wang     }
1166f57fcf70SJason Wang }
1167f57fcf70SJason Wang 
11680145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n);
11690145c393SAndrew Melnychenko 
117059079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n)
117159079029SYuri Benditovich {
117259079029SYuri Benditovich     if (n->rss_data.enabled) {
117359079029SYuri Benditovich         trace_virtio_net_rss_disable();
117459079029SYuri Benditovich     }
117559079029SYuri Benditovich     n->rss_data.enabled = false;
11760145c393SAndrew Melnychenko 
11770145c393SAndrew Melnychenko     virtio_net_detach_epbf_rss(n);
11780145c393SAndrew Melnychenko }
11790145c393SAndrew Melnychenko 
11800145c393SAndrew Melnychenko static bool virtio_net_attach_ebpf_to_backend(NICState *nic, int prog_fd)
11810145c393SAndrew Melnychenko {
11820145c393SAndrew Melnychenko     NetClientState *nc = qemu_get_peer(qemu_get_queue(nic), 0);
11830145c393SAndrew Melnychenko     if (nc == NULL || nc->info->set_steering_ebpf == NULL) {
11840145c393SAndrew Melnychenko         return false;
11850145c393SAndrew Melnychenko     }
11860145c393SAndrew Melnychenko 
11870145c393SAndrew Melnychenko     return nc->info->set_steering_ebpf(nc, prog_fd);
11880145c393SAndrew Melnychenko }
11890145c393SAndrew Melnychenko 
11900145c393SAndrew Melnychenko static void rss_data_to_rss_config(struct VirtioNetRssData *data,
11910145c393SAndrew Melnychenko                                    struct EBPFRSSConfig *config)
11920145c393SAndrew Melnychenko {
11930145c393SAndrew Melnychenko     config->redirect = data->redirect;
11940145c393SAndrew Melnychenko     config->populate_hash = data->populate_hash;
11950145c393SAndrew Melnychenko     config->hash_types = data->hash_types;
11960145c393SAndrew Melnychenko     config->indirections_len = data->indirections_len;
11970145c393SAndrew Melnychenko     config->default_queue = data->default_queue;
11980145c393SAndrew Melnychenko }
11990145c393SAndrew Melnychenko 
12000145c393SAndrew Melnychenko static bool virtio_net_attach_epbf_rss(VirtIONet *n)
12010145c393SAndrew Melnychenko {
12020145c393SAndrew Melnychenko     struct EBPFRSSConfig config = {};
12030145c393SAndrew Melnychenko 
12040145c393SAndrew Melnychenko     if (!ebpf_rss_is_loaded(&n->ebpf_rss)) {
12050145c393SAndrew Melnychenko         return false;
12060145c393SAndrew Melnychenko     }
12070145c393SAndrew Melnychenko 
12080145c393SAndrew Melnychenko     rss_data_to_rss_config(&n->rss_data, &config);
12090145c393SAndrew Melnychenko 
12100145c393SAndrew Melnychenko     if (!ebpf_rss_set_all(&n->ebpf_rss, &config,
12110145c393SAndrew Melnychenko                           n->rss_data.indirections_table, n->rss_data.key)) {
12120145c393SAndrew Melnychenko         return false;
12130145c393SAndrew Melnychenko     }
12140145c393SAndrew Melnychenko 
12150145c393SAndrew Melnychenko     if (!virtio_net_attach_ebpf_to_backend(n->nic, n->ebpf_rss.program_fd)) {
12160145c393SAndrew Melnychenko         return false;
12170145c393SAndrew Melnychenko     }
12180145c393SAndrew Melnychenko 
12190145c393SAndrew Melnychenko     return true;
12200145c393SAndrew Melnychenko }
12210145c393SAndrew Melnychenko 
12220145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n)
12230145c393SAndrew Melnychenko {
12240145c393SAndrew Melnychenko     virtio_net_attach_ebpf_to_backend(n->nic, -1);
12250145c393SAndrew Melnychenko }
12260145c393SAndrew Melnychenko 
12270145c393SAndrew Melnychenko static bool virtio_net_load_ebpf(VirtIONet *n)
12280145c393SAndrew Melnychenko {
12290145c393SAndrew Melnychenko     if (!virtio_net_attach_ebpf_to_backend(n->nic, -1)) {
12300145c393SAndrew Melnychenko         /* backend does't support steering ebpf */
12310145c393SAndrew Melnychenko         return false;
12320145c393SAndrew Melnychenko     }
12330145c393SAndrew Melnychenko 
12340145c393SAndrew Melnychenko     return ebpf_rss_load(&n->ebpf_rss);
12350145c393SAndrew Melnychenko }
12360145c393SAndrew Melnychenko 
12370145c393SAndrew Melnychenko static void virtio_net_unload_ebpf(VirtIONet *n)
12380145c393SAndrew Melnychenko {
12390145c393SAndrew Melnychenko     virtio_net_attach_ebpf_to_backend(n->nic, -1);
12400145c393SAndrew Melnychenko     ebpf_rss_unload(&n->ebpf_rss);
124159079029SYuri Benditovich }
124259079029SYuri Benditovich 
124359079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n,
1244e22f0603SYuri Benditovich                                       struct iovec *iov,
1245e22f0603SYuri Benditovich                                       unsigned int iov_cnt,
1246e22f0603SYuri Benditovich                                       bool do_rss)
124759079029SYuri Benditovich {
124859079029SYuri Benditovich     VirtIODevice *vdev = VIRTIO_DEVICE(n);
124959079029SYuri Benditovich     struct virtio_net_rss_config cfg;
125059079029SYuri Benditovich     size_t s, offset = 0, size_get;
1251441537f1SJason Wang     uint16_t queue_pairs, i;
125259079029SYuri Benditovich     struct {
125359079029SYuri Benditovich         uint16_t us;
125459079029SYuri Benditovich         uint8_t b;
125559079029SYuri Benditovich     } QEMU_PACKED temp;
125659079029SYuri Benditovich     const char *err_msg = "";
125759079029SYuri Benditovich     uint32_t err_value = 0;
125859079029SYuri Benditovich 
1259e22f0603SYuri Benditovich     if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) {
126059079029SYuri Benditovich         err_msg = "RSS is not negotiated";
126159079029SYuri Benditovich         goto error;
126259079029SYuri Benditovich     }
1263e22f0603SYuri Benditovich     if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) {
1264e22f0603SYuri Benditovich         err_msg = "Hash report is not negotiated";
1265e22f0603SYuri Benditovich         goto error;
1266e22f0603SYuri Benditovich     }
126759079029SYuri Benditovich     size_get = offsetof(struct virtio_net_rss_config, indirection_table);
126859079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get);
126959079029SYuri Benditovich     if (s != size_get) {
127059079029SYuri Benditovich         err_msg = "Short command buffer";
127159079029SYuri Benditovich         err_value = (uint32_t)s;
127259079029SYuri Benditovich         goto error;
127359079029SYuri Benditovich     }
127459079029SYuri Benditovich     n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types);
127559079029SYuri Benditovich     n->rss_data.indirections_len =
127659079029SYuri Benditovich         virtio_lduw_p(vdev, &cfg.indirection_table_mask);
127759079029SYuri Benditovich     n->rss_data.indirections_len++;
1278e22f0603SYuri Benditovich     if (!do_rss) {
1279e22f0603SYuri Benditovich         n->rss_data.indirections_len = 1;
1280e22f0603SYuri Benditovich     }
128159079029SYuri Benditovich     if (!is_power_of_2(n->rss_data.indirections_len)) {
128259079029SYuri Benditovich         err_msg = "Invalid size of indirection table";
128359079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
128459079029SYuri Benditovich         goto error;
128559079029SYuri Benditovich     }
128659079029SYuri Benditovich     if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) {
128759079029SYuri Benditovich         err_msg = "Too large indirection table";
128859079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
128959079029SYuri Benditovich         goto error;
129059079029SYuri Benditovich     }
1291e22f0603SYuri Benditovich     n->rss_data.default_queue = do_rss ?
1292e22f0603SYuri Benditovich         virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0;
1293441537f1SJason Wang     if (n->rss_data.default_queue >= n->max_queue_pairs) {
129459079029SYuri Benditovich         err_msg = "Invalid default queue";
129559079029SYuri Benditovich         err_value = n->rss_data.default_queue;
129659079029SYuri Benditovich         goto error;
129759079029SYuri Benditovich     }
129859079029SYuri Benditovich     offset += size_get;
129959079029SYuri Benditovich     size_get = sizeof(uint16_t) * n->rss_data.indirections_len;
130059079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
130159079029SYuri Benditovich     n->rss_data.indirections_table = g_malloc(size_get);
130259079029SYuri Benditovich     if (!n->rss_data.indirections_table) {
130359079029SYuri Benditovich         err_msg = "Can't allocate indirections table";
130459079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
130559079029SYuri Benditovich         goto error;
130659079029SYuri Benditovich     }
130759079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset,
130859079029SYuri Benditovich                    n->rss_data.indirections_table, size_get);
130959079029SYuri Benditovich     if (s != size_get) {
131059079029SYuri Benditovich         err_msg = "Short indirection table buffer";
131159079029SYuri Benditovich         err_value = (uint32_t)s;
131259079029SYuri Benditovich         goto error;
131359079029SYuri Benditovich     }
131459079029SYuri Benditovich     for (i = 0; i < n->rss_data.indirections_len; ++i) {
131559079029SYuri Benditovich         uint16_t val = n->rss_data.indirections_table[i];
131659079029SYuri Benditovich         n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val);
131759079029SYuri Benditovich     }
131859079029SYuri Benditovich     offset += size_get;
131959079029SYuri Benditovich     size_get = sizeof(temp);
132059079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get);
132159079029SYuri Benditovich     if (s != size_get) {
1322441537f1SJason Wang         err_msg = "Can't get queue_pairs";
132359079029SYuri Benditovich         err_value = (uint32_t)s;
132459079029SYuri Benditovich         goto error;
132559079029SYuri Benditovich     }
1326441537f1SJason Wang     queue_pairs = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queue_pairs;
1327441537f1SJason Wang     if (queue_pairs == 0 || queue_pairs > n->max_queue_pairs) {
1328441537f1SJason Wang         err_msg = "Invalid number of queue_pairs";
1329441537f1SJason Wang         err_value = queue_pairs;
133059079029SYuri Benditovich         goto error;
133159079029SYuri Benditovich     }
133259079029SYuri Benditovich     if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) {
133359079029SYuri Benditovich         err_msg = "Invalid key size";
133459079029SYuri Benditovich         err_value = temp.b;
133559079029SYuri Benditovich         goto error;
133659079029SYuri Benditovich     }
133759079029SYuri Benditovich     if (!temp.b && n->rss_data.hash_types) {
133859079029SYuri Benditovich         err_msg = "No key provided";
133959079029SYuri Benditovich         err_value = 0;
134059079029SYuri Benditovich         goto error;
134159079029SYuri Benditovich     }
134259079029SYuri Benditovich     if (!temp.b && !n->rss_data.hash_types) {
134359079029SYuri Benditovich         virtio_net_disable_rss(n);
1344441537f1SJason Wang         return queue_pairs;
134559079029SYuri Benditovich     }
134659079029SYuri Benditovich     offset += size_get;
134759079029SYuri Benditovich     size_get = temp.b;
134859079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get);
134959079029SYuri Benditovich     if (s != size_get) {
135059079029SYuri Benditovich         err_msg = "Can get key buffer";
135159079029SYuri Benditovich         err_value = (uint32_t)s;
135259079029SYuri Benditovich         goto error;
135359079029SYuri Benditovich     }
135459079029SYuri Benditovich     n->rss_data.enabled = true;
13550145c393SAndrew Melnychenko 
13560145c393SAndrew Melnychenko     if (!n->rss_data.populate_hash) {
13570145c393SAndrew Melnychenko         if (!virtio_net_attach_epbf_rss(n)) {
13580145c393SAndrew Melnychenko             /* EBPF must be loaded for vhost */
13590145c393SAndrew Melnychenko             if (get_vhost_net(qemu_get_queue(n->nic)->peer)) {
13600145c393SAndrew Melnychenko                 warn_report("Can't load eBPF RSS for vhost");
13610145c393SAndrew Melnychenko                 goto error;
13620145c393SAndrew Melnychenko             }
13630145c393SAndrew Melnychenko             /* fallback to software RSS */
13640145c393SAndrew Melnychenko             warn_report("Can't load eBPF RSS - fallback to software RSS");
13650145c393SAndrew Melnychenko             n->rss_data.enabled_software_rss = true;
13660145c393SAndrew Melnychenko         }
13670145c393SAndrew Melnychenko     } else {
13680145c393SAndrew Melnychenko         /* use software RSS for hash populating */
13690145c393SAndrew Melnychenko         /* and detach eBPF if was loaded before */
13700145c393SAndrew Melnychenko         virtio_net_detach_epbf_rss(n);
13710145c393SAndrew Melnychenko         n->rss_data.enabled_software_rss = true;
13720145c393SAndrew Melnychenko     }
13730145c393SAndrew Melnychenko 
137459079029SYuri Benditovich     trace_virtio_net_rss_enable(n->rss_data.hash_types,
137559079029SYuri Benditovich                                 n->rss_data.indirections_len,
137659079029SYuri Benditovich                                 temp.b);
1377441537f1SJason Wang     return queue_pairs;
137859079029SYuri Benditovich error:
137959079029SYuri Benditovich     trace_virtio_net_rss_error(err_msg, err_value);
138059079029SYuri Benditovich     virtio_net_disable_rss(n);
138159079029SYuri Benditovich     return 0;
138259079029SYuri Benditovich }
138359079029SYuri Benditovich 
13846e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
13856e790746SPaolo Bonzini                                 struct iovec *iov, unsigned int iov_cnt)
13866e790746SPaolo Bonzini {
138717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1388441537f1SJason Wang     uint16_t queue_pairs;
13892a7888ccSSi-Wei Liu     NetClientState *nc = qemu_get_queue(n->nic);
13906e790746SPaolo Bonzini 
139159079029SYuri Benditovich     virtio_net_disable_rss(n);
1392e22f0603SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) {
1393441537f1SJason Wang         queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, false);
1394441537f1SJason Wang         return queue_pairs ? VIRTIO_NET_OK : VIRTIO_NET_ERR;
1395e22f0603SYuri Benditovich     }
139659079029SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) {
1397441537f1SJason Wang         queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, true);
139859079029SYuri Benditovich     } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
139959079029SYuri Benditovich         struct virtio_net_ctrl_mq mq;
140059079029SYuri Benditovich         size_t s;
140159079029SYuri Benditovich         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) {
140259079029SYuri Benditovich             return VIRTIO_NET_ERR;
140359079029SYuri Benditovich         }
14046e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
14056e790746SPaolo Bonzini         if (s != sizeof(mq)) {
14066e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
14076e790746SPaolo Bonzini         }
1408441537f1SJason Wang         queue_pairs = virtio_lduw_p(vdev, &mq.virtqueue_pairs);
14096e790746SPaolo Bonzini 
141059079029SYuri Benditovich     } else {
14116e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
14126e790746SPaolo Bonzini     }
14136e790746SPaolo Bonzini 
1414441537f1SJason Wang     if (queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
1415441537f1SJason Wang         queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
1416441537f1SJason Wang         queue_pairs > n->max_queue_pairs ||
14176e790746SPaolo Bonzini         !n->multiqueue) {
14186e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
14196e790746SPaolo Bonzini     }
14206e790746SPaolo Bonzini 
1421441537f1SJason Wang     n->curr_queue_pairs = queue_pairs;
1422ca8717f9SEugenio Pérez     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
1423ca8717f9SEugenio Pérez         /*
1424ca8717f9SEugenio Pérez          * Avoid updating the backend for a vdpa device: We're only interested
1425ca8717f9SEugenio Pérez          * in updating the device model queues.
1426ca8717f9SEugenio Pérez          */
1427ca8717f9SEugenio Pérez         return VIRTIO_NET_OK;
1428ca8717f9SEugenio Pérez     }
1429441537f1SJason Wang     /* stop the backend before changing the number of queue_pairs to avoid handling a
14306e790746SPaolo Bonzini      * disabled queue */
143117a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
1432441537f1SJason Wang     virtio_net_set_queue_pairs(n);
14336e790746SPaolo Bonzini 
14346e790746SPaolo Bonzini     return VIRTIO_NET_OK;
14356e790746SPaolo Bonzini }
1436ba7eadb5SGreg Kurz 
1437640b8a1cSEugenio Pérez size_t virtio_net_handle_ctrl_iov(VirtIODevice *vdev,
1438640b8a1cSEugenio Pérez                                   const struct iovec *in_sg, unsigned in_num,
1439640b8a1cSEugenio Pérez                                   const struct iovec *out_sg,
1440640b8a1cSEugenio Pérez                                   unsigned out_num)
14416e790746SPaolo Bonzini {
144217a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
14436e790746SPaolo Bonzini     struct virtio_net_ctrl_hdr ctrl;
14446e790746SPaolo Bonzini     virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
14456e790746SPaolo Bonzini     size_t s;
1446771b6ed3SJason Wang     struct iovec *iov, *iov2;
1447640b8a1cSEugenio Pérez 
1448640b8a1cSEugenio Pérez     if (iov_size(in_sg, in_num) < sizeof(status) ||
1449640b8a1cSEugenio Pérez         iov_size(out_sg, out_num) < sizeof(ctrl)) {
1450640b8a1cSEugenio Pérez         virtio_error(vdev, "virtio-net ctrl missing headers");
1451640b8a1cSEugenio Pérez         return 0;
1452640b8a1cSEugenio Pérez     }
1453640b8a1cSEugenio Pérez 
1454640b8a1cSEugenio Pérez     iov2 = iov = g_memdup2(out_sg, sizeof(struct iovec) * out_num);
1455640b8a1cSEugenio Pérez     s = iov_to_buf(iov, out_num, 0, &ctrl, sizeof(ctrl));
1456640b8a1cSEugenio Pérez     iov_discard_front(&iov, &out_num, sizeof(ctrl));
1457640b8a1cSEugenio Pérez     if (s != sizeof(ctrl)) {
1458640b8a1cSEugenio Pérez         status = VIRTIO_NET_ERR;
1459640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
1460640b8a1cSEugenio Pérez         status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, out_num);
1461640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
1462640b8a1cSEugenio Pérez         status = virtio_net_handle_mac(n, ctrl.cmd, iov, out_num);
1463640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
1464640b8a1cSEugenio Pérez         status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, out_num);
1465640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) {
1466640b8a1cSEugenio Pérez         status = virtio_net_handle_announce(n, ctrl.cmd, iov, out_num);
1467640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
1468640b8a1cSEugenio Pérez         status = virtio_net_handle_mq(n, ctrl.cmd, iov, out_num);
1469640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
1470640b8a1cSEugenio Pérez         status = virtio_net_handle_offloads(n, ctrl.cmd, iov, out_num);
1471640b8a1cSEugenio Pérez     }
1472640b8a1cSEugenio Pérez 
1473640b8a1cSEugenio Pérez     s = iov_from_buf(in_sg, in_num, 0, &status, sizeof(status));
1474640b8a1cSEugenio Pérez     assert(s == sizeof(status));
1475640b8a1cSEugenio Pérez 
1476640b8a1cSEugenio Pérez     g_free(iov2);
1477640b8a1cSEugenio Pérez     return sizeof(status);
1478640b8a1cSEugenio Pérez }
1479640b8a1cSEugenio Pérez 
1480640b8a1cSEugenio Pérez static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
1481640b8a1cSEugenio Pérez {
1482640b8a1cSEugenio Pérez     VirtQueueElement *elem;
14836e790746SPaolo Bonzini 
148451b19ebeSPaolo Bonzini     for (;;) {
1485640b8a1cSEugenio Pérez         size_t written;
148651b19ebeSPaolo Bonzini         elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
148751b19ebeSPaolo Bonzini         if (!elem) {
148851b19ebeSPaolo Bonzini             break;
148951b19ebeSPaolo Bonzini         }
1490640b8a1cSEugenio Pérez 
1491640b8a1cSEugenio Pérez         written = virtio_net_handle_ctrl_iov(vdev, elem->in_sg, elem->in_num,
1492640b8a1cSEugenio Pérez                                              elem->out_sg, elem->out_num);
1493640b8a1cSEugenio Pérez         if (written > 0) {
1494640b8a1cSEugenio Pérez             virtqueue_push(vq, elem, written);
1495640b8a1cSEugenio Pérez             virtio_notify(vdev, vq);
1496640b8a1cSEugenio Pérez             g_free(elem);
1497640b8a1cSEugenio Pérez         } else {
1498ba7eadb5SGreg Kurz             virtqueue_detach_element(vq, elem, 0);
1499ba7eadb5SGreg Kurz             g_free(elem);
1500ba7eadb5SGreg Kurz             break;
15016e790746SPaolo Bonzini         }
15026e790746SPaolo Bonzini     }
15036e790746SPaolo Bonzini }
15046e790746SPaolo Bonzini 
15056e790746SPaolo Bonzini /* RX */
15066e790746SPaolo Bonzini 
15076e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
15086e790746SPaolo Bonzini {
150917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
15106e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(vq));
15116e790746SPaolo Bonzini 
15126e790746SPaolo Bonzini     qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
15136e790746SPaolo Bonzini }
15146e790746SPaolo Bonzini 
1515b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc)
15166e790746SPaolo Bonzini {
15176e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
151817a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
15196e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
15206e790746SPaolo Bonzini 
152117a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
1522b8c4b67eSPhilippe Mathieu-Daudé         return false;
15236e790746SPaolo Bonzini     }
15246e790746SPaolo Bonzini 
1525441537f1SJason Wang     if (nc->queue_index >= n->curr_queue_pairs) {
1526b8c4b67eSPhilippe Mathieu-Daudé         return false;
15276e790746SPaolo Bonzini     }
15286e790746SPaolo Bonzini 
15296e790746SPaolo Bonzini     if (!virtio_queue_ready(q->rx_vq) ||
153017a0ca55SKONRAD Frederic         !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
1531b8c4b67eSPhilippe Mathieu-Daudé         return false;
15326e790746SPaolo Bonzini     }
15336e790746SPaolo Bonzini 
1534b8c4b67eSPhilippe Mathieu-Daudé     return true;
15356e790746SPaolo Bonzini }
15366e790746SPaolo Bonzini 
15376e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
15386e790746SPaolo Bonzini {
15396e790746SPaolo Bonzini     VirtIONet *n = q->n;
15406e790746SPaolo Bonzini     if (virtio_queue_empty(q->rx_vq) ||
15416e790746SPaolo Bonzini         (n->mergeable_rx_bufs &&
15426e790746SPaolo Bonzini          !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
15436e790746SPaolo Bonzini         virtio_queue_set_notification(q->rx_vq, 1);
15446e790746SPaolo Bonzini 
15456e790746SPaolo Bonzini         /* To avoid a race condition where the guest has made some buffers
15466e790746SPaolo Bonzini          * available after the above check but before notification was
15476e790746SPaolo Bonzini          * enabled, check for available buffers again.
15486e790746SPaolo Bonzini          */
15496e790746SPaolo Bonzini         if (virtio_queue_empty(q->rx_vq) ||
15506e790746SPaolo Bonzini             (n->mergeable_rx_bufs &&
15516e790746SPaolo Bonzini              !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
15526e790746SPaolo Bonzini             return 0;
15536e790746SPaolo Bonzini         }
15546e790746SPaolo Bonzini     }
15556e790746SPaolo Bonzini 
15566e790746SPaolo Bonzini     virtio_queue_set_notification(q->rx_vq, 0);
15576e790746SPaolo Bonzini     return 1;
15586e790746SPaolo Bonzini }
15596e790746SPaolo Bonzini 
15601399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr)
1561032a74a1SCédric Le Goater {
15621399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->hdr_len);
15631399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->gso_size);
15641399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_start);
15651399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_offset);
1566032a74a1SCédric Le Goater }
1567032a74a1SCédric Le Goater 
15686e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
15696e790746SPaolo Bonzini  * it never finds out that the packets don't have valid checksums.  This
15706e790746SPaolo Bonzini  * causes dhclient to get upset.  Fedora's carried a patch for ages to
15716e790746SPaolo Bonzini  * fix this with Xen but it hasn't appeared in an upstream release of
15726e790746SPaolo Bonzini  * dhclient yet.
15736e790746SPaolo Bonzini  *
15746e790746SPaolo Bonzini  * To avoid breaking existing guests, we catch udp packets and add
15756e790746SPaolo Bonzini  * checksums.  This is terrible but it's better than hacking the guest
15766e790746SPaolo Bonzini  * kernels.
15776e790746SPaolo Bonzini  *
15786e790746SPaolo Bonzini  * N.B. if we introduce a zero-copy API, this operation is no longer free so
15796e790746SPaolo Bonzini  * we should provide a mechanism to disable it to avoid polluting the host
15806e790746SPaolo Bonzini  * cache.
15816e790746SPaolo Bonzini  */
15826e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
15836e790746SPaolo Bonzini                                         uint8_t *buf, size_t size)
15846e790746SPaolo Bonzini {
15856e790746SPaolo Bonzini     if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
15866e790746SPaolo Bonzini         (size > 27 && size < 1500) && /* normal sized MTU */
15876e790746SPaolo Bonzini         (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
15886e790746SPaolo Bonzini         (buf[23] == 17) && /* ip.protocol == UDP */
15896e790746SPaolo Bonzini         (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
1590f5746335SBin Meng         net_checksum_calculate(buf, size, CSUM_UDP);
15916e790746SPaolo Bonzini         hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
15926e790746SPaolo Bonzini     }
15936e790746SPaolo Bonzini }
15946e790746SPaolo Bonzini 
15956e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
15966e790746SPaolo Bonzini                            const void *buf, size_t size)
15976e790746SPaolo Bonzini {
15986e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
15996e790746SPaolo Bonzini         /* FIXME this cast is evil */
16006e790746SPaolo Bonzini         void *wbuf = (void *)buf;
16016e790746SPaolo Bonzini         work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
16026e790746SPaolo Bonzini                                     size - n->host_hdr_len);
16031bfa316cSGreg Kurz 
16041bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
16051399c60dSRusty Russell             virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf);
16061bfa316cSGreg Kurz         }
16076e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
16086e790746SPaolo Bonzini     } else {
16096e790746SPaolo Bonzini         struct virtio_net_hdr hdr = {
16106e790746SPaolo Bonzini             .flags = 0,
16116e790746SPaolo Bonzini             .gso_type = VIRTIO_NET_HDR_GSO_NONE
16126e790746SPaolo Bonzini         };
16136e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
16146e790746SPaolo Bonzini     }
16156e790746SPaolo Bonzini }
16166e790746SPaolo Bonzini 
16176e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
16186e790746SPaolo Bonzini {
16196e790746SPaolo Bonzini     static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
16206e790746SPaolo Bonzini     static const uint8_t vlan[] = {0x81, 0x00};
16216e790746SPaolo Bonzini     uint8_t *ptr = (uint8_t *)buf;
16226e790746SPaolo Bonzini     int i;
16236e790746SPaolo Bonzini 
16246e790746SPaolo Bonzini     if (n->promisc)
16256e790746SPaolo Bonzini         return 1;
16266e790746SPaolo Bonzini 
16276e790746SPaolo Bonzini     ptr += n->host_hdr_len;
16286e790746SPaolo Bonzini 
16296e790746SPaolo Bonzini     if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
16307542d3e7SPeter Maydell         int vid = lduw_be_p(ptr + 14) & 0xfff;
16316e790746SPaolo Bonzini         if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
16326e790746SPaolo Bonzini             return 0;
16336e790746SPaolo Bonzini     }
16346e790746SPaolo Bonzini 
16356e790746SPaolo Bonzini     if (ptr[0] & 1) { // multicast
16366e790746SPaolo Bonzini         if (!memcmp(ptr, bcast, sizeof(bcast))) {
16376e790746SPaolo Bonzini             return !n->nobcast;
16386e790746SPaolo Bonzini         } else if (n->nomulti) {
16396e790746SPaolo Bonzini             return 0;
16406e790746SPaolo Bonzini         } else if (n->allmulti || n->mac_table.multi_overflow) {
16416e790746SPaolo Bonzini             return 1;
16426e790746SPaolo Bonzini         }
16436e790746SPaolo Bonzini 
16446e790746SPaolo Bonzini         for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
16456e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
16466e790746SPaolo Bonzini                 return 1;
16476e790746SPaolo Bonzini             }
16486e790746SPaolo Bonzini         }
16496e790746SPaolo Bonzini     } else { // unicast
16506e790746SPaolo Bonzini         if (n->nouni) {
16516e790746SPaolo Bonzini             return 0;
16526e790746SPaolo Bonzini         } else if (n->alluni || n->mac_table.uni_overflow) {
16536e790746SPaolo Bonzini             return 1;
16546e790746SPaolo Bonzini         } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
16556e790746SPaolo Bonzini             return 1;
16566e790746SPaolo Bonzini         }
16576e790746SPaolo Bonzini 
16586e790746SPaolo Bonzini         for (i = 0; i < n->mac_table.first_multi; i++) {
16596e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
16606e790746SPaolo Bonzini                 return 1;
16616e790746SPaolo Bonzini             }
16626e790746SPaolo Bonzini         }
16636e790746SPaolo Bonzini     }
16646e790746SPaolo Bonzini 
16656e790746SPaolo Bonzini     return 0;
16666e790746SPaolo Bonzini }
16676e790746SPaolo Bonzini 
16684474e37aSYuri Benditovich static uint8_t virtio_net_get_hash_type(bool isip4,
16694474e37aSYuri Benditovich                                         bool isip6,
16704474e37aSYuri Benditovich                                         bool isudp,
16714474e37aSYuri Benditovich                                         bool istcp,
16724474e37aSYuri Benditovich                                         uint32_t types)
16734474e37aSYuri Benditovich {
16744474e37aSYuri Benditovich     if (isip4) {
16754474e37aSYuri Benditovich         if (istcp && (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4)) {
16764474e37aSYuri Benditovich             return NetPktRssIpV4Tcp;
16774474e37aSYuri Benditovich         }
16784474e37aSYuri Benditovich         if (isudp && (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4)) {
16794474e37aSYuri Benditovich             return NetPktRssIpV4Udp;
16804474e37aSYuri Benditovich         }
16814474e37aSYuri Benditovich         if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) {
16824474e37aSYuri Benditovich             return NetPktRssIpV4;
16834474e37aSYuri Benditovich         }
16844474e37aSYuri Benditovich     } else if (isip6) {
16854474e37aSYuri Benditovich         uint32_t mask = VIRTIO_NET_RSS_HASH_TYPE_TCP_EX |
16864474e37aSYuri Benditovich                         VIRTIO_NET_RSS_HASH_TYPE_TCPv6;
16874474e37aSYuri Benditovich 
16884474e37aSYuri Benditovich         if (istcp && (types & mask)) {
16894474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) ?
16904474e37aSYuri Benditovich                 NetPktRssIpV6TcpEx : NetPktRssIpV6Tcp;
16914474e37aSYuri Benditovich         }
16924474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_UDP_EX | VIRTIO_NET_RSS_HASH_TYPE_UDPv6;
16934474e37aSYuri Benditovich         if (isudp && (types & mask)) {
16944474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) ?
16954474e37aSYuri Benditovich                 NetPktRssIpV6UdpEx : NetPktRssIpV6Udp;
16964474e37aSYuri Benditovich         }
16974474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_IP_EX | VIRTIO_NET_RSS_HASH_TYPE_IPv6;
16984474e37aSYuri Benditovich         if (types & mask) {
16994474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) ?
17004474e37aSYuri Benditovich                 NetPktRssIpV6Ex : NetPktRssIpV6;
17014474e37aSYuri Benditovich         }
17024474e37aSYuri Benditovich     }
17034474e37aSYuri Benditovich     return 0xff;
17044474e37aSYuri Benditovich }
17054474e37aSYuri Benditovich 
1706e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report,
1707e22f0603SYuri Benditovich                                    uint32_t hash)
1708e22f0603SYuri Benditovich {
1709e22f0603SYuri Benditovich     struct virtio_net_hdr_v1_hash *hdr = (void *)buf;
1710e22f0603SYuri Benditovich     hdr->hash_value = hash;
1711e22f0603SYuri Benditovich     hdr->hash_report = report;
1712e22f0603SYuri Benditovich }
1713e22f0603SYuri Benditovich 
17144474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf,
171597cd965cSPaolo Bonzini                                   size_t size)
17166e790746SPaolo Bonzini {
17176e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1718e22f0603SYuri Benditovich     unsigned int index = nc->queue_index, new_index = index;
17194474e37aSYuri Benditovich     struct NetRxPkt *pkt = n->rx_pkt;
17204474e37aSYuri Benditovich     uint8_t net_hash_type;
17214474e37aSYuri Benditovich     uint32_t hash;
17224474e37aSYuri Benditovich     bool isip4, isip6, isudp, istcp;
1723e22f0603SYuri Benditovich     static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = {
1724e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv4,
1725e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv4,
1726e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6,
1727e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6,
1728e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6_EX,
1729e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6_EX,
1730e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv4,
1731e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6,
1732e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6_EX
1733e22f0603SYuri Benditovich     };
17344474e37aSYuri Benditovich 
17354474e37aSYuri Benditovich     net_rx_pkt_set_protocols(pkt, buf + n->host_hdr_len,
17364474e37aSYuri Benditovich                              size - n->host_hdr_len);
17374474e37aSYuri Benditovich     net_rx_pkt_get_protocols(pkt, &isip4, &isip6, &isudp, &istcp);
17384474e37aSYuri Benditovich     if (isip4 && (net_rx_pkt_get_ip4_info(pkt)->fragment)) {
17394474e37aSYuri Benditovich         istcp = isudp = false;
17404474e37aSYuri Benditovich     }
17414474e37aSYuri Benditovich     if (isip6 && (net_rx_pkt_get_ip6_info(pkt)->fragment)) {
17424474e37aSYuri Benditovich         istcp = isudp = false;
17434474e37aSYuri Benditovich     }
17444474e37aSYuri Benditovich     net_hash_type = virtio_net_get_hash_type(isip4, isip6, isudp, istcp,
17454474e37aSYuri Benditovich                                              n->rss_data.hash_types);
17464474e37aSYuri Benditovich     if (net_hash_type > NetPktRssIpV6UdpEx) {
1747e22f0603SYuri Benditovich         if (n->rss_data.populate_hash) {
1748e22f0603SYuri Benditovich             virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0);
1749e22f0603SYuri Benditovich         }
1750e22f0603SYuri Benditovich         return n->rss_data.redirect ? n->rss_data.default_queue : -1;
17514474e37aSYuri Benditovich     }
17524474e37aSYuri Benditovich 
17534474e37aSYuri Benditovich     hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key);
1754e22f0603SYuri Benditovich 
1755e22f0603SYuri Benditovich     if (n->rss_data.populate_hash) {
1756e22f0603SYuri Benditovich         virtio_set_packet_hash(buf, reports[net_hash_type], hash);
1757e22f0603SYuri Benditovich     }
1758e22f0603SYuri Benditovich 
1759e22f0603SYuri Benditovich     if (n->rss_data.redirect) {
17604474e37aSYuri Benditovich         new_index = hash & (n->rss_data.indirections_len - 1);
17614474e37aSYuri Benditovich         new_index = n->rss_data.indirections_table[new_index];
17624474e37aSYuri Benditovich     }
1763e22f0603SYuri Benditovich 
1764e22f0603SYuri Benditovich     return (index == new_index) ? -1 : new_index;
17654474e37aSYuri Benditovich }
17664474e37aSYuri Benditovich 
17674474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf,
17684474e37aSYuri Benditovich                                       size_t size, bool no_rss)
17694474e37aSYuri Benditovich {
17704474e37aSYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
17716e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
177217a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1773bedd7e93SJason Wang     VirtQueueElement *elems[VIRTQUEUE_MAX_SIZE];
1774bedd7e93SJason Wang     size_t lens[VIRTQUEUE_MAX_SIZE];
17756e790746SPaolo Bonzini     struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
17766e790746SPaolo Bonzini     struct virtio_net_hdr_mrg_rxbuf mhdr;
17776e790746SPaolo Bonzini     unsigned mhdr_cnt = 0;
1778bedd7e93SJason Wang     size_t offset, i, guest_offset, j;
1779bedd7e93SJason Wang     ssize_t err;
17806e790746SPaolo Bonzini 
17816e790746SPaolo Bonzini     if (!virtio_net_can_receive(nc)) {
17826e790746SPaolo Bonzini         return -1;
17836e790746SPaolo Bonzini     }
17846e790746SPaolo Bonzini 
17850145c393SAndrew Melnychenko     if (!no_rss && n->rss_data.enabled && n->rss_data.enabled_software_rss) {
17864474e37aSYuri Benditovich         int index = virtio_net_process_rss(nc, buf, size);
17874474e37aSYuri Benditovich         if (index >= 0) {
17884474e37aSYuri Benditovich             NetClientState *nc2 = qemu_get_subqueue(n->nic, index);
17894474e37aSYuri Benditovich             return virtio_net_receive_rcu(nc2, buf, size, true);
17904474e37aSYuri Benditovich         }
17914474e37aSYuri Benditovich     }
17924474e37aSYuri Benditovich 
17936e790746SPaolo Bonzini     /* hdr_len refers to the header we supply to the guest */
17946e790746SPaolo Bonzini     if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
17956e790746SPaolo Bonzini         return 0;
17966e790746SPaolo Bonzini     }
17976e790746SPaolo Bonzini 
17986e790746SPaolo Bonzini     if (!receive_filter(n, buf, size))
17996e790746SPaolo Bonzini         return size;
18006e790746SPaolo Bonzini 
18016e790746SPaolo Bonzini     offset = i = 0;
18026e790746SPaolo Bonzini 
18036e790746SPaolo Bonzini     while (offset < size) {
180451b19ebeSPaolo Bonzini         VirtQueueElement *elem;
18056e790746SPaolo Bonzini         int len, total;
180651b19ebeSPaolo Bonzini         const struct iovec *sg;
18076e790746SPaolo Bonzini 
18086e790746SPaolo Bonzini         total = 0;
18096e790746SPaolo Bonzini 
1810bedd7e93SJason Wang         if (i == VIRTQUEUE_MAX_SIZE) {
1811bedd7e93SJason Wang             virtio_error(vdev, "virtio-net unexpected long buffer chain");
1812bedd7e93SJason Wang             err = size;
1813bedd7e93SJason Wang             goto err;
1814bedd7e93SJason Wang         }
1815bedd7e93SJason Wang 
181651b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement));
181751b19ebeSPaolo Bonzini         if (!elem) {
1818ba10b9c0SGreg Kurz             if (i) {
1819ba10b9c0SGreg Kurz                 virtio_error(vdev, "virtio-net unexpected empty queue: "
18206e790746SPaolo Bonzini                              "i %zd mergeable %d offset %zd, size %zd, "
1821019a3edbSGerd Hoffmann                              "guest hdr len %zd, host hdr len %zd "
1822019a3edbSGerd Hoffmann                              "guest features 0x%" PRIx64,
18236e790746SPaolo Bonzini                              i, n->mergeable_rx_bufs, offset, size,
1824019a3edbSGerd Hoffmann                              n->guest_hdr_len, n->host_hdr_len,
1825019a3edbSGerd Hoffmann                              vdev->guest_features);
1826ba10b9c0SGreg Kurz             }
1827bedd7e93SJason Wang             err = -1;
1828bedd7e93SJason Wang             goto err;
18296e790746SPaolo Bonzini         }
18306e790746SPaolo Bonzini 
183151b19ebeSPaolo Bonzini         if (elem->in_num < 1) {
1832ba10b9c0SGreg Kurz             virtio_error(vdev,
1833ba10b9c0SGreg Kurz                          "virtio-net receive queue contains no in buffers");
1834ba10b9c0SGreg Kurz             virtqueue_detach_element(q->rx_vq, elem, 0);
1835ba10b9c0SGreg Kurz             g_free(elem);
1836bedd7e93SJason Wang             err = -1;
1837bedd7e93SJason Wang             goto err;
18386e790746SPaolo Bonzini         }
18396e790746SPaolo Bonzini 
184051b19ebeSPaolo Bonzini         sg = elem->in_sg;
18416e790746SPaolo Bonzini         if (i == 0) {
18426e790746SPaolo Bonzini             assert(offset == 0);
18436e790746SPaolo Bonzini             if (n->mergeable_rx_bufs) {
18446e790746SPaolo Bonzini                 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
184551b19ebeSPaolo Bonzini                                     sg, elem->in_num,
18466e790746SPaolo Bonzini                                     offsetof(typeof(mhdr), num_buffers),
18476e790746SPaolo Bonzini                                     sizeof(mhdr.num_buffers));
18486e790746SPaolo Bonzini             }
18496e790746SPaolo Bonzini 
185051b19ebeSPaolo Bonzini             receive_header(n, sg, elem->in_num, buf, size);
1851e22f0603SYuri Benditovich             if (n->rss_data.populate_hash) {
1852e22f0603SYuri Benditovich                 offset = sizeof(mhdr);
1853e22f0603SYuri Benditovich                 iov_from_buf(sg, elem->in_num, offset,
1854e22f0603SYuri Benditovich                              buf + offset, n->host_hdr_len - sizeof(mhdr));
1855e22f0603SYuri Benditovich             }
18566e790746SPaolo Bonzini             offset = n->host_hdr_len;
18576e790746SPaolo Bonzini             total += n->guest_hdr_len;
18586e790746SPaolo Bonzini             guest_offset = n->guest_hdr_len;
18596e790746SPaolo Bonzini         } else {
18606e790746SPaolo Bonzini             guest_offset = 0;
18616e790746SPaolo Bonzini         }
18626e790746SPaolo Bonzini 
18636e790746SPaolo Bonzini         /* copy in packet.  ugh */
186451b19ebeSPaolo Bonzini         len = iov_from_buf(sg, elem->in_num, guest_offset,
18656e790746SPaolo Bonzini                            buf + offset, size - offset);
18666e790746SPaolo Bonzini         total += len;
18676e790746SPaolo Bonzini         offset += len;
18686e790746SPaolo Bonzini         /* If buffers can't be merged, at this point we
18696e790746SPaolo Bonzini          * must have consumed the complete packet.
18706e790746SPaolo Bonzini          * Otherwise, drop it. */
18716e790746SPaolo Bonzini         if (!n->mergeable_rx_bufs && offset < size) {
187227e57efeSLadi Prosek             virtqueue_unpop(q->rx_vq, elem, total);
187351b19ebeSPaolo Bonzini             g_free(elem);
1874bedd7e93SJason Wang             err = size;
1875bedd7e93SJason Wang             goto err;
18766e790746SPaolo Bonzini         }
18776e790746SPaolo Bonzini 
1878bedd7e93SJason Wang         elems[i] = elem;
1879bedd7e93SJason Wang         lens[i] = total;
1880bedd7e93SJason Wang         i++;
18816e790746SPaolo Bonzini     }
18826e790746SPaolo Bonzini 
18836e790746SPaolo Bonzini     if (mhdr_cnt) {
18841399c60dSRusty Russell         virtio_stw_p(vdev, &mhdr.num_buffers, i);
18856e790746SPaolo Bonzini         iov_from_buf(mhdr_sg, mhdr_cnt,
18866e790746SPaolo Bonzini                      0,
18876e790746SPaolo Bonzini                      &mhdr.num_buffers, sizeof mhdr.num_buffers);
18886e790746SPaolo Bonzini     }
18896e790746SPaolo Bonzini 
1890bedd7e93SJason Wang     for (j = 0; j < i; j++) {
1891bedd7e93SJason Wang         /* signal other side */
1892bedd7e93SJason Wang         virtqueue_fill(q->rx_vq, elems[j], lens[j], j);
1893bedd7e93SJason Wang         g_free(elems[j]);
1894bedd7e93SJason Wang     }
1895bedd7e93SJason Wang 
18966e790746SPaolo Bonzini     virtqueue_flush(q->rx_vq, i);
189717a0ca55SKONRAD Frederic     virtio_notify(vdev, q->rx_vq);
18986e790746SPaolo Bonzini 
18996e790746SPaolo Bonzini     return size;
1900bedd7e93SJason Wang 
1901bedd7e93SJason Wang err:
1902bedd7e93SJason Wang     for (j = 0; j < i; j++) {
1903abe300d9SJason Wang         virtqueue_detach_element(q->rx_vq, elems[j], lens[j]);
1904bedd7e93SJason Wang         g_free(elems[j]);
1905bedd7e93SJason Wang     }
1906bedd7e93SJason Wang 
1907bedd7e93SJason Wang     return err;
19086e790746SPaolo Bonzini }
19096e790746SPaolo Bonzini 
19102974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf,
191197cd965cSPaolo Bonzini                                   size_t size)
191297cd965cSPaolo Bonzini {
1913068ddfa9SDr. David Alan Gilbert     RCU_READ_LOCK_GUARD();
191497cd965cSPaolo Bonzini 
19154474e37aSYuri Benditovich     return virtio_net_receive_rcu(nc, buf, size, false);
191697cd965cSPaolo Bonzini }
191797cd965cSPaolo Bonzini 
19182974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain,
19192974e916SYuri Benditovich                                          const uint8_t *buf,
19202974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
19212974e916SYuri Benditovich {
19222974e916SYuri Benditovich     uint16_t ip_hdrlen;
19232974e916SYuri Benditovich     struct ip_header *ip;
19242974e916SYuri Benditovich 
19252974e916SYuri Benditovich     ip = (struct ip_header *)(buf + chain->n->guest_hdr_len
19262974e916SYuri Benditovich                               + sizeof(struct eth_header));
19272974e916SYuri Benditovich     unit->ip = (void *)ip;
19282974e916SYuri Benditovich     ip_hdrlen = (ip->ip_ver_len & 0xF) << 2;
19292974e916SYuri Benditovich     unit->ip_plen = &ip->ip_len;
19302974e916SYuri Benditovich     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen);
19312974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
19322974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen;
19332974e916SYuri Benditovich }
19342974e916SYuri Benditovich 
19352974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain,
19362974e916SYuri Benditovich                                          const uint8_t *buf,
19372974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
19382974e916SYuri Benditovich {
19392974e916SYuri Benditovich     struct ip6_header *ip6;
19402974e916SYuri Benditovich 
19412974e916SYuri Benditovich     ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len
19422974e916SYuri Benditovich                                  + sizeof(struct eth_header));
19432974e916SYuri Benditovich     unit->ip = ip6;
19442974e916SYuri Benditovich     unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
194578ee6bd0SPhilippe Mathieu-Daudé     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip)
19462974e916SYuri Benditovich                                         + sizeof(struct ip6_header));
19472974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
19482974e916SYuri Benditovich 
19492974e916SYuri Benditovich     /* There is a difference between payload lenght in ipv4 and v6,
19502974e916SYuri Benditovich        ip header is excluded in ipv6 */
19512974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen;
19522974e916SYuri Benditovich }
19532974e916SYuri Benditovich 
19542974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain,
19552974e916SYuri Benditovich                                        VirtioNetRscSeg *seg)
19562974e916SYuri Benditovich {
19572974e916SYuri Benditovich     int ret;
1958dd3d85e8SYuri Benditovich     struct virtio_net_hdr_v1 *h;
19592974e916SYuri Benditovich 
1960dd3d85e8SYuri Benditovich     h = (struct virtio_net_hdr_v1 *)seg->buf;
19612974e916SYuri Benditovich     h->flags = 0;
19622974e916SYuri Benditovich     h->gso_type = VIRTIO_NET_HDR_GSO_NONE;
19632974e916SYuri Benditovich 
19642974e916SYuri Benditovich     if (seg->is_coalesced) {
1965dd3d85e8SYuri Benditovich         h->rsc.segments = seg->packets;
1966dd3d85e8SYuri Benditovich         h->rsc.dup_acks = seg->dup_ack;
19672974e916SYuri Benditovich         h->flags = VIRTIO_NET_HDR_F_RSC_INFO;
19682974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
19692974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
19702974e916SYuri Benditovich         } else {
19712974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
19722974e916SYuri Benditovich         }
19732974e916SYuri Benditovich     }
19742974e916SYuri Benditovich 
19752974e916SYuri Benditovich     ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size);
19762974e916SYuri Benditovich     QTAILQ_REMOVE(&chain->buffers, seg, next);
19772974e916SYuri Benditovich     g_free(seg->buf);
19782974e916SYuri Benditovich     g_free(seg);
19792974e916SYuri Benditovich 
19802974e916SYuri Benditovich     return ret;
19812974e916SYuri Benditovich }
19822974e916SYuri Benditovich 
19832974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq)
19842974e916SYuri Benditovich {
19852974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn;
19862974e916SYuri Benditovich     VirtioNetRscChain *chain = (VirtioNetRscChain *)opq;
19872974e916SYuri Benditovich 
19882974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) {
19892974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
19902974e916SYuri Benditovich             chain->stat.purge_failed++;
19912974e916SYuri Benditovich             continue;
19922974e916SYuri Benditovich         }
19932974e916SYuri Benditovich     }
19942974e916SYuri Benditovich 
19952974e916SYuri Benditovich     chain->stat.timer++;
19962974e916SYuri Benditovich     if (!QTAILQ_EMPTY(&chain->buffers)) {
19972974e916SYuri Benditovich         timer_mod(chain->drain_timer,
19982974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
19992974e916SYuri Benditovich     }
20002974e916SYuri Benditovich }
20012974e916SYuri Benditovich 
20022974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n)
20032974e916SYuri Benditovich {
20042974e916SYuri Benditovich     VirtioNetRscChain *chain, *rn_chain;
20052974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn_seg;
20062974e916SYuri Benditovich 
20072974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) {
20082974e916SYuri Benditovich         QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) {
20092974e916SYuri Benditovich             QTAILQ_REMOVE(&chain->buffers, seg, next);
20102974e916SYuri Benditovich             g_free(seg->buf);
20112974e916SYuri Benditovich             g_free(seg);
20122974e916SYuri Benditovich         }
20132974e916SYuri Benditovich 
20142974e916SYuri Benditovich         timer_free(chain->drain_timer);
20152974e916SYuri Benditovich         QTAILQ_REMOVE(&n->rsc_chains, chain, next);
20162974e916SYuri Benditovich         g_free(chain);
20172974e916SYuri Benditovich     }
20182974e916SYuri Benditovich }
20192974e916SYuri Benditovich 
20202974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain,
20212974e916SYuri Benditovich                                      NetClientState *nc,
20222974e916SYuri Benditovich                                      const uint8_t *buf, size_t size)
20232974e916SYuri Benditovich {
20242974e916SYuri Benditovich     uint16_t hdr_len;
20252974e916SYuri Benditovich     VirtioNetRscSeg *seg;
20262974e916SYuri Benditovich 
20272974e916SYuri Benditovich     hdr_len = chain->n->guest_hdr_len;
2028b21e2380SMarkus Armbruster     seg = g_new(VirtioNetRscSeg, 1);
20292974e916SYuri Benditovich     seg->buf = g_malloc(hdr_len + sizeof(struct eth_header)
20302974e916SYuri Benditovich         + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD);
20312974e916SYuri Benditovich     memcpy(seg->buf, buf, size);
20322974e916SYuri Benditovich     seg->size = size;
20332974e916SYuri Benditovich     seg->packets = 1;
20342974e916SYuri Benditovich     seg->dup_ack = 0;
20352974e916SYuri Benditovich     seg->is_coalesced = 0;
20362974e916SYuri Benditovich     seg->nc = nc;
20372974e916SYuri Benditovich 
20382974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&chain->buffers, seg, next);
20392974e916SYuri Benditovich     chain->stat.cache++;
20402974e916SYuri Benditovich 
20412974e916SYuri Benditovich     switch (chain->proto) {
20422974e916SYuri Benditovich     case ETH_P_IP:
20432974e916SYuri Benditovich         virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit);
20442974e916SYuri Benditovich         break;
20452974e916SYuri Benditovich     case ETH_P_IPV6:
20462974e916SYuri Benditovich         virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit);
20472974e916SYuri Benditovich         break;
20482974e916SYuri Benditovich     default:
20492974e916SYuri Benditovich         g_assert_not_reached();
20502974e916SYuri Benditovich     }
20512974e916SYuri Benditovich }
20522974e916SYuri Benditovich 
20532974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain,
20542974e916SYuri Benditovich                                          VirtioNetRscSeg *seg,
20552974e916SYuri Benditovich                                          const uint8_t *buf,
20562974e916SYuri Benditovich                                          struct tcp_header *n_tcp,
20572974e916SYuri Benditovich                                          struct tcp_header *o_tcp)
20582974e916SYuri Benditovich {
20592974e916SYuri Benditovich     uint32_t nack, oack;
20602974e916SYuri Benditovich     uint16_t nwin, owin;
20612974e916SYuri Benditovich 
20622974e916SYuri Benditovich     nack = htonl(n_tcp->th_ack);
20632974e916SYuri Benditovich     nwin = htons(n_tcp->th_win);
20642974e916SYuri Benditovich     oack = htonl(o_tcp->th_ack);
20652974e916SYuri Benditovich     owin = htons(o_tcp->th_win);
20662974e916SYuri Benditovich 
20672974e916SYuri Benditovich     if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) {
20682974e916SYuri Benditovich         chain->stat.ack_out_of_win++;
20692974e916SYuri Benditovich         return RSC_FINAL;
20702974e916SYuri Benditovich     } else if (nack == oack) {
20712974e916SYuri Benditovich         /* duplicated ack or window probe */
20722974e916SYuri Benditovich         if (nwin == owin) {
20732974e916SYuri Benditovich             /* duplicated ack, add dup ack count due to whql test up to 1 */
20742974e916SYuri Benditovich             chain->stat.dup_ack++;
20752974e916SYuri Benditovich             return RSC_FINAL;
20762974e916SYuri Benditovich         } else {
20772974e916SYuri Benditovich             /* Coalesce window update */
20782974e916SYuri Benditovich             o_tcp->th_win = n_tcp->th_win;
20792974e916SYuri Benditovich             chain->stat.win_update++;
20802974e916SYuri Benditovich             return RSC_COALESCE;
20812974e916SYuri Benditovich         }
20822974e916SYuri Benditovich     } else {
20832974e916SYuri Benditovich         /* pure ack, go to 'C', finalize*/
20842974e916SYuri Benditovich         chain->stat.pure_ack++;
20852974e916SYuri Benditovich         return RSC_FINAL;
20862974e916SYuri Benditovich     }
20872974e916SYuri Benditovich }
20882974e916SYuri Benditovich 
20892974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain,
20902974e916SYuri Benditovich                                             VirtioNetRscSeg *seg,
20912974e916SYuri Benditovich                                             const uint8_t *buf,
20922974e916SYuri Benditovich                                             VirtioNetRscUnit *n_unit)
20932974e916SYuri Benditovich {
20942974e916SYuri Benditovich     void *data;
20952974e916SYuri Benditovich     uint16_t o_ip_len;
20962974e916SYuri Benditovich     uint32_t nseq, oseq;
20972974e916SYuri Benditovich     VirtioNetRscUnit *o_unit;
20982974e916SYuri Benditovich 
20992974e916SYuri Benditovich     o_unit = &seg->unit;
21002974e916SYuri Benditovich     o_ip_len = htons(*o_unit->ip_plen);
21012974e916SYuri Benditovich     nseq = htonl(n_unit->tcp->th_seq);
21022974e916SYuri Benditovich     oseq = htonl(o_unit->tcp->th_seq);
21032974e916SYuri Benditovich 
21042974e916SYuri Benditovich     /* out of order or retransmitted. */
21052974e916SYuri Benditovich     if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) {
21062974e916SYuri Benditovich         chain->stat.data_out_of_win++;
21072974e916SYuri Benditovich         return RSC_FINAL;
21082974e916SYuri Benditovich     }
21092974e916SYuri Benditovich 
21102974e916SYuri Benditovich     data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen;
21112974e916SYuri Benditovich     if (nseq == oseq) {
21122974e916SYuri Benditovich         if ((o_unit->payload == 0) && n_unit->payload) {
21132974e916SYuri Benditovich             /* From no payload to payload, normal case, not a dup ack or etc */
21142974e916SYuri Benditovich             chain->stat.data_after_pure_ack++;
21152974e916SYuri Benditovich             goto coalesce;
21162974e916SYuri Benditovich         } else {
21172974e916SYuri Benditovich             return virtio_net_rsc_handle_ack(chain, seg, buf,
21182974e916SYuri Benditovich                                              n_unit->tcp, o_unit->tcp);
21192974e916SYuri Benditovich         }
21202974e916SYuri Benditovich     } else if ((nseq - oseq) != o_unit->payload) {
21212974e916SYuri Benditovich         /* Not a consistent packet, out of order */
21222974e916SYuri Benditovich         chain->stat.data_out_of_order++;
21232974e916SYuri Benditovich         return RSC_FINAL;
21242974e916SYuri Benditovich     } else {
21252974e916SYuri Benditovich coalesce:
21262974e916SYuri Benditovich         if ((o_ip_len + n_unit->payload) > chain->max_payload) {
21272974e916SYuri Benditovich             chain->stat.over_size++;
21282974e916SYuri Benditovich             return RSC_FINAL;
21292974e916SYuri Benditovich         }
21302974e916SYuri Benditovich 
21312974e916SYuri Benditovich         /* Here comes the right data, the payload length in v4/v6 is different,
21322974e916SYuri Benditovich            so use the field value to update and record the new data len */
21332974e916SYuri Benditovich         o_unit->payload += n_unit->payload; /* update new data len */
21342974e916SYuri Benditovich 
21352974e916SYuri Benditovich         /* update field in ip header */
21362974e916SYuri Benditovich         *o_unit->ip_plen = htons(o_ip_len + n_unit->payload);
21372974e916SYuri Benditovich 
21382974e916SYuri Benditovich         /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced
21392974e916SYuri Benditovich            for windows guest, while this may change the behavior for linux
21402974e916SYuri Benditovich            guest (only if it uses RSC feature). */
21412974e916SYuri Benditovich         o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags;
21422974e916SYuri Benditovich 
21432974e916SYuri Benditovich         o_unit->tcp->th_ack = n_unit->tcp->th_ack;
21442974e916SYuri Benditovich         o_unit->tcp->th_win = n_unit->tcp->th_win;
21452974e916SYuri Benditovich 
21462974e916SYuri Benditovich         memmove(seg->buf + seg->size, data, n_unit->payload);
21472974e916SYuri Benditovich         seg->size += n_unit->payload;
21482974e916SYuri Benditovich         seg->packets++;
21492974e916SYuri Benditovich         chain->stat.coalesced++;
21502974e916SYuri Benditovich         return RSC_COALESCE;
21512974e916SYuri Benditovich     }
21522974e916SYuri Benditovich }
21532974e916SYuri Benditovich 
21542974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain,
21552974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
21562974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
21572974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
21582974e916SYuri Benditovich {
21592974e916SYuri Benditovich     struct ip_header *ip1, *ip2;
21602974e916SYuri Benditovich 
21612974e916SYuri Benditovich     ip1 = (struct ip_header *)(unit->ip);
21622974e916SYuri Benditovich     ip2 = (struct ip_header *)(seg->unit.ip);
21632974e916SYuri Benditovich     if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst)
21642974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
21652974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
21662974e916SYuri Benditovich         chain->stat.no_match++;
21672974e916SYuri Benditovich         return RSC_NO_MATCH;
21682974e916SYuri Benditovich     }
21692974e916SYuri Benditovich 
21702974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
21712974e916SYuri Benditovich }
21722974e916SYuri Benditovich 
21732974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain,
21742974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
21752974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
21762974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
21772974e916SYuri Benditovich {
21782974e916SYuri Benditovich     struct ip6_header *ip1, *ip2;
21792974e916SYuri Benditovich 
21802974e916SYuri Benditovich     ip1 = (struct ip6_header *)(unit->ip);
21812974e916SYuri Benditovich     ip2 = (struct ip6_header *)(seg->unit.ip);
21822974e916SYuri Benditovich     if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address))
21832974e916SYuri Benditovich         || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address))
21842974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
21852974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
21862974e916SYuri Benditovich             chain->stat.no_match++;
21872974e916SYuri Benditovich             return RSC_NO_MATCH;
21882974e916SYuri Benditovich     }
21892974e916SYuri Benditovich 
21902974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
21912974e916SYuri Benditovich }
21922974e916SYuri Benditovich 
21932974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain
21942974e916SYuri Benditovich  * to prevent out of order */
21952974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain,
21962974e916SYuri Benditovich                                          struct tcp_header *tcp)
21972974e916SYuri Benditovich {
21982974e916SYuri Benditovich     uint16_t tcp_hdr;
21992974e916SYuri Benditovich     uint16_t tcp_flag;
22002974e916SYuri Benditovich 
22012974e916SYuri Benditovich     tcp_flag = htons(tcp->th_offset_flags);
22022974e916SYuri Benditovich     tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10;
22032974e916SYuri Benditovich     tcp_flag &= VIRTIO_NET_TCP_FLAG;
22042974e916SYuri Benditovich     if (tcp_flag & TH_SYN) {
22052974e916SYuri Benditovich         chain->stat.tcp_syn++;
22062974e916SYuri Benditovich         return RSC_BYPASS;
22072974e916SYuri Benditovich     }
22082974e916SYuri Benditovich 
22092974e916SYuri Benditovich     if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) {
22102974e916SYuri Benditovich         chain->stat.tcp_ctrl_drain++;
22112974e916SYuri Benditovich         return RSC_FINAL;
22122974e916SYuri Benditovich     }
22132974e916SYuri Benditovich 
22142974e916SYuri Benditovich     if (tcp_hdr > sizeof(struct tcp_header)) {
22152974e916SYuri Benditovich         chain->stat.tcp_all_opt++;
22162974e916SYuri Benditovich         return RSC_FINAL;
22172974e916SYuri Benditovich     }
22182974e916SYuri Benditovich 
22192974e916SYuri Benditovich     return RSC_CANDIDATE;
22202974e916SYuri Benditovich }
22212974e916SYuri Benditovich 
22222974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain,
22232974e916SYuri Benditovich                                          NetClientState *nc,
22242974e916SYuri Benditovich                                          const uint8_t *buf, size_t size,
22252974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
22262974e916SYuri Benditovich {
22272974e916SYuri Benditovich     int ret;
22282974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
22292974e916SYuri Benditovich 
22302974e916SYuri Benditovich     if (QTAILQ_EMPTY(&chain->buffers)) {
22312974e916SYuri Benditovich         chain->stat.empty_cache++;
22322974e916SYuri Benditovich         virtio_net_rsc_cache_buf(chain, nc, buf, size);
22332974e916SYuri Benditovich         timer_mod(chain->drain_timer,
22342974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
22352974e916SYuri Benditovich         return size;
22362974e916SYuri Benditovich     }
22372974e916SYuri Benditovich 
22382974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
22392974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
22402974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit);
22412974e916SYuri Benditovich         } else {
22422974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit);
22432974e916SYuri Benditovich         }
22442974e916SYuri Benditovich 
22452974e916SYuri Benditovich         if (ret == RSC_FINAL) {
22462974e916SYuri Benditovich             if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
22472974e916SYuri Benditovich                 /* Send failed */
22482974e916SYuri Benditovich                 chain->stat.final_failed++;
22492974e916SYuri Benditovich                 return 0;
22502974e916SYuri Benditovich             }
22512974e916SYuri Benditovich 
22522974e916SYuri Benditovich             /* Send current packet */
22532974e916SYuri Benditovich             return virtio_net_do_receive(nc, buf, size);
22542974e916SYuri Benditovich         } else if (ret == RSC_NO_MATCH) {
22552974e916SYuri Benditovich             continue;
22562974e916SYuri Benditovich         } else {
22572974e916SYuri Benditovich             /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */
22582974e916SYuri Benditovich             seg->is_coalesced = 1;
22592974e916SYuri Benditovich             return size;
22602974e916SYuri Benditovich         }
22612974e916SYuri Benditovich     }
22622974e916SYuri Benditovich 
22632974e916SYuri Benditovich     chain->stat.no_match_cache++;
22642974e916SYuri Benditovich     virtio_net_rsc_cache_buf(chain, nc, buf, size);
22652974e916SYuri Benditovich     return size;
22662974e916SYuri Benditovich }
22672974e916SYuri Benditovich 
22682974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */
22692974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain,
22702974e916SYuri Benditovich                                         NetClientState *nc,
22712974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
22722974e916SYuri Benditovich                                         uint16_t ip_start, uint16_t ip_size,
22732974e916SYuri Benditovich                                         uint16_t tcp_port)
22742974e916SYuri Benditovich {
22752974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
22762974e916SYuri Benditovich     uint32_t ppair1, ppair2;
22772974e916SYuri Benditovich 
22782974e916SYuri Benditovich     ppair1 = *(uint32_t *)(buf + tcp_port);
22792974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
22802974e916SYuri Benditovich         ppair2 = *(uint32_t *)(seg->buf + tcp_port);
22812974e916SYuri Benditovich         if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size)
22822974e916SYuri Benditovich             || (ppair1 != ppair2)) {
22832974e916SYuri Benditovich             continue;
22842974e916SYuri Benditovich         }
22852974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
22862974e916SYuri Benditovich             chain->stat.drain_failed++;
22872974e916SYuri Benditovich         }
22882974e916SYuri Benditovich 
22892974e916SYuri Benditovich         break;
22902974e916SYuri Benditovich     }
22912974e916SYuri Benditovich 
22922974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
22932974e916SYuri Benditovich }
22942974e916SYuri Benditovich 
22952974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain,
22962974e916SYuri Benditovich                                             struct ip_header *ip,
22972974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
22982974e916SYuri Benditovich {
22992974e916SYuri Benditovich     uint16_t ip_len;
23002974e916SYuri Benditovich 
23012974e916SYuri Benditovich     /* Not an ipv4 packet */
23022974e916SYuri Benditovich     if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) {
23032974e916SYuri Benditovich         chain->stat.ip_option++;
23042974e916SYuri Benditovich         return RSC_BYPASS;
23052974e916SYuri Benditovich     }
23062974e916SYuri Benditovich 
23072974e916SYuri Benditovich     /* Don't handle packets with ip option */
23082974e916SYuri Benditovich     if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) {
23092974e916SYuri Benditovich         chain->stat.ip_option++;
23102974e916SYuri Benditovich         return RSC_BYPASS;
23112974e916SYuri Benditovich     }
23122974e916SYuri Benditovich 
23132974e916SYuri Benditovich     if (ip->ip_p != IPPROTO_TCP) {
23142974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
23152974e916SYuri Benditovich         return RSC_BYPASS;
23162974e916SYuri Benditovich     }
23172974e916SYuri Benditovich 
23182974e916SYuri Benditovich     /* Don't handle packets with ip fragment */
23192974e916SYuri Benditovich     if (!(htons(ip->ip_off) & IP_DF)) {
23202974e916SYuri Benditovich         chain->stat.ip_frag++;
23212974e916SYuri Benditovich         return RSC_BYPASS;
23222974e916SYuri Benditovich     }
23232974e916SYuri Benditovich 
23242974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
23252974e916SYuri Benditovich     if (IPTOS_ECN(ip->ip_tos)) {
23262974e916SYuri Benditovich         chain->stat.ip_ecn++;
23272974e916SYuri Benditovich         return RSC_BYPASS;
23282974e916SYuri Benditovich     }
23292974e916SYuri Benditovich 
23302974e916SYuri Benditovich     ip_len = htons(ip->ip_len);
23312974e916SYuri Benditovich     if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header))
23322974e916SYuri Benditovich         || ip_len > (size - chain->n->guest_hdr_len -
23332974e916SYuri Benditovich                      sizeof(struct eth_header))) {
23342974e916SYuri Benditovich         chain->stat.ip_hacked++;
23352974e916SYuri Benditovich         return RSC_BYPASS;
23362974e916SYuri Benditovich     }
23372974e916SYuri Benditovich 
23382974e916SYuri Benditovich     return RSC_CANDIDATE;
23392974e916SYuri Benditovich }
23402974e916SYuri Benditovich 
23412974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain,
23422974e916SYuri Benditovich                                       NetClientState *nc,
23432974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
23442974e916SYuri Benditovich {
23452974e916SYuri Benditovich     int32_t ret;
23462974e916SYuri Benditovich     uint16_t hdr_len;
23472974e916SYuri Benditovich     VirtioNetRscUnit unit;
23482974e916SYuri Benditovich 
23492974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
23502974e916SYuri Benditovich 
23512974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)
23522974e916SYuri Benditovich         + sizeof(struct tcp_header))) {
23532974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
23542974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23552974e916SYuri Benditovich     }
23562974e916SYuri Benditovich 
23572974e916SYuri Benditovich     virtio_net_rsc_extract_unit4(chain, buf, &unit);
23582974e916SYuri Benditovich     if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size)
23592974e916SYuri Benditovich         != RSC_CANDIDATE) {
23602974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23612974e916SYuri Benditovich     }
23622974e916SYuri Benditovich 
23632974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
23642974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
23652974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23662974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
23672974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
23682974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 12),
23692974e916SYuri Benditovich                 VIRTIO_NET_IP4_ADDR_SIZE,
23702974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header));
23712974e916SYuri Benditovich     }
23722974e916SYuri Benditovich 
23732974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
23742974e916SYuri Benditovich }
23752974e916SYuri Benditovich 
23762974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain,
23772974e916SYuri Benditovich                                             struct ip6_header *ip6,
23782974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
23792974e916SYuri Benditovich {
23802974e916SYuri Benditovich     uint16_t ip_len;
23812974e916SYuri Benditovich 
23822974e916SYuri Benditovich     if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4)
23832974e916SYuri Benditovich         != IP_HEADER_VERSION_6) {
23842974e916SYuri Benditovich         return RSC_BYPASS;
23852974e916SYuri Benditovich     }
23862974e916SYuri Benditovich 
23872974e916SYuri Benditovich     /* Both option and protocol is checked in this */
23882974e916SYuri Benditovich     if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) {
23892974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
23902974e916SYuri Benditovich         return RSC_BYPASS;
23912974e916SYuri Benditovich     }
23922974e916SYuri Benditovich 
23932974e916SYuri Benditovich     ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
23942974e916SYuri Benditovich     if (ip_len < sizeof(struct tcp_header) ||
23952974e916SYuri Benditovich         ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header)
23962974e916SYuri Benditovich                   - sizeof(struct ip6_header))) {
23972974e916SYuri Benditovich         chain->stat.ip_hacked++;
23982974e916SYuri Benditovich         return RSC_BYPASS;
23992974e916SYuri Benditovich     }
24002974e916SYuri Benditovich 
24012974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
24022974e916SYuri Benditovich     if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) {
24032974e916SYuri Benditovich         chain->stat.ip_ecn++;
24042974e916SYuri Benditovich         return RSC_BYPASS;
24052974e916SYuri Benditovich     }
24062974e916SYuri Benditovich 
24072974e916SYuri Benditovich     return RSC_CANDIDATE;
24082974e916SYuri Benditovich }
24092974e916SYuri Benditovich 
24102974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc,
24112974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
24122974e916SYuri Benditovich {
24132974e916SYuri Benditovich     int32_t ret;
24142974e916SYuri Benditovich     uint16_t hdr_len;
24152974e916SYuri Benditovich     VirtioNetRscChain *chain;
24162974e916SYuri Benditovich     VirtioNetRscUnit unit;
24172974e916SYuri Benditovich 
24182974e916SYuri Benditovich     chain = (VirtioNetRscChain *)opq;
24192974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
24202974e916SYuri Benditovich 
24212974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header)
24222974e916SYuri Benditovich         + sizeof(tcp_header))) {
24232974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24242974e916SYuri Benditovich     }
24252974e916SYuri Benditovich 
24262974e916SYuri Benditovich     virtio_net_rsc_extract_unit6(chain, buf, &unit);
24272974e916SYuri Benditovich     if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain,
24282974e916SYuri Benditovich                                                  unit.ip, buf, size)) {
24292974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24302974e916SYuri Benditovich     }
24312974e916SYuri Benditovich 
24322974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
24332974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
24342974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24352974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
24362974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
24372974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 8),
24382974e916SYuri Benditovich                 VIRTIO_NET_IP6_ADDR_SIZE,
24392974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header)
24402974e916SYuri Benditovich                 + sizeof(struct ip6_header));
24412974e916SYuri Benditovich     }
24422974e916SYuri Benditovich 
24432974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
24442974e916SYuri Benditovich }
24452974e916SYuri Benditovich 
24462974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n,
24472974e916SYuri Benditovich                                                       NetClientState *nc,
24482974e916SYuri Benditovich                                                       uint16_t proto)
24492974e916SYuri Benditovich {
24502974e916SYuri Benditovich     VirtioNetRscChain *chain;
24512974e916SYuri Benditovich 
24522974e916SYuri Benditovich     if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) {
24532974e916SYuri Benditovich         return NULL;
24542974e916SYuri Benditovich     }
24552974e916SYuri Benditovich 
24562974e916SYuri Benditovich     QTAILQ_FOREACH(chain, &n->rsc_chains, next) {
24572974e916SYuri Benditovich         if (chain->proto == proto) {
24582974e916SYuri Benditovich             return chain;
24592974e916SYuri Benditovich         }
24602974e916SYuri Benditovich     }
24612974e916SYuri Benditovich 
24622974e916SYuri Benditovich     chain = g_malloc(sizeof(*chain));
24632974e916SYuri Benditovich     chain->n = n;
24642974e916SYuri Benditovich     chain->proto = proto;
24652974e916SYuri Benditovich     if (proto == (uint16_t)ETH_P_IP) {
24662974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD;
24672974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
24682974e916SYuri Benditovich     } else {
24692974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD;
24702974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
24712974e916SYuri Benditovich     }
24722974e916SYuri Benditovich     chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST,
24732974e916SYuri Benditovich                                       virtio_net_rsc_purge, chain);
24742974e916SYuri Benditovich     memset(&chain->stat, 0, sizeof(chain->stat));
24752974e916SYuri Benditovich 
24762974e916SYuri Benditovich     QTAILQ_INIT(&chain->buffers);
24772974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next);
24782974e916SYuri Benditovich 
24792974e916SYuri Benditovich     return chain;
24802974e916SYuri Benditovich }
24812974e916SYuri Benditovich 
24822974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc,
24832974e916SYuri Benditovich                                       const uint8_t *buf,
24842974e916SYuri Benditovich                                       size_t size)
24852974e916SYuri Benditovich {
24862974e916SYuri Benditovich     uint16_t proto;
24872974e916SYuri Benditovich     VirtioNetRscChain *chain;
24882974e916SYuri Benditovich     struct eth_header *eth;
24892974e916SYuri Benditovich     VirtIONet *n;
24902974e916SYuri Benditovich 
24912974e916SYuri Benditovich     n = qemu_get_nic_opaque(nc);
24922974e916SYuri Benditovich     if (size < (n->host_hdr_len + sizeof(struct eth_header))) {
24932974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24942974e916SYuri Benditovich     }
24952974e916SYuri Benditovich 
24962974e916SYuri Benditovich     eth = (struct eth_header *)(buf + n->guest_hdr_len);
24972974e916SYuri Benditovich     proto = htons(eth->h_proto);
24982974e916SYuri Benditovich 
24992974e916SYuri Benditovich     chain = virtio_net_rsc_lookup_chain(n, nc, proto);
25002974e916SYuri Benditovich     if (chain) {
25012974e916SYuri Benditovich         chain->stat.received++;
25022974e916SYuri Benditovich         if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) {
25032974e916SYuri Benditovich             return virtio_net_rsc_receive4(chain, nc, buf, size);
25042974e916SYuri Benditovich         } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) {
25052974e916SYuri Benditovich             return virtio_net_rsc_receive6(chain, nc, buf, size);
25062974e916SYuri Benditovich         }
25072974e916SYuri Benditovich     }
25082974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
25092974e916SYuri Benditovich }
25102974e916SYuri Benditovich 
25112974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf,
25122974e916SYuri Benditovich                                   size_t size)
25132974e916SYuri Benditovich {
25142974e916SYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
25152974e916SYuri Benditovich     if ((n->rsc4_enabled || n->rsc6_enabled)) {
25162974e916SYuri Benditovich         return virtio_net_rsc_receive(nc, buf, size);
25172974e916SYuri Benditovich     } else {
25182974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
25192974e916SYuri Benditovich     }
25202974e916SYuri Benditovich }
25212974e916SYuri Benditovich 
25226e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
25236e790746SPaolo Bonzini 
25246e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
25256e790746SPaolo Bonzini {
25266e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
25276e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
252817a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2529*df8d0708SLaurent Vivier     int ret;
25306e790746SPaolo Bonzini 
253151b19ebeSPaolo Bonzini     virtqueue_push(q->tx_vq, q->async_tx.elem, 0);
253217a0ca55SKONRAD Frederic     virtio_notify(vdev, q->tx_vq);
25336e790746SPaolo Bonzini 
253451b19ebeSPaolo Bonzini     g_free(q->async_tx.elem);
253551b19ebeSPaolo Bonzini     q->async_tx.elem = NULL;
25366e790746SPaolo Bonzini 
25376e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2538*df8d0708SLaurent Vivier     ret = virtio_net_flush_tx(q);
2539*df8d0708SLaurent Vivier     if (q->tx_bh && ret >= n->tx_burst) {
2540*df8d0708SLaurent Vivier         /*
2541*df8d0708SLaurent Vivier          * the flush has been stopped by tx_burst
2542*df8d0708SLaurent Vivier          * we will not receive notification for the
2543*df8d0708SLaurent Vivier          * remainining part, so re-schedule
2544*df8d0708SLaurent Vivier          */
2545*df8d0708SLaurent Vivier         virtio_queue_set_notification(q->tx_vq, 0);
2546*df8d0708SLaurent Vivier         qemu_bh_schedule(q->tx_bh);
2547*df8d0708SLaurent Vivier         q->tx_waiting = 1;
2548*df8d0708SLaurent Vivier     }
25496e790746SPaolo Bonzini }
25506e790746SPaolo Bonzini 
/* TX */
/*
 * Pop elements from the TX virtqueue of @q and pass them to the network
 * backend, at most n->tx_burst packets per call.
 *
 * Returns:
 *   >= 0     number of elements completed in this call (0 when the driver
 *            is not DRIVER_OK or an asynchronous send is still pending)
 *   -EINVAL  an element was malformed; virtio_error() has been raised
 *   -EBUSY   the backend returned 0 for the send; the element is kept in
 *            q->async_tx.elem and virtio_net_tx_complete() is the callback
 *            passed to the backend for it
 */
static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
{
    VirtIONet *n = q->n;
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    VirtQueueElement *elem;
    int32_t num_packets = 0;
    int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
    if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
        return num_packets;
    }

    /* A previous packet is still in flight: keep notifications off */
    if (q->async_tx.elem) {
        virtio_queue_set_notification(q->tx_vq, 0);
        return num_packets;
    }

    for (;;) {
        ssize_t ret;
        unsigned int out_num;
        struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg;
        struct virtio_net_hdr_mrg_rxbuf mhdr;

        elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement));
        if (!elem) {
            break;
        }

        out_num = elem->out_num;
        out_sg = elem->out_sg;
        if (out_num < 1) {
            virtio_error(vdev, "virtio-net header not in first element");
            virtqueue_detach_element(q->tx_vq, elem, 0);
            g_free(elem);
            return -EINVAL;
        }

        if (n->has_vnet_hdr) {
            /* Copy the guest header out; a short copy means a bad element */
            if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) <
                n->guest_hdr_len) {
                virtio_error(vdev, "virtio-net header incorrect");
                virtqueue_detach_element(q->tx_vq, elem, 0);
                g_free(elem);
                return -EINVAL;
            }
            if (n->needs_vnet_hdr_swap) {
                /*
                 * Send the swapped copy of the header as sg2[0], followed by
                 * the rest of the guest buffers with the original header
                 * skipped.
                 */
                virtio_net_hdr_swap(vdev, (void *) &mhdr);
                sg2[0].iov_base = &mhdr;
                sg2[0].iov_len = n->guest_hdr_len;
                out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1,
                                   out_sg, out_num,
                                   n->guest_hdr_len, -1);
                /*
                 * iov_copy() used every slot it was given: the element is
                 * completed without being sent.
                 */
                if (out_num == VIRTQUEUE_MAX_SIZE) {
                    goto drop;
                }
                out_num += 1;
                out_sg = sg2;
            }
        }
        /*
         * If host wants to see the guest header as is, we can
         * pass it on unchanged. Otherwise, copy just the parts
         * that host is interested in.
         */
        assert(n->host_hdr_len <= n->guest_hdr_len);
        if (n->host_hdr_len != n->guest_hdr_len) {
            /* First host_hdr_len header bytes, then everything after the
             * guest header */
            unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
                                       out_sg, out_num,
                                       0, n->host_hdr_len);
            sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
                             out_sg, out_num,
                             n->guest_hdr_len, -1);
            out_num = sg_num;
            out_sg = sg;
        }

        ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
                                      out_sg, out_num, virtio_net_tx_complete);
        if (ret == 0) {
            /* Keep the element until virtio_net_tx_complete() handles it */
            virtio_queue_set_notification(q->tx_vq, 0);
            q->async_tx.elem = elem;
            return -EBUSY;
        }

drop:
        /* Any non-zero send result, or a dropped element, ends up here */
        virtqueue_push(q->tx_vq, elem, 0);
        virtio_notify(vdev, q->tx_vq);
        g_free(elem);

        if (++num_packets >= n->tx_burst) {
            break;
        }
    }
    return num_packets;
}
26466e790746SPaolo Bonzini 
26476e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
26486e790746SPaolo Bonzini {
264917a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
26506e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
26516e790746SPaolo Bonzini 
2652283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2653283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2654283e2c2aSYuri Benditovich         return;
2655283e2c2aSYuri Benditovich     }
2656283e2c2aSYuri Benditovich 
26576e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
265817a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
26596e790746SPaolo Bonzini         q->tx_waiting = 1;
26606e790746SPaolo Bonzini         return;
26616e790746SPaolo Bonzini     }
26626e790746SPaolo Bonzini 
26636e790746SPaolo Bonzini     if (q->tx_waiting) {
26646e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 1);
2665bc72ad67SAlex Bligh         timer_del(q->tx_timer);
26666e790746SPaolo Bonzini         q->tx_waiting = 0;
2667fa5e56c2SGreg Kurz         if (virtio_net_flush_tx(q) == -EINVAL) {
2668fa5e56c2SGreg Kurz             return;
2669fa5e56c2SGreg Kurz         }
26706e790746SPaolo Bonzini     } else {
2671bc72ad67SAlex Bligh         timer_mod(q->tx_timer,
2672bc72ad67SAlex Bligh                        qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
26736e790746SPaolo Bonzini         q->tx_waiting = 1;
26746e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 0);
26756e790746SPaolo Bonzini     }
26766e790746SPaolo Bonzini }
26776e790746SPaolo Bonzini 
26786e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
26796e790746SPaolo Bonzini {
268017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
26816e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
26826e790746SPaolo Bonzini 
2683283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2684283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2685283e2c2aSYuri Benditovich         return;
2686283e2c2aSYuri Benditovich     }
2687283e2c2aSYuri Benditovich 
26886e790746SPaolo Bonzini     if (unlikely(q->tx_waiting)) {
26896e790746SPaolo Bonzini         return;
26906e790746SPaolo Bonzini     }
26916e790746SPaolo Bonzini     q->tx_waiting = 1;
26926e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
269317a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
26946e790746SPaolo Bonzini         return;
26956e790746SPaolo Bonzini     }
26966e790746SPaolo Bonzini     virtio_queue_set_notification(vq, 0);
26976e790746SPaolo Bonzini     qemu_bh_schedule(q->tx_bh);
26986e790746SPaolo Bonzini }
26996e790746SPaolo Bonzini 
27006e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque)
27016e790746SPaolo Bonzini {
27026e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
27036e790746SPaolo Bonzini     VirtIONet *n = q->n;
270417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2705e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2706e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2707e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2708e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2709e8bcf842SMichael S. Tsirkin         return;
2710e8bcf842SMichael S. Tsirkin     }
27116e790746SPaolo Bonzini 
27126e790746SPaolo Bonzini     q->tx_waiting = 0;
27136e790746SPaolo Bonzini 
27146e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
271517a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
27166e790746SPaolo Bonzini         return;
271717a0ca55SKONRAD Frederic     }
27186e790746SPaolo Bonzini 
27196e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
27206e790746SPaolo Bonzini     virtio_net_flush_tx(q);
27216e790746SPaolo Bonzini }
27226e790746SPaolo Bonzini 
27236e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque)
27246e790746SPaolo Bonzini {
27256e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
27266e790746SPaolo Bonzini     VirtIONet *n = q->n;
272717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
27286e790746SPaolo Bonzini     int32_t ret;
27296e790746SPaolo Bonzini 
2730e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2731e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2732e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2733e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2734e8bcf842SMichael S. Tsirkin         return;
2735e8bcf842SMichael S. Tsirkin     }
27366e790746SPaolo Bonzini 
27376e790746SPaolo Bonzini     q->tx_waiting = 0;
27386e790746SPaolo Bonzini 
27396e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
274017a0ca55SKONRAD Frederic     if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
27416e790746SPaolo Bonzini         return;
274217a0ca55SKONRAD Frederic     }
27436e790746SPaolo Bonzini 
27446e790746SPaolo Bonzini     ret = virtio_net_flush_tx(q);
2745fa5e56c2SGreg Kurz     if (ret == -EBUSY || ret == -EINVAL) {
2746fa5e56c2SGreg Kurz         return; /* Notification re-enable handled by tx_complete or device
2747fa5e56c2SGreg Kurz                  * broken */
27486e790746SPaolo Bonzini     }
27496e790746SPaolo Bonzini 
27506e790746SPaolo Bonzini     /* If we flush a full burst of packets, assume there are
27516e790746SPaolo Bonzini      * more coming and immediately reschedule */
27526e790746SPaolo Bonzini     if (ret >= n->tx_burst) {
27536e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
27546e790746SPaolo Bonzini         q->tx_waiting = 1;
27556e790746SPaolo Bonzini         return;
27566e790746SPaolo Bonzini     }
27576e790746SPaolo Bonzini 
27586e790746SPaolo Bonzini     /* If less than a full burst, re-enable notification and flush
27596e790746SPaolo Bonzini      * anything that may have come in while we weren't looking.  If
27606e790746SPaolo Bonzini      * we find something, assume the guest is still active and reschedule */
27616e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2762fa5e56c2SGreg Kurz     ret = virtio_net_flush_tx(q);
2763fa5e56c2SGreg Kurz     if (ret == -EINVAL) {
2764fa5e56c2SGreg Kurz         return;
2765fa5e56c2SGreg Kurz     } else if (ret > 0) {
27666e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
27676e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
27686e790746SPaolo Bonzini         q->tx_waiting = 1;
27696e790746SPaolo Bonzini     }
27706e790746SPaolo Bonzini }
27716e790746SPaolo Bonzini 
2772f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index)
2773f9d6dbf0SWen Congyang {
2774f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2775f9d6dbf0SWen Congyang 
27761c0fbfa3SMichael S. Tsirkin     n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size,
27771c0fbfa3SMichael S. Tsirkin                                            virtio_net_handle_rx);
27789b02e161SWei Wang 
2779f9d6dbf0SWen Congyang     if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
2780f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
27819b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
27829b02e161SWei Wang                              virtio_net_handle_tx_timer);
2783f9d6dbf0SWen Congyang         n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
2784f9d6dbf0SWen Congyang                                               virtio_net_tx_timer,
2785f9d6dbf0SWen Congyang                                               &n->vqs[index]);
2786f9d6dbf0SWen Congyang     } else {
2787f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
27889b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
27899b02e161SWei Wang                              virtio_net_handle_tx_bh);
2790f9d6dbf0SWen Congyang         n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]);
2791f9d6dbf0SWen Congyang     }
2792f9d6dbf0SWen Congyang 
2793f9d6dbf0SWen Congyang     n->vqs[index].tx_waiting = 0;
2794f9d6dbf0SWen Congyang     n->vqs[index].n = n;
2795f9d6dbf0SWen Congyang }
2796f9d6dbf0SWen Congyang 
2797f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index)
2798f9d6dbf0SWen Congyang {
2799f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2800f9d6dbf0SWen Congyang     VirtIONetQueue *q = &n->vqs[index];
2801f9d6dbf0SWen Congyang     NetClientState *nc = qemu_get_subqueue(n->nic, index);
2802f9d6dbf0SWen Congyang 
2803f9d6dbf0SWen Congyang     qemu_purge_queued_packets(nc);
2804f9d6dbf0SWen Congyang 
2805f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2);
2806f9d6dbf0SWen Congyang     if (q->tx_timer) {
2807f9d6dbf0SWen Congyang         timer_free(q->tx_timer);
2808f989c30cSYunjian Wang         q->tx_timer = NULL;
2809f9d6dbf0SWen Congyang     } else {
2810f9d6dbf0SWen Congyang         qemu_bh_delete(q->tx_bh);
2811f989c30cSYunjian Wang         q->tx_bh = NULL;
2812f9d6dbf0SWen Congyang     }
2813f989c30cSYunjian Wang     q->tx_waiting = 0;
2814f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2 + 1);
2815f9d6dbf0SWen Congyang }
2816f9d6dbf0SWen Congyang 
2817441537f1SJason Wang static void virtio_net_change_num_queue_pairs(VirtIONet *n, int new_max_queue_pairs)
2818f9d6dbf0SWen Congyang {
2819f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2820f9d6dbf0SWen Congyang     int old_num_queues = virtio_get_num_queues(vdev);
2821441537f1SJason Wang     int new_num_queues = new_max_queue_pairs * 2 + 1;
2822f9d6dbf0SWen Congyang     int i;
2823f9d6dbf0SWen Congyang 
2824f9d6dbf0SWen Congyang     assert(old_num_queues >= 3);
2825f9d6dbf0SWen Congyang     assert(old_num_queues % 2 == 1);
2826f9d6dbf0SWen Congyang 
2827f9d6dbf0SWen Congyang     if (old_num_queues == new_num_queues) {
2828f9d6dbf0SWen Congyang         return;
2829f9d6dbf0SWen Congyang     }
2830f9d6dbf0SWen Congyang 
2831f9d6dbf0SWen Congyang     /*
2832f9d6dbf0SWen Congyang      * We always need to remove and add ctrl vq if
2833f9d6dbf0SWen Congyang      * old_num_queues != new_num_queues. Remove ctrl_vq first,
283420f86a75SYuval Shaia      * and then we only enter one of the following two loops.
2835f9d6dbf0SWen Congyang      */
2836f9d6dbf0SWen Congyang     virtio_del_queue(vdev, old_num_queues - 1);
2837f9d6dbf0SWen Congyang 
2838f9d6dbf0SWen Congyang     for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) {
2839f9d6dbf0SWen Congyang         /* new_num_queues < old_num_queues */
2840f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i / 2);
2841f9d6dbf0SWen Congyang     }
2842f9d6dbf0SWen Congyang 
2843f9d6dbf0SWen Congyang     for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) {
2844f9d6dbf0SWen Congyang         /* new_num_queues > old_num_queues */
2845f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i / 2);
2846f9d6dbf0SWen Congyang     }
2847f9d6dbf0SWen Congyang 
2848f9d6dbf0SWen Congyang     /* add ctrl_vq last */
2849f9d6dbf0SWen Congyang     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
2850f9d6dbf0SWen Congyang }
2851f9d6dbf0SWen Congyang 
2852ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
28536e790746SPaolo Bonzini {
2854441537f1SJason Wang     int max = multiqueue ? n->max_queue_pairs : 1;
2855f9d6dbf0SWen Congyang 
28566e790746SPaolo Bonzini     n->multiqueue = multiqueue;
2857441537f1SJason Wang     virtio_net_change_num_queue_pairs(n, max);
28586e790746SPaolo Bonzini 
2859441537f1SJason Wang     virtio_net_set_queue_pairs(n);
28606e790746SPaolo Bonzini }
28616e790746SPaolo Bonzini 
2862982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id)
2863037dab2fSGreg Kurz {
2864982b78c5SDr. David Alan Gilbert     VirtIONet *n = opaque;
2865982b78c5SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2866037dab2fSGreg Kurz     int i, link_down;
2867037dab2fSGreg Kurz 
28689d8c6a25SDr. David Alan Gilbert     trace_virtio_net_post_load_device();
2869982b78c5SDr. David Alan Gilbert     virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs,
287095129d6fSCornelia Huck                                virtio_vdev_has_feature(vdev,
2871e22f0603SYuri Benditovich                                                        VIRTIO_F_VERSION_1),
2872e22f0603SYuri Benditovich                                virtio_vdev_has_feature(vdev,
2873e22f0603SYuri Benditovich                                                        VIRTIO_NET_F_HASH_REPORT));
28746e790746SPaolo Bonzini 
28756e790746SPaolo Bonzini     /* MAC_TABLE_ENTRIES may be different from the saved image */
2876982b78c5SDr. David Alan Gilbert     if (n->mac_table.in_use > MAC_TABLE_ENTRIES) {
28776e790746SPaolo Bonzini         n->mac_table.in_use = 0;
28786e790746SPaolo Bonzini     }
28796e790746SPaolo Bonzini 
2880982b78c5SDr. David Alan Gilbert     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
28816c666823SMichael S. Tsirkin         n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
28826c666823SMichael S. Tsirkin     }
28836c666823SMichael S. Tsirkin 
28847788c3f2SMikhail Sennikovsky     /*
28857788c3f2SMikhail Sennikovsky      * curr_guest_offloads will be later overwritten by the
28867788c3f2SMikhail Sennikovsky      * virtio_set_features_nocheck call done from the virtio_load.
28877788c3f2SMikhail Sennikovsky      * Here we make sure it is preserved and restored accordingly
28887788c3f2SMikhail Sennikovsky      * in the virtio_net_post_load_virtio callback.
28897788c3f2SMikhail Sennikovsky      */
28907788c3f2SMikhail Sennikovsky     n->saved_guest_offloads = n->curr_guest_offloads;
28916c666823SMichael S. Tsirkin 
2892441537f1SJason Wang     virtio_net_set_queue_pairs(n);
28936e790746SPaolo Bonzini 
28946e790746SPaolo Bonzini     /* Find the first multicast entry in the saved MAC filter */
28956e790746SPaolo Bonzini     for (i = 0; i < n->mac_table.in_use; i++) {
28966e790746SPaolo Bonzini         if (n->mac_table.macs[i * ETH_ALEN] & 1) {
28976e790746SPaolo Bonzini             break;
28986e790746SPaolo Bonzini         }
28996e790746SPaolo Bonzini     }
29006e790746SPaolo Bonzini     n->mac_table.first_multi = i;
29016e790746SPaolo Bonzini 
29026e790746SPaolo Bonzini     /* nc.link_down can't be migrated, so infer link_down according
29036e790746SPaolo Bonzini      * to link status bit in n->status */
29046e790746SPaolo Bonzini     link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
2905441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
29066e790746SPaolo Bonzini         qemu_get_subqueue(n->nic, i)->link_down = link_down;
29076e790746SPaolo Bonzini     }
29086e790746SPaolo Bonzini 
29096c666823SMichael S. Tsirkin     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
29106c666823SMichael S. Tsirkin         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
29119d8c6a25SDr. David Alan Gilbert         qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
29129d8c6a25SDr. David Alan Gilbert                                   QEMU_CLOCK_VIRTUAL,
29139d8c6a25SDr. David Alan Gilbert                                   virtio_net_announce_timer, n);
29149d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
29159d8c6a25SDr. David Alan Gilbert             timer_mod(n->announce_timer.tm,
29169d8c6a25SDr. David Alan Gilbert                       qemu_clock_get_ms(n->announce_timer.type));
29179d8c6a25SDr. David Alan Gilbert         } else {
2918944458b6SDr. David Alan Gilbert             qemu_announce_timer_del(&n->announce_timer, false);
29199d8c6a25SDr. David Alan Gilbert         }
29206c666823SMichael S. Tsirkin     }
29216c666823SMichael S. Tsirkin 
2922e41b7114SYuri Benditovich     if (n->rss_data.enabled) {
29230145c393SAndrew Melnychenko         n->rss_data.enabled_software_rss = n->rss_data.populate_hash;
29240145c393SAndrew Melnychenko         if (!n->rss_data.populate_hash) {
29250145c393SAndrew Melnychenko             if (!virtio_net_attach_epbf_rss(n)) {
29260145c393SAndrew Melnychenko                 if (get_vhost_net(qemu_get_queue(n->nic)->peer)) {
29270145c393SAndrew Melnychenko                     warn_report("Can't post-load eBPF RSS for vhost");
29280145c393SAndrew Melnychenko                 } else {
29290145c393SAndrew Melnychenko                     warn_report("Can't post-load eBPF RSS - "
29300145c393SAndrew Melnychenko                                 "fallback to software RSS");
29310145c393SAndrew Melnychenko                     n->rss_data.enabled_software_rss = true;
29320145c393SAndrew Melnychenko                 }
29330145c393SAndrew Melnychenko             }
29340145c393SAndrew Melnychenko         }
29350145c393SAndrew Melnychenko 
2936e41b7114SYuri Benditovich         trace_virtio_net_rss_enable(n->rss_data.hash_types,
2937e41b7114SYuri Benditovich                                     n->rss_data.indirections_len,
2938e41b7114SYuri Benditovich                                     sizeof(n->rss_data.key));
2939e41b7114SYuri Benditovich     } else {
2940e41b7114SYuri Benditovich         trace_virtio_net_rss_disable();
2941e41b7114SYuri Benditovich     }
29426e790746SPaolo Bonzini     return 0;
29436e790746SPaolo Bonzini }
29446e790746SPaolo Bonzini 
29457788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev)
29467788c3f2SMikhail Sennikovsky {
29477788c3f2SMikhail Sennikovsky     VirtIONet *n = VIRTIO_NET(vdev);
29487788c3f2SMikhail Sennikovsky     /*
29497788c3f2SMikhail Sennikovsky      * The actual needed state is now in saved_guest_offloads,
29507788c3f2SMikhail Sennikovsky      * see virtio_net_post_load_device for detail.
29517788c3f2SMikhail Sennikovsky      * Restore it back and apply the desired offloads.
29527788c3f2SMikhail Sennikovsky      */
29537788c3f2SMikhail Sennikovsky     n->curr_guest_offloads = n->saved_guest_offloads;
29547788c3f2SMikhail Sennikovsky     if (peer_has_vnet_hdr(n)) {
29557788c3f2SMikhail Sennikovsky         virtio_net_apply_guest_offloads(n);
29567788c3f2SMikhail Sennikovsky     }
29577788c3f2SMikhail Sennikovsky 
29587788c3f2SMikhail Sennikovsky     return 0;
29597788c3f2SMikhail Sennikovsky }
29607788c3f2SMikhail Sennikovsky 
2961982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */
2962982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = {
2963982b78c5SDr. David Alan Gilbert     .name = "virtio-net-queue-tx_waiting",
2964982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
2965982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(tx_waiting, VirtIONetQueue),
2966982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
2967982b78c5SDr. David Alan Gilbert    },
2968982b78c5SDr. David Alan Gilbert };
2969982b78c5SDr. David Alan Gilbert 
2970441537f1SJason Wang static bool max_queue_pairs_gt_1(void *opaque, int version_id)
2971982b78c5SDr. David Alan Gilbert {
2972441537f1SJason Wang     return VIRTIO_NET(opaque)->max_queue_pairs > 1;
2973982b78c5SDr. David Alan Gilbert }
2974982b78c5SDr. David Alan Gilbert 
2975982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id)
2976982b78c5SDr. David Alan Gilbert {
2977982b78c5SDr. David Alan Gilbert     return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque),
2978982b78c5SDr. David Alan Gilbert                                    VIRTIO_NET_F_CTRL_GUEST_OFFLOADS);
2979982b78c5SDr. David Alan Gilbert }
2980982b78c5SDr. David Alan Gilbert 
2981982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id)
2982982b78c5SDr. David Alan Gilbert {
2983982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES;
2984982b78c5SDr. David Alan Gilbert }
2985982b78c5SDr. David Alan Gilbert 
/* Field test: the exact complement of mac_table_fits(). */
static bool mac_table_doesnt_fit(void *opaque, int version_id)
{
    if (mac_table_fits(opaque, version_id)) {
        return false;
    }
    return true;
}
2990982b78c5SDr. David Alan Gilbert 
2991982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods
2992982b78c5SDr. David Alan Gilbert  * although only some fields are used by each.
2993982b78c5SDr. David Alan Gilbert  */
2994982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp {
2995982b78c5SDr. David Alan Gilbert     VirtIONet      *parent;
2996982b78c5SDr. David Alan Gilbert     VirtIONetQueue *vqs_1;
2997441537f1SJason Wang     uint16_t        curr_queue_pairs_1;
2998982b78c5SDr. David Alan Gilbert     uint8_t         has_ufo;
2999982b78c5SDr. David Alan Gilbert     uint32_t        has_vnet_hdr;
3000982b78c5SDr. David Alan Gilbert };
3001982b78c5SDr. David Alan Gilbert 
3002982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than
3003441537f1SJason Wang  * the 1st entry in the queue_pairs and only if there's more than one
3004982b78c5SDr. David Alan Gilbert  * entry.  We use the tmp mechanism to calculate a temporary
3005982b78c5SDr. David Alan Gilbert  * pointer and count and also validate the count.
3006982b78c5SDr. David Alan Gilbert  */
3007982b78c5SDr. David Alan Gilbert 
300844b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque)
3009982b78c5SDr. David Alan Gilbert {
3010982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3011982b78c5SDr. David Alan Gilbert 
3012982b78c5SDr. David Alan Gilbert     tmp->vqs_1 = tmp->parent->vqs + 1;
3013441537f1SJason Wang     tmp->curr_queue_pairs_1 = tmp->parent->curr_queue_pairs - 1;
3014441537f1SJason Wang     if (tmp->parent->curr_queue_pairs == 0) {
3015441537f1SJason Wang         tmp->curr_queue_pairs_1 = 0;
3016982b78c5SDr. David Alan Gilbert     }
301744b1ff31SDr. David Alan Gilbert 
301844b1ff31SDr. David Alan Gilbert     return 0;
3019982b78c5SDr. David Alan Gilbert }
3020982b78c5SDr. David Alan Gilbert 
3021982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque)
3022982b78c5SDr. David Alan Gilbert {
3023982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3024982b78c5SDr. David Alan Gilbert 
3025982b78c5SDr. David Alan Gilbert     /* Reuse the pointer setup from save */
3026982b78c5SDr. David Alan Gilbert     virtio_net_tx_waiting_pre_save(opaque);
3027982b78c5SDr. David Alan Gilbert 
3028441537f1SJason Wang     if (tmp->parent->curr_queue_pairs > tmp->parent->max_queue_pairs) {
3029441537f1SJason Wang         error_report("virtio-net: curr_queue_pairs %x > max_queue_pairs %x",
3030441537f1SJason Wang             tmp->parent->curr_queue_pairs, tmp->parent->max_queue_pairs);
3031982b78c5SDr. David Alan Gilbert 
3032982b78c5SDr. David Alan Gilbert         return -EINVAL;
3033982b78c5SDr. David Alan Gilbert     }
3034982b78c5SDr. David Alan Gilbert 
3035982b78c5SDr. David Alan Gilbert     return 0; /* all good */
3036982b78c5SDr. David Alan Gilbert }
3037982b78c5SDr. David Alan Gilbert 
3038982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = {
3039982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-tx_waiting",
3040982b78c5SDr. David Alan Gilbert     .pre_load  = virtio_net_tx_waiting_pre_load,
3041982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_tx_waiting_pre_save,
3042982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3043982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp,
3044441537f1SJason Wang                                      curr_queue_pairs_1,
3045982b78c5SDr. David Alan Gilbert                                      vmstate_virtio_net_queue_tx_waiting,
3046982b78c5SDr. David Alan Gilbert                                      struct VirtIONetQueue),
3047982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3048982b78c5SDr. David Alan Gilbert     },
3049982b78c5SDr. David Alan Gilbert };
3050982b78c5SDr. David Alan Gilbert 
3051982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the
3052982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
3053982b78c5SDr. David Alan Gilbert  */
3054982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id)
3055982b78c5SDr. David Alan Gilbert {
3056982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3057982b78c5SDr. David Alan Gilbert 
3058982b78c5SDr. David Alan Gilbert     if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) {
3059982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires TUN_F_UFO support");
3060982b78c5SDr. David Alan Gilbert         return -EINVAL;
3061982b78c5SDr. David Alan Gilbert     }
3062982b78c5SDr. David Alan Gilbert 
3063982b78c5SDr. David Alan Gilbert     return 0;
3064982b78c5SDr. David Alan Gilbert }
3065982b78c5SDr. David Alan Gilbert 
306644b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque)
3067982b78c5SDr. David Alan Gilbert {
3068982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3069982b78c5SDr. David Alan Gilbert 
3070982b78c5SDr. David Alan Gilbert     tmp->has_ufo = tmp->parent->has_ufo;
307144b1ff31SDr. David Alan Gilbert 
307244b1ff31SDr. David Alan Gilbert     return 0;
3073982b78c5SDr. David Alan Gilbert }
3074982b78c5SDr. David Alan Gilbert 
3075982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = {
3076982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-ufo",
3077982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_ufo_post_load,
3078982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_ufo_pre_save,
3079982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3080982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp),
3081982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3082982b78c5SDr. David Alan Gilbert     },
3083982b78c5SDr. David Alan Gilbert };
3084982b78c5SDr. David Alan Gilbert 
3085982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the
3086982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
3087982b78c5SDr. David Alan Gilbert  */
3088982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id)
3089982b78c5SDr. David Alan Gilbert {
3090982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3091982b78c5SDr. David Alan Gilbert 
3092982b78c5SDr. David Alan Gilbert     if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) {
3093982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires vnet_hdr=on");
3094982b78c5SDr. David Alan Gilbert         return -EINVAL;
3095982b78c5SDr. David Alan Gilbert     }
3096982b78c5SDr. David Alan Gilbert 
3097982b78c5SDr. David Alan Gilbert     return 0;
3098982b78c5SDr. David Alan Gilbert }
3099982b78c5SDr. David Alan Gilbert 
310044b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque)
3101982b78c5SDr. David Alan Gilbert {
3102982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3103982b78c5SDr. David Alan Gilbert 
3104982b78c5SDr. David Alan Gilbert     tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr;
310544b1ff31SDr. David Alan Gilbert 
310644b1ff31SDr. David Alan Gilbert     return 0;
3107982b78c5SDr. David Alan Gilbert }
3108982b78c5SDr. David Alan Gilbert 
3109982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = {
3110982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-vnet",
3111982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_vnet_post_load,
3112982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_vnet_pre_save,
3113982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3114982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp),
3115982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3116982b78c5SDr. David Alan Gilbert     },
3117982b78c5SDr. David Alan Gilbert };
3118982b78c5SDr. David Alan Gilbert 
3119e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque)
3120e41b7114SYuri Benditovich {
3121e41b7114SYuri Benditovich     return VIRTIO_NET(opaque)->rss_data.enabled;
3122e41b7114SYuri Benditovich }
3123e41b7114SYuri Benditovich 
3124e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = {
3125e41b7114SYuri Benditovich     .name      = "virtio-net-device/rss",
3126e41b7114SYuri Benditovich     .version_id = 1,
3127e41b7114SYuri Benditovich     .minimum_version_id = 1,
3128e41b7114SYuri Benditovich     .needed = virtio_net_rss_needed,
3129e41b7114SYuri Benditovich     .fields = (VMStateField[]) {
3130e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.enabled, VirtIONet),
3131e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.redirect, VirtIONet),
3132e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.populate_hash, VirtIONet),
3133e41b7114SYuri Benditovich         VMSTATE_UINT32(rss_data.hash_types, VirtIONet),
3134e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.indirections_len, VirtIONet),
3135e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.default_queue, VirtIONet),
3136e41b7114SYuri Benditovich         VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet,
3137e41b7114SYuri Benditovich                             VIRTIO_NET_RSS_MAX_KEY_SIZE),
3138e41b7114SYuri Benditovich         VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet,
3139e41b7114SYuri Benditovich                                     rss_data.indirections_len, 0,
3140e41b7114SYuri Benditovich                                     vmstate_info_uint16, uint16_t),
3141e41b7114SYuri Benditovich         VMSTATE_END_OF_LIST()
3142e41b7114SYuri Benditovich     },
3143e41b7114SYuri Benditovich };
3144e41b7114SYuri Benditovich 
3145982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = {
3146982b78c5SDr. David Alan Gilbert     .name = "virtio-net-device",
3147982b78c5SDr. David Alan Gilbert     .version_id = VIRTIO_NET_VM_VERSION,
3148982b78c5SDr. David Alan Gilbert     .minimum_version_id = VIRTIO_NET_VM_VERSION,
3149982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_post_load_device,
3150982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
3151982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN),
3152982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_POINTER(vqs, VirtIONet,
3153982b78c5SDr. David Alan Gilbert                                vmstate_virtio_net_queue_tx_waiting,
3154982b78c5SDr. David Alan Gilbert                                VirtIONetQueue),
3155982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet),
3156982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16(status, VirtIONet),
3157982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(promisc, VirtIONet),
3158982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(allmulti, VirtIONet),
3159982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mac_table.in_use, VirtIONet),
3160982b78c5SDr. David Alan Gilbert 
3161982b78c5SDr. David Alan Gilbert         /* Guarded pair: If it fits we load it, else we throw it away
3162982b78c5SDr. David Alan Gilbert          * - can happen if source has a larger MAC table.; post-load
3163982b78c5SDr. David Alan Gilbert          *  sets flags in this case.
3164982b78c5SDr. David Alan Gilbert          */
3165982b78c5SDr. David Alan Gilbert         VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet,
3166982b78c5SDr. David Alan Gilbert                                 0, mac_table_fits, mac_table.in_use,
3167982b78c5SDr. David Alan Gilbert                                  ETH_ALEN),
3168982b78c5SDr. David Alan Gilbert         VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0,
3169982b78c5SDr. David Alan Gilbert                                      mac_table.in_use, ETH_ALEN),
3170982b78c5SDr. David Alan Gilbert 
3171982b78c5SDr. David Alan Gilbert         /* Note: This is an array of uint32's that's always been saved as a
3172982b78c5SDr. David Alan Gilbert          * buffer; hold onto your endiannesses; it's actually used as a bitmap
3173982b78c5SDr. David Alan Gilbert          * but based on the uint.
3174982b78c5SDr. David Alan Gilbert          */
3175982b78c5SDr. David Alan Gilbert         VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3),
3176982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3177982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_vnet),
3178982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet),
3179982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet),
3180982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(alluni, VirtIONet),
3181982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nomulti, VirtIONet),
3182982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nouni, VirtIONet),
3183982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nobcast, VirtIONet),
3184982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3185982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_ufo),
3186441537f1SJason Wang         VMSTATE_SINGLE_TEST(max_queue_pairs, VirtIONet, max_queue_pairs_gt_1, 0,
3187982b78c5SDr. David Alan Gilbert                             vmstate_info_uint16_equal, uint16_t),
3188441537f1SJason Wang         VMSTATE_UINT16_TEST(curr_queue_pairs, VirtIONet, max_queue_pairs_gt_1),
3189982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3190982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_tx_waiting),
3191982b78c5SDr. David Alan Gilbert         VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet,
3192982b78c5SDr. David Alan Gilbert                             has_ctrl_guest_offloads),
3193982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3194982b78c5SDr. David Alan Gilbert    },
3195e41b7114SYuri Benditovich     .subsections = (const VMStateDescription * []) {
3196e41b7114SYuri Benditovich         &vmstate_virtio_net_rss,
3197e41b7114SYuri Benditovich         NULL
3198e41b7114SYuri Benditovich     }
3199982b78c5SDr. David Alan Gilbert };
3200982b78c5SDr. David Alan Gilbert 
32016e790746SPaolo Bonzini static NetClientInfo net_virtio_info = {
3202f394b2e2SEric Blake     .type = NET_CLIENT_DRIVER_NIC,
32036e790746SPaolo Bonzini     .size = sizeof(NICState),
32046e790746SPaolo Bonzini     .can_receive = virtio_net_can_receive,
32056e790746SPaolo Bonzini     .receive = virtio_net_receive,
32066e790746SPaolo Bonzini     .link_status_changed = virtio_net_set_link_status,
3207b1be4280SAmos Kong     .query_rx_filter = virtio_net_query_rxfilter,
3208b2c929f0SDr. David Alan Gilbert     .announce = virtio_net_announce,
32096e790746SPaolo Bonzini };
32106e790746SPaolo Bonzini 
32116e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
32126e790746SPaolo Bonzini {
321317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
321468b0a639SSi-Wei Liu     NetClientState *nc;
32156e790746SPaolo Bonzini     assert(n->vhost_started);
321668b0a639SSi-Wei Liu     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ) && idx == 2) {
321768b0a639SSi-Wei Liu         /* Must guard against invalid features and bogus queue index
321868b0a639SSi-Wei Liu          * from being set by malicious guest, or penetrated through
321968b0a639SSi-Wei Liu          * buggy migration stream.
322068b0a639SSi-Wei Liu          */
322168b0a639SSi-Wei Liu         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
322268b0a639SSi-Wei Liu             qemu_log_mask(LOG_GUEST_ERROR,
322368b0a639SSi-Wei Liu                           "%s: bogus vq index ignored\n", __func__);
322468b0a639SSi-Wei Liu             return false;
322568b0a639SSi-Wei Liu         }
322668b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, n->max_queue_pairs);
322768b0a639SSi-Wei Liu     } else {
322868b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, vq2q(idx));
322968b0a639SSi-Wei Liu     }
3230ed8b4afeSNikolay Nikolaev     return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx);
32316e790746SPaolo Bonzini }
32326e790746SPaolo Bonzini 
32336e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
32346e790746SPaolo Bonzini                                            bool mask)
32356e790746SPaolo Bonzini {
323617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
323768b0a639SSi-Wei Liu     NetClientState *nc;
32386e790746SPaolo Bonzini     assert(n->vhost_started);
323968b0a639SSi-Wei Liu     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ) && idx == 2) {
324068b0a639SSi-Wei Liu         /* Must guard against invalid features and bogus queue index
324168b0a639SSi-Wei Liu          * from being set by malicious guest, or penetrated through
324268b0a639SSi-Wei Liu          * buggy migration stream.
324368b0a639SSi-Wei Liu          */
324468b0a639SSi-Wei Liu         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
324568b0a639SSi-Wei Liu             qemu_log_mask(LOG_GUEST_ERROR,
324668b0a639SSi-Wei Liu                           "%s: bogus vq index ignored\n", __func__);
324768b0a639SSi-Wei Liu             return;
324868b0a639SSi-Wei Liu         }
324968b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, n->max_queue_pairs);
325068b0a639SSi-Wei Liu     } else {
325168b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, vq2q(idx));
325268b0a639SSi-Wei Liu     }
3253a882b571SMichael S. Tsirkin     vhost_net_virtqueue_mask(get_vhost_net(nc->peer),
3254a882b571SMichael S. Tsirkin                              vdev, idx, mask);
32556e790746SPaolo Bonzini }
32566e790746SPaolo Bonzini 
3257019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features)
32586e790746SPaolo Bonzini {
32590cd09c3aSCornelia Huck     virtio_add_feature(&host_features, VIRTIO_NET_F_MAC);
3260a93e599dSMaxime Coquelin 
3261d74c30c8SDaniil Tatianin     n->config_size = virtio_get_config_size(&cfg_size_params, host_features);
326217ec5a86SKONRAD Frederic }
32636e790746SPaolo Bonzini 
32648a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
32658a253ec2SKONRAD Frederic                                    const char *type)
32668a253ec2SKONRAD Frederic {
32678a253ec2SKONRAD Frederic     /*
32688a253ec2SKONRAD Frederic      * The name can be NULL, the netclient name will be type.x.
32698a253ec2SKONRAD Frederic      */
32708a253ec2SKONRAD Frederic     assert(type != NULL);
32718a253ec2SKONRAD Frederic 
32728a253ec2SKONRAD Frederic     g_free(n->netclient_name);
32738a253ec2SKONRAD Frederic     g_free(n->netclient_type);
32748a253ec2SKONRAD Frederic     n->netclient_name = g_strdup(name);
32758a253ec2SKONRAD Frederic     n->netclient_type = g_strdup(type);
32768a253ec2SKONRAD Frederic }
32778a253ec2SKONRAD Frederic 
32780e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev)
32799711cd0dSJens Freimann {
32809711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
32819711cd0dSJens Freimann     PCIDevice *pci_dev;
32829711cd0dSJens Freimann     Error *err = NULL;
32839711cd0dSJens Freimann 
32840e9a65c5SJuan Quintela     hotplug_ctrl = qdev_get_hotplug_handler(dev);
32859711cd0dSJens Freimann     if (hotplug_ctrl) {
32860e9a65c5SJuan Quintela         pci_dev = PCI_DEVICE(dev);
32879711cd0dSJens Freimann         pci_dev->partially_hotplugged = true;
32880e9a65c5SJuan Quintela         hotplug_handler_unplug_request(hotplug_ctrl, dev, &err);
32899711cd0dSJens Freimann         if (err) {
32909711cd0dSJens Freimann             error_report_err(err);
32919711cd0dSJens Freimann             return false;
32929711cd0dSJens Freimann         }
32939711cd0dSJens Freimann     } else {
32949711cd0dSJens Freimann         return false;
32959711cd0dSJens Freimann     }
32969711cd0dSJens Freimann     return true;
32979711cd0dSJens Freimann }
32989711cd0dSJens Freimann 
32990e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev,
33000e9a65c5SJuan Quintela                                     Error **errp)
33019711cd0dSJens Freimann {
33025a0948d3SMarkus Armbruster     Error *err = NULL;
33039711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
33040e9a65c5SJuan Quintela     PCIDevice *pdev = PCI_DEVICE(dev);
330578274682SJuan Quintela     BusState *primary_bus;
33069711cd0dSJens Freimann 
33079711cd0dSJens Freimann     if (!pdev->partially_hotplugged) {
33089711cd0dSJens Freimann         return true;
33099711cd0dSJens Freimann     }
33100e9a65c5SJuan Quintela     primary_bus = dev->parent_bus;
331178274682SJuan Quintela     if (!primary_bus) {
3312150ab54aSJens Freimann         error_setg(errp, "virtio_net: couldn't find primary bus");
33135a0948d3SMarkus Armbruster         return false;
33149711cd0dSJens Freimann     }
33150e9a65c5SJuan Quintela     qdev_set_parent_bus(dev, primary_bus, &error_abort);
3316e2bde83eSJuan Quintela     qatomic_set(&n->failover_primary_hidden, false);
33170e9a65c5SJuan Quintela     hotplug_ctrl = qdev_get_hotplug_handler(dev);
33189711cd0dSJens Freimann     if (hotplug_ctrl) {
33190e9a65c5SJuan Quintela         hotplug_handler_pre_plug(hotplug_ctrl, dev, &err);
33205a0948d3SMarkus Armbruster         if (err) {
33215a0948d3SMarkus Armbruster             goto out;
33225a0948d3SMarkus Armbruster         }
33230e9a65c5SJuan Quintela         hotplug_handler_plug(hotplug_ctrl, dev, &err);
33249711cd0dSJens Freimann     }
3325109c20eaSLaurent Vivier     pdev->partially_hotplugged = false;
3326150ab54aSJens Freimann 
3327150ab54aSJens Freimann out:
33285a0948d3SMarkus Armbruster     error_propagate(errp, err);
33295a0948d3SMarkus Armbruster     return !err;
33309711cd0dSJens Freimann }
33319711cd0dSJens Freimann 
333207a5d816SJuan Quintela static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationState *s)
33339711cd0dSJens Freimann {
33349711cd0dSJens Freimann     bool should_be_hidden;
33359711cd0dSJens Freimann     Error *err = NULL;
333607a5d816SJuan Quintela     DeviceState *dev = failover_find_primary_device(n);
333707a5d816SJuan Quintela 
333807a5d816SJuan Quintela     if (!dev) {
333907a5d816SJuan Quintela         return;
334007a5d816SJuan Quintela     }
33419711cd0dSJens Freimann 
3342e2bde83eSJuan Quintela     should_be_hidden = qatomic_read(&n->failover_primary_hidden);
33439711cd0dSJens Freimann 
33444dbac1aeSMarkus Armbruster     if (migration_in_setup(s) && !should_be_hidden) {
334507a5d816SJuan Quintela         if (failover_unplug_primary(n, dev)) {
334607a5d816SJuan Quintela             vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev);
334707a5d816SJuan Quintela             qapi_event_send_unplug_primary(dev->id);
3348e2bde83eSJuan Quintela             qatomic_set(&n->failover_primary_hidden, true);
33499711cd0dSJens Freimann         } else {
33509711cd0dSJens Freimann             warn_report("couldn't unplug primary device");
33519711cd0dSJens Freimann         }
33529711cd0dSJens Freimann     } else if (migration_has_failed(s)) {
3353150ab54aSJens Freimann         /* We already unplugged the device let's plug it back */
335407a5d816SJuan Quintela         if (!failover_replug_primary(n, dev, &err)) {
33559711cd0dSJens Freimann             if (err) {
33569711cd0dSJens Freimann                 error_report_err(err);
33579711cd0dSJens Freimann             }
33589711cd0dSJens Freimann         }
33599711cd0dSJens Freimann     }
33609711cd0dSJens Freimann }
33619711cd0dSJens Freimann 
33629711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data)
33639711cd0dSJens Freimann {
33649711cd0dSJens Freimann     MigrationState *s = data;
33659711cd0dSJens Freimann     VirtIONet *n = container_of(notifier, VirtIONet, migration_state);
33669711cd0dSJens Freimann     virtio_net_handle_migration_primary(n, s);
33679711cd0dSJens Freimann }
33689711cd0dSJens Freimann 
3369b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener,
3370f3558b1bSKevin Wolf                                          const QDict *device_opts,
3371f3558b1bSKevin Wolf                                          bool from_json,
3372f3558b1bSKevin Wolf                                          Error **errp)
33739711cd0dSJens Freimann {
33749711cd0dSJens Freimann     VirtIONet *n = container_of(listener, VirtIONet, primary_listener);
33754f0303aeSJuan Quintela     const char *standby_id;
33769711cd0dSJens Freimann 
33774d0e59acSJens Freimann     if (!device_opts) {
337889631fedSJuan Quintela         return false;
33794d0e59acSJens Freimann     }
3380bcfc906bSLaurent Vivier 
3381bcfc906bSLaurent Vivier     if (!qdict_haskey(device_opts, "failover_pair_id")) {
3382bcfc906bSLaurent Vivier         return false;
3383bcfc906bSLaurent Vivier     }
3384bcfc906bSLaurent Vivier 
3385bcfc906bSLaurent Vivier     if (!qdict_haskey(device_opts, "id")) {
3386bcfc906bSLaurent Vivier         error_setg(errp, "Device with failover_pair_id needs to have id");
3387bcfc906bSLaurent Vivier         return false;
3388bcfc906bSLaurent Vivier     }
3389bcfc906bSLaurent Vivier 
3390bcfc906bSLaurent Vivier     standby_id = qdict_get_str(device_opts, "failover_pair_id");
339189631fedSJuan Quintela     if (g_strcmp0(standby_id, n->netclient_name) != 0) {
339289631fedSJuan Quintela         return false;
33939711cd0dSJens Freimann     }
33949711cd0dSJens Freimann 
33957fe7791eSLaurent Vivier     /*
33967fe7791eSLaurent Vivier      * The hide helper can be called several times for a given device.
33977fe7791eSLaurent Vivier      * Check there is only one primary for a virtio-net device but
33987fe7791eSLaurent Vivier      * don't duplicate the qdict several times if it's called for the same
33997fe7791eSLaurent Vivier      * device.
34007fe7791eSLaurent Vivier      */
3401259a10dbSKevin Wolf     if (n->primary_opts) {
34027fe7791eSLaurent Vivier         const char *old, *new;
34037fe7791eSLaurent Vivier         /* devices with failover_pair_id always have an id */
34047fe7791eSLaurent Vivier         old = qdict_get_str(n->primary_opts, "id");
34057fe7791eSLaurent Vivier         new = qdict_get_str(device_opts, "id");
34067fe7791eSLaurent Vivier         if (strcmp(old, new) != 0) {
34077fe7791eSLaurent Vivier             error_setg(errp, "Cannot attach more than one primary device to "
34087fe7791eSLaurent Vivier                        "'%s': '%s' and '%s'", n->netclient_name, old, new);
3409259a10dbSKevin Wolf             return false;
3410259a10dbSKevin Wolf         }
34117fe7791eSLaurent Vivier     } else {
3412f3558b1bSKevin Wolf         n->primary_opts = qdict_clone_shallow(device_opts);
3413f3558b1bSKevin Wolf         n->primary_opts_from_json = from_json;
34147fe7791eSLaurent Vivier     }
3415259a10dbSKevin Wolf 
3416e2bde83eSJuan Quintela     /* failover_primary_hidden is set during feature negotiation */
34173abad4a2SJuan Quintela     return qatomic_read(&n->failover_primary_hidden);
34189711cd0dSJens Freimann }
34199711cd0dSJens Freimann 
3420e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp)
342117ec5a86SKONRAD Frederic {
3422e6f746b3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3423284a32f0SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3424284a32f0SAndreas Färber     NetClientState *nc;
34251773d9eeSKONRAD Frederic     int i;
342617ec5a86SKONRAD Frederic 
3427a93e599dSMaxime Coquelin     if (n->net_conf.mtu) {
3428127833eeSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_MTU);
3429a93e599dSMaxime Coquelin     }
3430a93e599dSMaxime Coquelin 
34319473939eSJason Baron     if (n->net_conf.duplex_str) {
34329473939eSJason Baron         if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) {
34339473939eSJason Baron             n->net_conf.duplex = DUPLEX_HALF;
34349473939eSJason Baron         } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) {
34359473939eSJason Baron             n->net_conf.duplex = DUPLEX_FULL;
34369473939eSJason Baron         } else {
34379473939eSJason Baron             error_setg(errp, "'duplex' must be 'half' or 'full'");
3438843c4cfcSMarkus Armbruster             return;
34399473939eSJason Baron         }
34409473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
34419473939eSJason Baron     } else {
34429473939eSJason Baron         n->net_conf.duplex = DUPLEX_UNKNOWN;
34439473939eSJason Baron     }
34449473939eSJason Baron 
34459473939eSJason Baron     if (n->net_conf.speed < SPEED_UNKNOWN) {
34469473939eSJason Baron         error_setg(errp, "'speed' must be between 0 and INT_MAX");
3447843c4cfcSMarkus Armbruster         return;
3448843c4cfcSMarkus Armbruster     }
3449843c4cfcSMarkus Armbruster     if (n->net_conf.speed >= 0) {
34509473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
34519473939eSJason Baron     }
34529473939eSJason Baron 
34539711cd0dSJens Freimann     if (n->failover) {
3454b91ad981SJuan Quintela         n->primary_listener.hide_device = failover_hide_primary_device;
3455e2bde83eSJuan Quintela         qatomic_set(&n->failover_primary_hidden, true);
34569711cd0dSJens Freimann         device_listener_register(&n->primary_listener);
34579711cd0dSJens Freimann         n->migration_state.notify = virtio_net_migration_state_notifier;
34589711cd0dSJens Freimann         add_migration_state_change_notifier(&n->migration_state);
34599711cd0dSJens Freimann         n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY);
34609711cd0dSJens Freimann     }
34619711cd0dSJens Freimann 
3462da3e8a23SShannon Zhao     virtio_net_set_config_size(n, n->host_features);
34633857cd5cSJonah Palmer     virtio_init(vdev, VIRTIO_ID_NET, n->config_size);
346417ec5a86SKONRAD Frederic 
34651c0fbfa3SMichael S. Tsirkin     /*
34661c0fbfa3SMichael S. Tsirkin      * We set a lower limit on RX queue size to what it always was.
34671c0fbfa3SMichael S. Tsirkin      * Guests that want a smaller ring can always resize it without
34681c0fbfa3SMichael S. Tsirkin      * help from us (using virtio 1 and up).
34691c0fbfa3SMichael S. Tsirkin      */
34701c0fbfa3SMichael S. Tsirkin     if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE ||
34711c0fbfa3SMichael S. Tsirkin         n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE ||
34725f997fd1SMichal Privoznik         !is_power_of_2(n->net_conf.rx_queue_size)) {
34731c0fbfa3SMichael S. Tsirkin         error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), "
34741c0fbfa3SMichael S. Tsirkin                    "must be a power of 2 between %d and %d.",
34751c0fbfa3SMichael S. Tsirkin                    n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE,
34761c0fbfa3SMichael S. Tsirkin                    VIRTQUEUE_MAX_SIZE);
34771c0fbfa3SMichael S. Tsirkin         virtio_cleanup(vdev);
34781c0fbfa3SMichael S. Tsirkin         return;
34791c0fbfa3SMichael S. Tsirkin     }
34801c0fbfa3SMichael S. Tsirkin 
34819b02e161SWei Wang     if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE ||
34829b02e161SWei Wang         n->net_conf.tx_queue_size > VIRTQUEUE_MAX_SIZE ||
34839b02e161SWei Wang         !is_power_of_2(n->net_conf.tx_queue_size)) {
34849b02e161SWei Wang         error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), "
34859b02e161SWei Wang                    "must be a power of 2 between %d and %d",
34869b02e161SWei Wang                    n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE,
34879b02e161SWei Wang                    VIRTQUEUE_MAX_SIZE);
34889b02e161SWei Wang         virtio_cleanup(vdev);
34899b02e161SWei Wang         return;
34909b02e161SWei Wang     }
34919b02e161SWei Wang 
349222288fe5SJason Wang     n->max_ncs = MAX(n->nic_conf.peers.queues, 1);
349322288fe5SJason Wang 
349422288fe5SJason Wang     /*
349522288fe5SJason Wang      * Figure out the datapath queue pairs since the backend could
349622288fe5SJason Wang      * provide control queue via peers as well.
349722288fe5SJason Wang      */
349822288fe5SJason Wang     if (n->nic_conf.peers.queues) {
349922288fe5SJason Wang         for (i = 0; i < n->max_ncs; i++) {
350022288fe5SJason Wang             if (n->nic_conf.peers.ncs[i]->is_datapath) {
350122288fe5SJason Wang                 ++n->max_queue_pairs;
350222288fe5SJason Wang             }
350322288fe5SJason Wang         }
350422288fe5SJason Wang     }
350522288fe5SJason Wang     n->max_queue_pairs = MAX(n->max_queue_pairs, 1);
350622288fe5SJason Wang 
3507441537f1SJason Wang     if (n->max_queue_pairs * 2 + 1 > VIRTIO_QUEUE_MAX) {
350822288fe5SJason Wang         error_setg(errp, "Invalid number of queue pairs (= %" PRIu32 "), "
3509631b22eaSStefan Weil                    "must be a positive integer less than %d.",
3510441537f1SJason Wang                    n->max_queue_pairs, (VIRTIO_QUEUE_MAX - 1) / 2);
35117e0e736eSJason Wang         virtio_cleanup(vdev);
35127e0e736eSJason Wang         return;
35137e0e736eSJason Wang     }
3514b21e2380SMarkus Armbruster     n->vqs = g_new0(VirtIONetQueue, n->max_queue_pairs);
3515441537f1SJason Wang     n->curr_queue_pairs = 1;
35161773d9eeSKONRAD Frederic     n->tx_timeout = n->net_conf.txtimer;
35176e790746SPaolo Bonzini 
35181773d9eeSKONRAD Frederic     if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
35191773d9eeSKONRAD Frederic                        && strcmp(n->net_conf.tx, "bh")) {
35200765691eSMarkus Armbruster         warn_report("virtio-net: "
35216e790746SPaolo Bonzini                     "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
35221773d9eeSKONRAD Frederic                     n->net_conf.tx);
35230765691eSMarkus Armbruster         error_printf("Defaulting to \"bh\"");
35246e790746SPaolo Bonzini     }
35256e790746SPaolo Bonzini 
35262eef278bSMichael S. Tsirkin     n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n),
35272eef278bSMichael S. Tsirkin                                     n->net_conf.tx_queue_size);
35289b02e161SWei Wang 
3529441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
3530f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i);
3531da51a335SJason Wang     }
3532da51a335SJason Wang 
353317a0ca55SKONRAD Frederic     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
35341773d9eeSKONRAD Frederic     qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
35351773d9eeSKONRAD Frederic     memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
35366e790746SPaolo Bonzini     n->status = VIRTIO_NET_S_LINK_UP;
35379d8c6a25SDr. David Alan Gilbert     qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
35389d8c6a25SDr. David Alan Gilbert                               QEMU_CLOCK_VIRTUAL,
3539f57fcf70SJason Wang                               virtio_net_announce_timer, n);
3540b2c929f0SDr. David Alan Gilbert     n->announce_timer.round = 0;
35416e790746SPaolo Bonzini 
35428a253ec2SKONRAD Frederic     if (n->netclient_type) {
35438a253ec2SKONRAD Frederic         /*
35448a253ec2SKONRAD Frederic          * Happen when virtio_net_set_netclient_name has been called.
35458a253ec2SKONRAD Frederic          */
35468a253ec2SKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
35478a253ec2SKONRAD Frederic                               n->netclient_type, n->netclient_name, n);
35488a253ec2SKONRAD Frederic     } else {
35491773d9eeSKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
3550284a32f0SAndreas Färber                               object_get_typename(OBJECT(dev)), dev->id, n);
35518a253ec2SKONRAD Frederic     }
35528a253ec2SKONRAD Frederic 
3553441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
3554d4c62930SBin Meng         n->nic->ncs[i].do_not_pad = true;
3555d4c62930SBin Meng     }
3556d4c62930SBin Meng 
35576e790746SPaolo Bonzini     peer_test_vnet_hdr(n);
35586e790746SPaolo Bonzini     if (peer_has_vnet_hdr(n)) {
3559441537f1SJason Wang         for (i = 0; i < n->max_queue_pairs; i++) {
3560d6085e3aSStefan Hajnoczi             qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
35616e790746SPaolo Bonzini         }
35626e790746SPaolo Bonzini         n->host_hdr_len = sizeof(struct virtio_net_hdr);
35636e790746SPaolo Bonzini     } else {
35646e790746SPaolo Bonzini         n->host_hdr_len = 0;
35656e790746SPaolo Bonzini     }
35666e790746SPaolo Bonzini 
35671773d9eeSKONRAD Frederic     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
35686e790746SPaolo Bonzini 
35696e790746SPaolo Bonzini     n->vqs[0].tx_waiting = 0;
35701773d9eeSKONRAD Frederic     n->tx_burst = n->net_conf.txburst;
3571e22f0603SYuri Benditovich     virtio_net_set_mrg_rx_bufs(n, 0, 0, 0);
35726e790746SPaolo Bonzini     n->promisc = 1; /* for compatibility */
35736e790746SPaolo Bonzini 
35746e790746SPaolo Bonzini     n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
35756e790746SPaolo Bonzini 
35766e790746SPaolo Bonzini     n->vlans = g_malloc0(MAX_VLAN >> 3);
35776e790746SPaolo Bonzini 
3578b1be4280SAmos Kong     nc = qemu_get_queue(n->nic);
3579b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
3580b1be4280SAmos Kong 
3581e87936eaSCindy Lu    if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
3582e87936eaSCindy Lu         struct virtio_net_config netcfg = {};
3583e87936eaSCindy Lu         memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN);
3584e87936eaSCindy Lu         vhost_net_set_config(get_vhost_net(nc->peer),
3585e87936eaSCindy Lu             (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_MASTER);
3586e87936eaSCindy Lu     }
35872974e916SYuri Benditovich     QTAILQ_INIT(&n->rsc_chains);
3588284a32f0SAndreas Färber     n->qdev = dev;
35894474e37aSYuri Benditovich 
35904474e37aSYuri Benditovich     net_rx_pkt_init(&n->rx_pkt, false);
35910145c393SAndrew Melnychenko 
35920145c393SAndrew Melnychenko     if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) {
35930145c393SAndrew Melnychenko         virtio_net_load_ebpf(n);
35940145c393SAndrew Melnychenko     }
359517ec5a86SKONRAD Frederic }
359617ec5a86SKONRAD Frederic 
3597b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev)
359817ec5a86SKONRAD Frederic {
3599306ec6c3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3600306ec6c3SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3601441537f1SJason Wang     int i, max_queue_pairs;
360217ec5a86SKONRAD Frederic 
36030145c393SAndrew Melnychenko     if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) {
36040145c393SAndrew Melnychenko         virtio_net_unload_ebpf(n);
36050145c393SAndrew Melnychenko     }
36060145c393SAndrew Melnychenko 
360717ec5a86SKONRAD Frederic     /* This will stop vhost backend if appropriate. */
360817ec5a86SKONRAD Frederic     virtio_net_set_status(vdev, 0);
360917ec5a86SKONRAD Frederic 
36108a253ec2SKONRAD Frederic     g_free(n->netclient_name);
36118a253ec2SKONRAD Frederic     n->netclient_name = NULL;
36128a253ec2SKONRAD Frederic     g_free(n->netclient_type);
36138a253ec2SKONRAD Frederic     n->netclient_type = NULL;
36148a253ec2SKONRAD Frederic 
361517ec5a86SKONRAD Frederic     g_free(n->mac_table.macs);
361617ec5a86SKONRAD Frederic     g_free(n->vlans);
361717ec5a86SKONRAD Frederic 
36189711cd0dSJens Freimann     if (n->failover) {
3619f3558b1bSKevin Wolf         qobject_unref(n->primary_opts);
362065018100SJuan Quintela         device_listener_unregister(&n->primary_listener);
36211e157667SLaurent Vivier         remove_migration_state_change_notifier(&n->migration_state);
3622f3558b1bSKevin Wolf     } else {
3623f3558b1bSKevin Wolf         assert(n->primary_opts == NULL);
36249711cd0dSJens Freimann     }
36259711cd0dSJens Freimann 
3626441537f1SJason Wang     max_queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
3627441537f1SJason Wang     for (i = 0; i < max_queue_pairs; i++) {
3628f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i);
362917ec5a86SKONRAD Frederic     }
3630d945d9f1SYuri Benditovich     /* delete also control vq */
3631441537f1SJason Wang     virtio_del_queue(vdev, max_queue_pairs * 2);
3632944458b6SDr. David Alan Gilbert     qemu_announce_timer_del(&n->announce_timer, false);
363317ec5a86SKONRAD Frederic     g_free(n->vqs);
363417ec5a86SKONRAD Frederic     qemu_del_nic(n->nic);
36352974e916SYuri Benditovich     virtio_net_rsc_cleanup(n);
363659079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
36374474e37aSYuri Benditovich     net_rx_pkt_uninit(n->rx_pkt);
36386a1a8cc7SKONRAD Frederic     virtio_cleanup(vdev);
363917ec5a86SKONRAD Frederic }
364017ec5a86SKONRAD Frederic 
364117ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj)
364217ec5a86SKONRAD Frederic {
364317ec5a86SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(obj);
364417ec5a86SKONRAD Frederic 
364517ec5a86SKONRAD Frederic     /*
364617ec5a86SKONRAD Frederic      * The default config_size is sizeof(struct virtio_net_config).
364717ec5a86SKONRAD Frederic      * Can be overriden with virtio_net_set_config_size.
364817ec5a86SKONRAD Frederic      */
364917ec5a86SKONRAD Frederic     n->config_size = sizeof(struct virtio_net_config);
3650aa4197c3SGonglei     device_add_bootindex_property(obj, &n->nic_conf.bootindex,
3651aa4197c3SGonglei                                   "bootindex", "/ethernet-phy@0",
365240c2281cSMarkus Armbruster                                   DEVICE(n));
36530145c393SAndrew Melnychenko 
36540145c393SAndrew Melnychenko     ebpf_rss_init(&n->ebpf_rss);
365517ec5a86SKONRAD Frederic }
365617ec5a86SKONRAD Frederic 
365744b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque)
36584d45dcfbSHalil Pasic {
36594d45dcfbSHalil Pasic     VirtIONet *n = opaque;
36604d45dcfbSHalil Pasic 
36614d45dcfbSHalil Pasic     /* At this point, backend must be stopped, otherwise
36624d45dcfbSHalil Pasic      * it might keep writing to memory. */
36634d45dcfbSHalil Pasic     assert(!n->vhost_started);
366444b1ff31SDr. David Alan Gilbert 
366544b1ff31SDr. David Alan Gilbert     return 0;
36664d45dcfbSHalil Pasic }
36674d45dcfbSHalil Pasic 
36689711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque)
36699711cd0dSJens Freimann {
36709711cd0dSJens Freimann     DeviceState *dev = opaque;
367121e8709bSJuan Quintela     DeviceState *primary;
36729711cd0dSJens Freimann     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
36739711cd0dSJens Freimann     VirtIONet *n = VIRTIO_NET(vdev);
36749711cd0dSJens Freimann 
3675284f42a5SJens Freimann     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) {
3676284f42a5SJens Freimann         return false;
3677284f42a5SJens Freimann     }
367821e8709bSJuan Quintela     primary = failover_find_primary_device(n);
367921e8709bSJuan Quintela     return primary ? primary->pending_deleted_event : false;
36809711cd0dSJens Freimann }
36819711cd0dSJens Freimann 
36829711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque)
36839711cd0dSJens Freimann {
36849711cd0dSJens Freimann     DeviceState *dev = opaque;
36859711cd0dSJens Freimann     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
36869711cd0dSJens Freimann 
36879711cd0dSJens Freimann     return vdc->primary_unplug_pending(dev);
36889711cd0dSJens Freimann }
36899711cd0dSJens Freimann 
3690c255488dSJonah Palmer static struct vhost_dev *virtio_net_get_vhost(VirtIODevice *vdev)
3691c255488dSJonah Palmer {
3692c255488dSJonah Palmer     VirtIONet *n = VIRTIO_NET(vdev);
3693c255488dSJonah Palmer     NetClientState *nc = qemu_get_queue(n->nic);
3694c255488dSJonah Palmer     struct vhost_net *net = get_vhost_net(nc->peer);
3695c255488dSJonah Palmer     return &net->dev;
3696c255488dSJonah Palmer }
3697c255488dSJonah Palmer 
36984d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = {
36994d45dcfbSHalil Pasic     .name = "virtio-net",
37004d45dcfbSHalil Pasic     .minimum_version_id = VIRTIO_NET_VM_VERSION,
37014d45dcfbSHalil Pasic     .version_id = VIRTIO_NET_VM_VERSION,
37024d45dcfbSHalil Pasic     .fields = (VMStateField[]) {
37034d45dcfbSHalil Pasic         VMSTATE_VIRTIO_DEVICE,
37044d45dcfbSHalil Pasic         VMSTATE_END_OF_LIST()
37054d45dcfbSHalil Pasic     },
37064d45dcfbSHalil Pasic     .pre_save = virtio_net_pre_save,
37079711cd0dSJens Freimann     .dev_unplug_pending = dev_unplug_pending,
37084d45dcfbSHalil Pasic };
3709290c2428SDr. David Alan Gilbert 
371017ec5a86SKONRAD Frederic static Property virtio_net_properties[] = {
3711127833eeSJason Baron     DEFINE_PROP_BIT64("csum", VirtIONet, host_features,
3712127833eeSJason Baron                     VIRTIO_NET_F_CSUM, true),
3713127833eeSJason Baron     DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features,
371487108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_CSUM, true),
3715127833eeSJason Baron     DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true),
3716127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features,
371787108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO4, true),
3718127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features,
371987108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO6, true),
3720127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features,
372187108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ECN, true),
3722127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features,
372387108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_UFO, true),
3724127833eeSJason Baron     DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features,
372587108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ANNOUNCE, true),
3726127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features,
372787108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO4, true),
3728127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features,
372987108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO6, true),
3730127833eeSJason Baron     DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features,
373187108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_ECN, true),
3732127833eeSJason Baron     DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features,
373387108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_UFO, true),
3734127833eeSJason Baron     DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features,
373587108bb2SShannon Zhao                     VIRTIO_NET_F_MRG_RXBUF, true),
3736127833eeSJason Baron     DEFINE_PROP_BIT64("status", VirtIONet, host_features,
373787108bb2SShannon Zhao                     VIRTIO_NET_F_STATUS, true),
3738127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features,
373987108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VQ, true),
3740127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features,
374187108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX, true),
3742127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features,
374387108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VLAN, true),
3744127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features,
374587108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX_EXTRA, true),
3746127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features,
374787108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_MAC_ADDR, true),
3748127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features,
374987108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true),
3750127833eeSJason Baron     DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false),
375159079029SYuri Benditovich     DEFINE_PROP_BIT64("rss", VirtIONet, host_features,
375259079029SYuri Benditovich                     VIRTIO_NET_F_RSS, false),
3753e22f0603SYuri Benditovich     DEFINE_PROP_BIT64("hash", VirtIONet, host_features,
3754e22f0603SYuri Benditovich                     VIRTIO_NET_F_HASH_REPORT, false),
37552974e916SYuri Benditovich     DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features,
37562974e916SYuri Benditovich                     VIRTIO_NET_F_RSC_EXT, false),
37572974e916SYuri Benditovich     DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout,
37582974e916SYuri Benditovich                        VIRTIO_NET_RSC_DEFAULT_INTERVAL),
375917ec5a86SKONRAD Frederic     DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
376017ec5a86SKONRAD Frederic     DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
376117ec5a86SKONRAD Frederic                        TX_TIMER_INTERVAL),
376217ec5a86SKONRAD Frederic     DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
376317ec5a86SKONRAD Frederic     DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
37641c0fbfa3SMichael S. Tsirkin     DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size,
37651c0fbfa3SMichael S. Tsirkin                        VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE),
37669b02e161SWei Wang     DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size,
37679b02e161SWei Wang                        VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE),
3768a93e599dSMaxime Coquelin     DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0),
376975ebec11SMaxime Coquelin     DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend,
377075ebec11SMaxime Coquelin                      true),
37719473939eSJason Baron     DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN),
37729473939eSJason Baron     DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str),
37739711cd0dSJens Freimann     DEFINE_PROP_BOOL("failover", VirtIONet, failover, false),
377417ec5a86SKONRAD Frederic     DEFINE_PROP_END_OF_LIST(),
377517ec5a86SKONRAD Frederic };
377617ec5a86SKONRAD Frederic 
377717ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data)
377817ec5a86SKONRAD Frederic {
377917ec5a86SKONRAD Frederic     DeviceClass *dc = DEVICE_CLASS(klass);
378017ec5a86SKONRAD Frederic     VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
3781e6f746b3SAndreas Färber 
37824f67d30bSMarc-André Lureau     device_class_set_props(dc, virtio_net_properties);
3783290c2428SDr. David Alan Gilbert     dc->vmsd = &vmstate_virtio_net;
3784125ee0edSMarcel Apfelbaum     set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
3785e6f746b3SAndreas Färber     vdc->realize = virtio_net_device_realize;
3786306ec6c3SAndreas Färber     vdc->unrealize = virtio_net_device_unrealize;
378717ec5a86SKONRAD Frederic     vdc->get_config = virtio_net_get_config;
378817ec5a86SKONRAD Frederic     vdc->set_config = virtio_net_set_config;
378917ec5a86SKONRAD Frederic     vdc->get_features = virtio_net_get_features;
379017ec5a86SKONRAD Frederic     vdc->set_features = virtio_net_set_features;
379117ec5a86SKONRAD Frederic     vdc->bad_features = virtio_net_bad_features;
379217ec5a86SKONRAD Frederic     vdc->reset = virtio_net_reset;
379317ec5a86SKONRAD Frederic     vdc->set_status = virtio_net_set_status;
379417ec5a86SKONRAD Frederic     vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
379517ec5a86SKONRAD Frederic     vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
37962a083ffdSMichael S. Tsirkin     vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO);
37977788c3f2SMikhail Sennikovsky     vdc->post_load = virtio_net_post_load_virtio;
3798982b78c5SDr. David Alan Gilbert     vdc->vmsd = &vmstate_virtio_net_device;
37999711cd0dSJens Freimann     vdc->primary_unplug_pending = primary_unplug_pending;
3800c255488dSJonah Palmer     vdc->get_vhost = virtio_net_get_vhost;
380117ec5a86SKONRAD Frederic }
380217ec5a86SKONRAD Frederic 
380317ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = {
380417ec5a86SKONRAD Frederic     .name = TYPE_VIRTIO_NET,
380517ec5a86SKONRAD Frederic     .parent = TYPE_VIRTIO_DEVICE,
380617ec5a86SKONRAD Frederic     .instance_size = sizeof(VirtIONet),
380717ec5a86SKONRAD Frederic     .instance_init = virtio_net_instance_init,
380817ec5a86SKONRAD Frederic     .class_init = virtio_net_class_init,
380917ec5a86SKONRAD Frederic };
381017ec5a86SKONRAD Frederic 
381117ec5a86SKONRAD Frederic static void virtio_register_types(void)
381217ec5a86SKONRAD Frederic {
381317ec5a86SKONRAD Frederic     type_register_static(&virtio_net_info);
381417ec5a86SKONRAD Frederic }
381517ec5a86SKONRAD Frederic 
381617ec5a86SKONRAD Frederic type_init(virtio_register_types)
3817