xref: /openbmc/qemu/hw/net/virtio-net.c (revision ebc141a62508dc91901373c1a19fe7e2cf560dfb)
16e790746SPaolo Bonzini /*
26e790746SPaolo Bonzini  * Virtio Network Device
36e790746SPaolo Bonzini  *
46e790746SPaolo Bonzini  * Copyright IBM, Corp. 2007
56e790746SPaolo Bonzini  *
66e790746SPaolo Bonzini  * Authors:
76e790746SPaolo Bonzini  *  Anthony Liguori   <aliguori@us.ibm.com>
86e790746SPaolo Bonzini  *
96e790746SPaolo Bonzini  * This work is licensed under the terms of the GNU GPL, version 2.  See
106e790746SPaolo Bonzini  * the COPYING file in the top-level directory.
116e790746SPaolo Bonzini  *
126e790746SPaolo Bonzini  */
136e790746SPaolo Bonzini 
149b8bfe21SPeter Maydell #include "qemu/osdep.h"
159711cd0dSJens Freimann #include "qemu/atomic.h"
166e790746SPaolo Bonzini #include "qemu/iov.h"
1768b0a639SSi-Wei Liu #include "qemu/log.h"
18db725815SMarkus Armbruster #include "qemu/main-loop.h"
190b8fa32fSMarkus Armbruster #include "qemu/module.h"
206e790746SPaolo Bonzini #include "hw/virtio/virtio.h"
216e790746SPaolo Bonzini #include "net/net.h"
226e790746SPaolo Bonzini #include "net/checksum.h"
236e790746SPaolo Bonzini #include "net/tap.h"
246e790746SPaolo Bonzini #include "qemu/error-report.h"
256e790746SPaolo Bonzini #include "qemu/timer.h"
269711cd0dSJens Freimann #include "qemu/option.h"
279711cd0dSJens Freimann #include "qemu/option_int.h"
289711cd0dSJens Freimann #include "qemu/config-file.h"
299711cd0dSJens Freimann #include "qapi/qmp/qdict.h"
306e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h"
316e790746SPaolo Bonzini #include "net/vhost_net.h"
329d8c6a25SDr. David Alan Gilbert #include "net/announce.h"
3317ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h"
34e688df6bSMarkus Armbruster #include "qapi/error.h"
359af23989SMarkus Armbruster #include "qapi/qapi-events-net.h"
36a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h"
379711cd0dSJens Freimann #include "qapi/qapi-types-migration.h"
389711cd0dSJens Freimann #include "qapi/qapi-events-migration.h"
391399c60dSRusty Russell #include "hw/virtio/virtio-access.h"
40f8d806c9SJuan Quintela #include "migration/misc.h"
419473939eSJason Baron #include "standard-headers/linux/ethtool.h"
422f780b6aSMarkus Armbruster #include "sysemu/sysemu.h"
439d8c6a25SDr. David Alan Gilbert #include "trace.h"
449711cd0dSJens Freimann #include "monitor/qdev.h"
459711cd0dSJens Freimann #include "hw/pci/pci.h"
464474e37aSYuri Benditovich #include "net_rx_pkt.h"
47108a6481SCindy Lu #include "hw/virtio/vhost.h"
481b529d90SLaurent Vivier #include "sysemu/qtest.h"
496e790746SPaolo Bonzini 
#define VIRTIO_NET_VM_VERSION    11

/* Number of VLAN IDs, per the 802.1Q definition. */
#define MAX_VLAN    (1 << 12)

/* Default ring sizes; 256 was previously a fixed value. */
#define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256
#define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256

/*
 * The minimum sizes equal the defaults, so for now only larger queues are
 * allowed; with virtio-1, the guest can downsize.
 */
#define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
#define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE
611c0fbfa3SMichael S. Tsirkin 
/* IPv4 source address + destination address, in bytes */
#define VIRTIO_NET_IP4_ADDR_SIZE   8

#define VIRTIO_NET_TCP_FLAG         0x3F
#define VIRTIO_NET_TCP_HDR_LENGTH   0xF000

/* Maximum IPv4 payload: the header carries the length in 16 bits */
#define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header))
#define VIRTIO_NET_MAX_TCP_PAYLOAD 65535

/* Value of the header length field of an IP header without options */
#define VIRTIO_NET_IP4_HEADER_LENGTH 5

/* IPv6 source address + destination address, in bytes */
#define VIRTIO_NET_IP6_ADDR_SIZE   32
#define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD

/*
 * Interval of the timer that purges coalesced packets.  This value affects
 * performance a lot and should be tuned carefully: '300000' (300us) is the
 * recommended value to pass the WHQL test, '50000' can gain 2x netperf
 * throughput with tso/gso/gro 'off'.
 */
#define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000
822974e916SYuri Benditovich 
/* Bitmask of hash types reported in the config space's supported_hash_types. */
#define VIRTIO_NET_RSS_SUPPORTED_HASHES \
    (VIRTIO_NET_RSS_HASH_TYPE_IPv4   | \
     VIRTIO_NET_RSS_HASH_TYPE_TCPv4  | \
     VIRTIO_NET_RSS_HASH_TYPE_UDPv4  | \
     VIRTIO_NET_RSS_HASH_TYPE_IPv6   | \
     VIRTIO_NET_RSS_HASH_TYPE_TCPv6  | \
     VIRTIO_NET_RSS_HASH_TYPE_UDPv6  | \
     VIRTIO_NET_RSS_HASH_TYPE_IP_EX  | \
     VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \
     VIRTIO_NET_RSS_HASH_TYPE_UDP_EX)
9259079029SYuri Benditovich 
93ad6461adSPhilippe Mathieu-Daudé static const VirtIOFeature feature_sizes[] = {
94127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MAC,
955d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mac)},
96127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_STATUS,
975d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, status)},
98127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MQ,
995d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
100127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MTU,
1015d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mtu)},
1029473939eSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX,
1035d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, duplex)},
104e22f0603SYuri Benditovich     {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT),
10559079029SYuri Benditovich      .end = endof(struct virtio_net_config, supported_hash_types)},
1066e790746SPaolo Bonzini     {}
1076e790746SPaolo Bonzini };
1086e790746SPaolo Bonzini 
109d74c30c8SDaniil Tatianin static const VirtIOConfigSizeParams cfg_size_params = {
110d74c30c8SDaniil Tatianin     .min_size = endof(struct virtio_net_config, mac),
111d74c30c8SDaniil Tatianin     .max_size = sizeof(struct virtio_net_config),
112d74c30c8SDaniil Tatianin     .feature_sizes = feature_sizes
113d74c30c8SDaniil Tatianin };
114d74c30c8SDaniil Tatianin 
1156e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
1166e790746SPaolo Bonzini {
1176e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1186e790746SPaolo Bonzini 
1196e790746SPaolo Bonzini     return &n->vqs[nc->queue_index];
1206e790746SPaolo Bonzini }
1216e790746SPaolo Bonzini 
/* Translate a virtqueue index into a queue index: two virtqueues per queue. */
static int vq2q(int queue_index)
{
    const int vqs_per_queue = 2;

    return queue_index / vqs_per_queue;
}
1266e790746SPaolo Bonzini 
1274fdf69abSKangjie Xu static void flush_or_purge_queued_packets(NetClientState *nc)
1284fdf69abSKangjie Xu {
1294fdf69abSKangjie Xu     if (!nc->peer) {
1304fdf69abSKangjie Xu         return;
1314fdf69abSKangjie Xu     }
1324fdf69abSKangjie Xu 
1334fdf69abSKangjie Xu     qemu_flush_or_purge_queued_packets(nc->peer, true);
1344fdf69abSKangjie Xu     assert(!virtio_net_get_subqueue(nc)->async_tx.elem);
1354fdf69abSKangjie Xu }
1364fdf69abSKangjie Xu 
1376e790746SPaolo Bonzini /* TODO
1386e790746SPaolo Bonzini  * - we could suppress RX interrupt if we were so inclined.
1396e790746SPaolo Bonzini  */
1406e790746SPaolo Bonzini 
1416e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
1426e790746SPaolo Bonzini {
14317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1446e790746SPaolo Bonzini     struct virtio_net_config netcfg;
145c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
146fb592882SCindy Lu     static const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } };
1476e790746SPaolo Bonzini 
148108a6481SCindy Lu     int ret = 0;
149108a6481SCindy Lu     memset(&netcfg, 0 , sizeof(struct virtio_net_config));
1501399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.status, n->status);
151441537f1SJason Wang     virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queue_pairs);
152a93e599dSMaxime Coquelin     virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu);
1536e790746SPaolo Bonzini     memcpy(netcfg.mac, n->mac, ETH_ALEN);
1549473939eSJason Baron     virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed);
1559473939eSJason Baron     netcfg.duplex = n->net_conf.duplex;
15659079029SYuri Benditovich     netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE;
15759079029SYuri Benditovich     virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length,
158e22f0603SYuri Benditovich                  virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ?
159e22f0603SYuri Benditovich                  VIRTIO_NET_RSS_MAX_TABLE_LEN : 1);
16059079029SYuri Benditovich     virtio_stl_p(vdev, &netcfg.supported_hash_types,
16159079029SYuri Benditovich                  VIRTIO_NET_RSS_SUPPORTED_HASHES);
1626e790746SPaolo Bonzini     memcpy(config, &netcfg, n->config_size);
163108a6481SCindy Lu 
164c546ecf2SJason Wang     /*
165c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
166c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
167c546ecf2SJason Wang      */
168c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
169108a6481SCindy Lu         ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg,
170108a6481SCindy Lu                                    n->config_size);
171*ebc141a6SEugenio Pérez         if (ret == -1) {
172*ebc141a6SEugenio Pérez             return;
173*ebc141a6SEugenio Pérez         }
174*ebc141a6SEugenio Pérez 
175fb592882SCindy Lu         /*
176*ebc141a6SEugenio Pérez          * Some NIC/kernel combinations present 0 as the mac address.  As that
177*ebc141a6SEugenio Pérez          * is not a legal address, try to proceed with the address from the
178*ebc141a6SEugenio Pérez          * QEMU command line in the hope that the address has been configured
179*ebc141a6SEugenio Pérez          * correctly elsewhere - just not reported by the device.
180fb592882SCindy Lu          */
181fb592882SCindy Lu         if (memcmp(&netcfg.mac, &zero, sizeof(zero)) == 0) {
182fb592882SCindy Lu             info_report("Zero hardware mac address detected. Ignoring.");
183fb592882SCindy Lu             memcpy(netcfg.mac, n->mac, ETH_ALEN);
184fb592882SCindy Lu         }
185*ebc141a6SEugenio Pérez 
186108a6481SCindy Lu         memcpy(config, &netcfg, n->config_size);
187108a6481SCindy Lu     }
188108a6481SCindy Lu }
1896e790746SPaolo Bonzini 
1906e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
1916e790746SPaolo Bonzini {
19217a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1936e790746SPaolo Bonzini     struct virtio_net_config netcfg = {};
194c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
1956e790746SPaolo Bonzini 
1966e790746SPaolo Bonzini     memcpy(&netcfg, config, n->config_size);
1976e790746SPaolo Bonzini 
19895129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) &&
19995129d6fSCornelia Huck         !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) &&
2006e790746SPaolo Bonzini         memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
2016e790746SPaolo Bonzini         memcpy(n->mac, netcfg.mac, ETH_ALEN);
2026e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
2036e790746SPaolo Bonzini     }
204108a6481SCindy Lu 
205c546ecf2SJason Wang     /*
206c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
207c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
208c546ecf2SJason Wang      */
209c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
210c546ecf2SJason Wang         vhost_net_set_config(get_vhost_net(nc->peer),
211c546ecf2SJason Wang                              (uint8_t *)&netcfg, 0, n->config_size,
212108a6481SCindy Lu                              VHOST_SET_CONFIG_TYPE_MASTER);
213108a6481SCindy Lu       }
2146e790746SPaolo Bonzini }
2156e790746SPaolo Bonzini 
2166e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status)
2176e790746SPaolo Bonzini {
21817a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2196e790746SPaolo Bonzini     return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
22017a0ca55SKONRAD Frederic         (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
2216e790746SPaolo Bonzini }
2226e790746SPaolo Bonzini 
223b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net)
224b2c929f0SDr. David Alan Gilbert {
225b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(net);
226b2c929f0SDr. David Alan Gilbert     trace_virtio_net_announce_notify();
227b2c929f0SDr. David Alan Gilbert 
228b2c929f0SDr. David Alan Gilbert     net->status |= VIRTIO_NET_S_ANNOUNCE;
229b2c929f0SDr. David Alan Gilbert     virtio_notify_config(vdev);
230b2c929f0SDr. David Alan Gilbert }
231b2c929f0SDr. David Alan Gilbert 
232f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque)
233f57fcf70SJason Wang {
234f57fcf70SJason Wang     VirtIONet *n = opaque;
2359d8c6a25SDr. David Alan Gilbert     trace_virtio_net_announce_timer(n->announce_timer.round);
236f57fcf70SJason Wang 
2379d8c6a25SDr. David Alan Gilbert     n->announce_timer.round--;
238b2c929f0SDr. David Alan Gilbert     virtio_net_announce_notify(n);
239b2c929f0SDr. David Alan Gilbert }
240b2c929f0SDr. David Alan Gilbert 
241b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc)
242b2c929f0SDr. David Alan Gilbert {
243b2c929f0SDr. David Alan Gilbert     VirtIONet *n = qemu_get_nic_opaque(nc);
244b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
245b2c929f0SDr. David Alan Gilbert 
246b2c929f0SDr. David Alan Gilbert     /*
247b2c929f0SDr. David Alan Gilbert      * Make sure the virtio migration announcement timer isn't running
248b2c929f0SDr. David Alan Gilbert      * If it is, let it trigger announcement so that we do not cause
249b2c929f0SDr. David Alan Gilbert      * confusion.
250b2c929f0SDr. David Alan Gilbert      */
251b2c929f0SDr. David Alan Gilbert     if (n->announce_timer.round) {
252b2c929f0SDr. David Alan Gilbert         return;
253b2c929f0SDr. David Alan Gilbert     }
254b2c929f0SDr. David Alan Gilbert 
255b2c929f0SDr. David Alan Gilbert     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
256b2c929f0SDr. David Alan Gilbert         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
257b2c929f0SDr. David Alan Gilbert             virtio_net_announce_notify(n);
258b2c929f0SDr. David Alan Gilbert     }
259f57fcf70SJason Wang }
260f57fcf70SJason Wang 
2616e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
2626e790746SPaolo Bonzini {
26317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2646e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
265441537f1SJason Wang     int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
266aa858194SSi-Wei Liu     int cvq = virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ) ?
267aa858194SSi-Wei Liu               n->max_ncs - n->max_queue_pairs : 0;
2686e790746SPaolo Bonzini 
269ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
2706e790746SPaolo Bonzini         return;
2716e790746SPaolo Bonzini     }
2726e790746SPaolo Bonzini 
2738c1ac475SRadim Krčmář     if ((virtio_net_started(n, status) && !nc->peer->link_down) ==
2748c1ac475SRadim Krčmář         !!n->vhost_started) {
2756e790746SPaolo Bonzini         return;
2766e790746SPaolo Bonzini     }
2776e790746SPaolo Bonzini     if (!n->vhost_started) {
278086abc1cSMichael S. Tsirkin         int r, i;
279086abc1cSMichael S. Tsirkin 
2801bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
2811bfa316cSGreg Kurz             error_report("backend does not support %s vnet headers; "
2821bfa316cSGreg Kurz                          "falling back on userspace virtio",
2831bfa316cSGreg Kurz                          virtio_is_big_endian(vdev) ? "BE" : "LE");
2841bfa316cSGreg Kurz             return;
2851bfa316cSGreg Kurz         }
2861bfa316cSGreg Kurz 
287086abc1cSMichael S. Tsirkin         /* Any packets outstanding? Purge them to avoid touching rings
288086abc1cSMichael S. Tsirkin          * when vhost is running.
289086abc1cSMichael S. Tsirkin          */
290441537f1SJason Wang         for (i = 0;  i < queue_pairs; i++) {
291086abc1cSMichael S. Tsirkin             NetClientState *qnc = qemu_get_subqueue(n->nic, i);
292086abc1cSMichael S. Tsirkin 
293086abc1cSMichael S. Tsirkin             /* Purge both directions: TX and RX. */
294086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->peer->incoming_queue, qnc);
295086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->incoming_queue, qnc->peer);
296086abc1cSMichael S. Tsirkin         }
297086abc1cSMichael S. Tsirkin 
298a93e599dSMaxime Coquelin         if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) {
299a93e599dSMaxime Coquelin             r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu);
300a93e599dSMaxime Coquelin             if (r < 0) {
301a93e599dSMaxime Coquelin                 error_report("%uBytes MTU not supported by the backend",
302a93e599dSMaxime Coquelin                              n->net_conf.mtu);
303a93e599dSMaxime Coquelin 
304a93e599dSMaxime Coquelin                 return;
305a93e599dSMaxime Coquelin             }
306a93e599dSMaxime Coquelin         }
307a93e599dSMaxime Coquelin 
3086e790746SPaolo Bonzini         n->vhost_started = 1;
30922288fe5SJason Wang         r = vhost_net_start(vdev, n->nic->ncs, queue_pairs, cvq);
3106e790746SPaolo Bonzini         if (r < 0) {
3116e790746SPaolo Bonzini             error_report("unable to start vhost net: %d: "
3126e790746SPaolo Bonzini                          "falling back on userspace virtio", -r);
3136e790746SPaolo Bonzini             n->vhost_started = 0;
3146e790746SPaolo Bonzini         }
3156e790746SPaolo Bonzini     } else {
31622288fe5SJason Wang         vhost_net_stop(vdev, n->nic->ncs, queue_pairs, cvq);
3176e790746SPaolo Bonzini         n->vhost_started = 0;
3186e790746SPaolo Bonzini     }
3196e790746SPaolo Bonzini }
3206e790746SPaolo Bonzini 
3211bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev,
3221bfa316cSGreg Kurz                                           NetClientState *peer,
3231bfa316cSGreg Kurz                                           bool enable)
3241bfa316cSGreg Kurz {
3251bfa316cSGreg Kurz     if (virtio_is_big_endian(vdev)) {
3261bfa316cSGreg Kurz         return qemu_set_vnet_be(peer, enable);
3271bfa316cSGreg Kurz     } else {
3281bfa316cSGreg Kurz         return qemu_set_vnet_le(peer, enable);
3291bfa316cSGreg Kurz     }
3301bfa316cSGreg Kurz }
3311bfa316cSGreg Kurz 
3321bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs,
333441537f1SJason Wang                                        int queue_pairs, bool enable)
3341bfa316cSGreg Kurz {
3351bfa316cSGreg Kurz     int i;
3361bfa316cSGreg Kurz 
337441537f1SJason Wang     for (i = 0; i < queue_pairs; i++) {
3381bfa316cSGreg Kurz         if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 &&
3391bfa316cSGreg Kurz             enable) {
3401bfa316cSGreg Kurz             while (--i >= 0) {
3411bfa316cSGreg Kurz                 virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false);
3421bfa316cSGreg Kurz             }
3431bfa316cSGreg Kurz 
3441bfa316cSGreg Kurz             return true;
3451bfa316cSGreg Kurz         }
3461bfa316cSGreg Kurz     }
3471bfa316cSGreg Kurz 
3481bfa316cSGreg Kurz     return false;
3491bfa316cSGreg Kurz }
3501bfa316cSGreg Kurz 
3511bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status)
3521bfa316cSGreg Kurz {
3531bfa316cSGreg Kurz     VirtIODevice *vdev = VIRTIO_DEVICE(n);
354441537f1SJason Wang     int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
3551bfa316cSGreg Kurz 
3561bfa316cSGreg Kurz     if (virtio_net_started(n, status)) {
3571bfa316cSGreg Kurz         /* Before using the device, we tell the network backend about the
3581bfa316cSGreg Kurz          * endianness to use when parsing vnet headers. If the backend
3591bfa316cSGreg Kurz          * can't do it, we fallback onto fixing the headers in the core
3601bfa316cSGreg Kurz          * virtio-net code.
3611bfa316cSGreg Kurz          */
3621bfa316cSGreg Kurz         n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs,
363441537f1SJason Wang                                                             queue_pairs, true);
3641bfa316cSGreg Kurz     } else if (virtio_net_started(n, vdev->status)) {
3651bfa316cSGreg Kurz         /* After using the device, we need to reset the network backend to
3661bfa316cSGreg Kurz          * the default (guest native endianness), otherwise the guest may
3671bfa316cSGreg Kurz          * lose network connectivity if it is rebooted into a different
3681bfa316cSGreg Kurz          * endianness.
3691bfa316cSGreg Kurz          */
370441537f1SJason Wang         virtio_net_set_vnet_endian(vdev, n->nic->ncs, queue_pairs, false);
3711bfa316cSGreg Kurz     }
3721bfa316cSGreg Kurz }
3731bfa316cSGreg Kurz 
374283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq)
375283e2c2aSYuri Benditovich {
376283e2c2aSYuri Benditovich     unsigned int dropped = virtqueue_drop_all(vq);
377283e2c2aSYuri Benditovich     if (dropped) {
378283e2c2aSYuri Benditovich         virtio_notify(vdev, vq);
379283e2c2aSYuri Benditovich     }
380283e2c2aSYuri Benditovich }
381283e2c2aSYuri Benditovich 
3826e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
3836e790746SPaolo Bonzini {
38417a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
3856e790746SPaolo Bonzini     VirtIONetQueue *q;
3866e790746SPaolo Bonzini     int i;
3876e790746SPaolo Bonzini     uint8_t queue_status;
3886e790746SPaolo Bonzini 
3891bfa316cSGreg Kurz     virtio_net_vnet_endian_status(n, status);
3906e790746SPaolo Bonzini     virtio_net_vhost_status(n, status);
3916e790746SPaolo Bonzini 
392441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
39338705bb5SFam Zheng         NetClientState *ncs = qemu_get_subqueue(n->nic, i);
39438705bb5SFam Zheng         bool queue_started;
3956e790746SPaolo Bonzini         q = &n->vqs[i];
3966e790746SPaolo Bonzini 
397441537f1SJason Wang         if ((!n->multiqueue && i != 0) || i >= n->curr_queue_pairs) {
3986e790746SPaolo Bonzini             queue_status = 0;
3996e790746SPaolo Bonzini         } else {
4006e790746SPaolo Bonzini             queue_status = status;
4016e790746SPaolo Bonzini         }
40238705bb5SFam Zheng         queue_started =
40338705bb5SFam Zheng             virtio_net_started(n, queue_status) && !n->vhost_started;
40438705bb5SFam Zheng 
40538705bb5SFam Zheng         if (queue_started) {
40638705bb5SFam Zheng             qemu_flush_queued_packets(ncs);
40738705bb5SFam Zheng         }
4086e790746SPaolo Bonzini 
4096e790746SPaolo Bonzini         if (!q->tx_waiting) {
4106e790746SPaolo Bonzini             continue;
4116e790746SPaolo Bonzini         }
4126e790746SPaolo Bonzini 
41338705bb5SFam Zheng         if (queue_started) {
4146e790746SPaolo Bonzini             if (q->tx_timer) {
415bc72ad67SAlex Bligh                 timer_mod(q->tx_timer,
416bc72ad67SAlex Bligh                                qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
4176e790746SPaolo Bonzini             } else {
4186e790746SPaolo Bonzini                 qemu_bh_schedule(q->tx_bh);
4196e790746SPaolo Bonzini             }
4206e790746SPaolo Bonzini         } else {
4216e790746SPaolo Bonzini             if (q->tx_timer) {
422bc72ad67SAlex Bligh                 timer_del(q->tx_timer);
4236e790746SPaolo Bonzini             } else {
4246e790746SPaolo Bonzini                 qemu_bh_cancel(q->tx_bh);
4256e790746SPaolo Bonzini             }
426283e2c2aSYuri Benditovich             if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 &&
42770e53e6eSJason Wang                 (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) &&
42870e53e6eSJason Wang                 vdev->vm_running) {
429283e2c2aSYuri Benditovich                 /* if tx is waiting we are likely have some packets in tx queue
430283e2c2aSYuri Benditovich                  * and disabled notification */
431283e2c2aSYuri Benditovich                 q->tx_waiting = 0;
432283e2c2aSYuri Benditovich                 virtio_queue_set_notification(q->tx_vq, 1);
433283e2c2aSYuri Benditovich                 virtio_net_drop_tx_queue_data(vdev, q->tx_vq);
434283e2c2aSYuri Benditovich             }
4356e790746SPaolo Bonzini         }
4366e790746SPaolo Bonzini     }
4376e790746SPaolo Bonzini }
4386e790746SPaolo Bonzini 
4396e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc)
4406e790746SPaolo Bonzini {
4416e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
44217a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
4436e790746SPaolo Bonzini     uint16_t old_status = n->status;
4446e790746SPaolo Bonzini 
4456e790746SPaolo Bonzini     if (nc->link_down)
4466e790746SPaolo Bonzini         n->status &= ~VIRTIO_NET_S_LINK_UP;
4476e790746SPaolo Bonzini     else
4486e790746SPaolo Bonzini         n->status |= VIRTIO_NET_S_LINK_UP;
4496e790746SPaolo Bonzini 
4506e790746SPaolo Bonzini     if (n->status != old_status)
45117a0ca55SKONRAD Frederic         virtio_notify_config(vdev);
4526e790746SPaolo Bonzini 
45317a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
4546e790746SPaolo Bonzini }
4556e790746SPaolo Bonzini 
456b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc)
457b1be4280SAmos Kong {
458b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
459b1be4280SAmos Kong 
460b1be4280SAmos Kong     if (nc->rxfilter_notify_enabled) {
461ddfb0baaSMarkus Armbruster         char *path = object_get_canonical_path(OBJECT(n->qdev));
4627480874aSMarkus Armbruster         qapi_event_send_nic_rx_filter_changed(n->netclient_name, path);
46396e35046SAmos Kong         g_free(path);
464b1be4280SAmos Kong 
465b1be4280SAmos Kong         /* disable event notification to avoid events flooding */
466b1be4280SAmos Kong         nc->rxfilter_notify_enabled = 0;
467b1be4280SAmos Kong     }
468b1be4280SAmos Kong }
469b1be4280SAmos Kong 
470f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n)
471f7bc8ef8SAmos Kong {
47254aa3de7SEric Blake     intList *list;
473f7bc8ef8SAmos Kong     int i, j;
474f7bc8ef8SAmos Kong 
475f7bc8ef8SAmos Kong     list = NULL;
476f7bc8ef8SAmos Kong     for (i = 0; i < MAX_VLAN >> 5; i++) {
477f7bc8ef8SAmos Kong         for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
478f7bc8ef8SAmos Kong             if (n->vlans[i] & (1U << j)) {
47954aa3de7SEric Blake                 QAPI_LIST_PREPEND(list, (i << 5) + j);
480f7bc8ef8SAmos Kong             }
481f7bc8ef8SAmos Kong         }
482f7bc8ef8SAmos Kong     }
483f7bc8ef8SAmos Kong 
484f7bc8ef8SAmos Kong     return list;
485f7bc8ef8SAmos Kong }
486f7bc8ef8SAmos Kong 
487b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
488b1be4280SAmos Kong {
489b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
490f7bc8ef8SAmos Kong     VirtIODevice *vdev = VIRTIO_DEVICE(n);
491b1be4280SAmos Kong     RxFilterInfo *info;
49254aa3de7SEric Blake     strList *str_list;
493f7bc8ef8SAmos Kong     int i;
494b1be4280SAmos Kong 
495b1be4280SAmos Kong     info = g_malloc0(sizeof(*info));
496b1be4280SAmos Kong     info->name = g_strdup(nc->name);
497b1be4280SAmos Kong     info->promiscuous = n->promisc;
498b1be4280SAmos Kong 
499b1be4280SAmos Kong     if (n->nouni) {
500b1be4280SAmos Kong         info->unicast = RX_STATE_NONE;
501b1be4280SAmos Kong     } else if (n->alluni) {
502b1be4280SAmos Kong         info->unicast = RX_STATE_ALL;
503b1be4280SAmos Kong     } else {
504b1be4280SAmos Kong         info->unicast = RX_STATE_NORMAL;
505b1be4280SAmos Kong     }
506b1be4280SAmos Kong 
507b1be4280SAmos Kong     if (n->nomulti) {
508b1be4280SAmos Kong         info->multicast = RX_STATE_NONE;
509b1be4280SAmos Kong     } else if (n->allmulti) {
510b1be4280SAmos Kong         info->multicast = RX_STATE_ALL;
511b1be4280SAmos Kong     } else {
512b1be4280SAmos Kong         info->multicast = RX_STATE_NORMAL;
513b1be4280SAmos Kong     }
514b1be4280SAmos Kong 
515b1be4280SAmos Kong     info->broadcast_allowed = n->nobcast;
516b1be4280SAmos Kong     info->multicast_overflow = n->mac_table.multi_overflow;
517b1be4280SAmos Kong     info->unicast_overflow = n->mac_table.uni_overflow;
518b1be4280SAmos Kong 
519b0575ba4SScott Feldman     info->main_mac = qemu_mac_strdup_printf(n->mac);
520b1be4280SAmos Kong 
521b1be4280SAmos Kong     str_list = NULL;
522b1be4280SAmos Kong     for (i = 0; i < n->mac_table.first_multi; i++) {
52354aa3de7SEric Blake         QAPI_LIST_PREPEND(str_list,
52454aa3de7SEric Blake                       qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN));
525b1be4280SAmos Kong     }
526b1be4280SAmos Kong     info->unicast_table = str_list;
527b1be4280SAmos Kong 
528b1be4280SAmos Kong     str_list = NULL;
529b1be4280SAmos Kong     for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
53054aa3de7SEric Blake         QAPI_LIST_PREPEND(str_list,
53154aa3de7SEric Blake                       qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN));
532b1be4280SAmos Kong     }
533b1be4280SAmos Kong     info->multicast_table = str_list;
534f7bc8ef8SAmos Kong     info->vlan_table = get_vlan_table(n);
535b1be4280SAmos Kong 
53695129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) {
537f7bc8ef8SAmos Kong         info->vlan = RX_STATE_ALL;
538f7bc8ef8SAmos Kong     } else if (!info->vlan_table) {
539f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NONE;
540f7bc8ef8SAmos Kong     } else {
541f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NORMAL;
542b1be4280SAmos Kong     }
543b1be4280SAmos Kong 
544b1be4280SAmos Kong     /* enable event notification after query */
545b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
546b1be4280SAmos Kong 
547b1be4280SAmos Kong     return info;
548b1be4280SAmos Kong }
549b1be4280SAmos Kong 
5507dc6be52SXuan Zhuo static void virtio_net_queue_reset(VirtIODevice *vdev, uint32_t queue_index)
5517dc6be52SXuan Zhuo {
5527dc6be52SXuan Zhuo     VirtIONet *n = VIRTIO_NET(vdev);
553f47af0afSXuan Zhuo     NetClientState *nc;
554f47af0afSXuan Zhuo 
555f47af0afSXuan Zhuo     /* validate queue_index and skip for cvq */
556f47af0afSXuan Zhuo     if (queue_index >= n->max_queue_pairs * 2) {
557f47af0afSXuan Zhuo         return;
558f47af0afSXuan Zhuo     }
559f47af0afSXuan Zhuo 
560f47af0afSXuan Zhuo     nc = qemu_get_subqueue(n->nic, vq2q(queue_index));
5617dc6be52SXuan Zhuo 
5627dc6be52SXuan Zhuo     if (!nc->peer) {
5637dc6be52SXuan Zhuo         return;
5647dc6be52SXuan Zhuo     }
5657dc6be52SXuan Zhuo 
5667dc6be52SXuan Zhuo     if (get_vhost_net(nc->peer) &&
5677dc6be52SXuan Zhuo         nc->peer->info->type == NET_CLIENT_DRIVER_TAP) {
5687dc6be52SXuan Zhuo         vhost_net_virtqueue_reset(vdev, nc, queue_index);
5697dc6be52SXuan Zhuo     }
5707dc6be52SXuan Zhuo 
5717dc6be52SXuan Zhuo     flush_or_purge_queued_packets(nc);
5727dc6be52SXuan Zhuo }
5737dc6be52SXuan Zhuo 
5747f863302SKangjie Xu static void virtio_net_queue_enable(VirtIODevice *vdev, uint32_t queue_index)
5757f863302SKangjie Xu {
5767f863302SKangjie Xu     VirtIONet *n = VIRTIO_NET(vdev);
577f47af0afSXuan Zhuo     NetClientState *nc;
5787f863302SKangjie Xu     int r;
5797f863302SKangjie Xu 
580f47af0afSXuan Zhuo     /* validate queue_index and skip for cvq */
581f47af0afSXuan Zhuo     if (queue_index >= n->max_queue_pairs * 2) {
582f47af0afSXuan Zhuo         return;
583f47af0afSXuan Zhuo     }
584f47af0afSXuan Zhuo 
585f47af0afSXuan Zhuo     nc = qemu_get_subqueue(n->nic, vq2q(queue_index));
586f47af0afSXuan Zhuo 
5877f863302SKangjie Xu     if (!nc->peer || !vdev->vhost_started) {
5887f863302SKangjie Xu         return;
5897f863302SKangjie Xu     }
5907f863302SKangjie Xu 
5917f863302SKangjie Xu     if (get_vhost_net(nc->peer) &&
5927f863302SKangjie Xu         nc->peer->info->type == NET_CLIENT_DRIVER_TAP) {
5937f863302SKangjie Xu         r = vhost_net_virtqueue_restart(vdev, nc, queue_index);
5947f863302SKangjie Xu         if (r < 0) {
5957f863302SKangjie Xu             error_report("unable to restart vhost net virtqueue: %d, "
5967f863302SKangjie Xu                             "when resetting the queue", queue_index);
5977f863302SKangjie Xu         }
5987f863302SKangjie Xu     }
5997f863302SKangjie Xu }
6007f863302SKangjie Xu 
6016e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev)
6026e790746SPaolo Bonzini {
60317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
60494b52958SGreg Kurz     int i;
6056e790746SPaolo Bonzini 
6066e790746SPaolo Bonzini     /* Reset back to compatibility mode */
6076e790746SPaolo Bonzini     n->promisc = 1;
6086e790746SPaolo Bonzini     n->allmulti = 0;
6096e790746SPaolo Bonzini     n->alluni = 0;
6106e790746SPaolo Bonzini     n->nomulti = 0;
6116e790746SPaolo Bonzini     n->nouni = 0;
6126e790746SPaolo Bonzini     n->nobcast = 0;
6136e790746SPaolo Bonzini     /* multiqueue is disabled by default */
614441537f1SJason Wang     n->curr_queue_pairs = 1;
6159d8c6a25SDr. David Alan Gilbert     timer_del(n->announce_timer.tm);
6169d8c6a25SDr. David Alan Gilbert     n->announce_timer.round = 0;
617f57fcf70SJason Wang     n->status &= ~VIRTIO_NET_S_ANNOUNCE;
6186e790746SPaolo Bonzini 
6196e790746SPaolo Bonzini     /* Flush any MAC and VLAN filter table state */
6206e790746SPaolo Bonzini     n->mac_table.in_use = 0;
6216e790746SPaolo Bonzini     n->mac_table.first_multi = 0;
6226e790746SPaolo Bonzini     n->mac_table.multi_overflow = 0;
6236e790746SPaolo Bonzini     n->mac_table.uni_overflow = 0;
6246e790746SPaolo Bonzini     memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
6256e790746SPaolo Bonzini     memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
626702d66a8SMichael S. Tsirkin     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
6276e790746SPaolo Bonzini     memset(n->vlans, 0, MAX_VLAN >> 3);
62894b52958SGreg Kurz 
62994b52958SGreg Kurz     /* Flush any async TX */
630441537f1SJason Wang     for (i = 0;  i < n->max_queue_pairs; i++) {
6314fdf69abSKangjie Xu         flush_or_purge_queued_packets(qemu_get_subqueue(n->nic, i));
63294b52958SGreg Kurz     }
6336e790746SPaolo Bonzini }
6346e790746SPaolo Bonzini 
6356e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n)
6366e790746SPaolo Bonzini {
6376e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
6386e790746SPaolo Bonzini     if (!nc->peer) {
6396e790746SPaolo Bonzini         return;
6406e790746SPaolo Bonzini     }
6416e790746SPaolo Bonzini 
642d6085e3aSStefan Hajnoczi     n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
6436e790746SPaolo Bonzini }
6446e790746SPaolo Bonzini 
6456e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n)
6466e790746SPaolo Bonzini {
6476e790746SPaolo Bonzini     return n->has_vnet_hdr;
6486e790746SPaolo Bonzini }
6496e790746SPaolo Bonzini 
6506e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n)
6516e790746SPaolo Bonzini {
6526e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n))
6536e790746SPaolo Bonzini         return 0;
6546e790746SPaolo Bonzini 
655d6085e3aSStefan Hajnoczi     n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
6566e790746SPaolo Bonzini 
6576e790746SPaolo Bonzini     return n->has_ufo;
6586e790746SPaolo Bonzini }
6596e790746SPaolo Bonzini 
660bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs,
661e22f0603SYuri Benditovich                                        int version_1, int hash_report)
6626e790746SPaolo Bonzini {
6636e790746SPaolo Bonzini     int i;
6646e790746SPaolo Bonzini     NetClientState *nc;
6656e790746SPaolo Bonzini 
6666e790746SPaolo Bonzini     n->mergeable_rx_bufs = mergeable_rx_bufs;
6676e790746SPaolo Bonzini 
668bb9d17f8SCornelia Huck     if (version_1) {
669e22f0603SYuri Benditovich         n->guest_hdr_len = hash_report ?
670e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_v1_hash) :
671e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_mrg_rxbuf);
672e22f0603SYuri Benditovich         n->rss_data.populate_hash = !!hash_report;
673bb9d17f8SCornelia Huck     } else {
6746e790746SPaolo Bonzini         n->guest_hdr_len = n->mergeable_rx_bufs ?
675bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr_mrg_rxbuf) :
676bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr);
677bb9d17f8SCornelia Huck     }
6786e790746SPaolo Bonzini 
679441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
6806e790746SPaolo Bonzini         nc = qemu_get_subqueue(n->nic, i);
6816e790746SPaolo Bonzini 
6826e790746SPaolo Bonzini         if (peer_has_vnet_hdr(n) &&
683d6085e3aSStefan Hajnoczi             qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
684d6085e3aSStefan Hajnoczi             qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
6856e790746SPaolo Bonzini             n->host_hdr_len = n->guest_hdr_len;
6866e790746SPaolo Bonzini         }
6876e790746SPaolo Bonzini     }
6886e790746SPaolo Bonzini }
6896e790746SPaolo Bonzini 
6902eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n)
6912eef278bSMichael S. Tsirkin {
6922eef278bSMichael S. Tsirkin     NetClientState *peer = n->nic_conf.peers.ncs[0];
6932eef278bSMichael S. Tsirkin 
6942eef278bSMichael S. Tsirkin     /*
6950ea5778fSEugenio Pérez      * Backends other than vhost-user or vhost-vdpa don't support max queue
6960ea5778fSEugenio Pérez      * size.
6972eef278bSMichael S. Tsirkin      */
6982eef278bSMichael S. Tsirkin     if (!peer) {
6992eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
7002eef278bSMichael S. Tsirkin     }
7012eef278bSMichael S. Tsirkin 
7020ea5778fSEugenio Pérez     switch(peer->info->type) {
7030ea5778fSEugenio Pérez     case NET_CLIENT_DRIVER_VHOST_USER:
7040ea5778fSEugenio Pérez     case NET_CLIENT_DRIVER_VHOST_VDPA:
7052eef278bSMichael S. Tsirkin         return VIRTQUEUE_MAX_SIZE;
7060ea5778fSEugenio Pérez     default:
7070ea5778fSEugenio Pérez         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
7080ea5778fSEugenio Pérez     };
7092eef278bSMichael S. Tsirkin }
7102eef278bSMichael S. Tsirkin 
7116e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index)
7126e790746SPaolo Bonzini {
7136e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
7146e790746SPaolo Bonzini 
7156e790746SPaolo Bonzini     if (!nc->peer) {
7166e790746SPaolo Bonzini         return 0;
7176e790746SPaolo Bonzini     }
7186e790746SPaolo Bonzini 
719f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
7207263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 1);
7217263a0adSChangchun Ouyang     }
7227263a0adSChangchun Ouyang 
723f394b2e2SEric Blake     if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
7246e790746SPaolo Bonzini         return 0;
7256e790746SPaolo Bonzini     }
7266e790746SPaolo Bonzini 
727441537f1SJason Wang     if (n->max_queue_pairs == 1) {
7281074b879SJason Wang         return 0;
7291074b879SJason Wang     }
7301074b879SJason Wang 
7316e790746SPaolo Bonzini     return tap_enable(nc->peer);
7326e790746SPaolo Bonzini }
7336e790746SPaolo Bonzini 
7346e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index)
7356e790746SPaolo Bonzini {
7366e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
7376e790746SPaolo Bonzini 
7386e790746SPaolo Bonzini     if (!nc->peer) {
7396e790746SPaolo Bonzini         return 0;
7406e790746SPaolo Bonzini     }
7416e790746SPaolo Bonzini 
742f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
7437263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 0);
7447263a0adSChangchun Ouyang     }
7457263a0adSChangchun Ouyang 
746f394b2e2SEric Blake     if (nc->peer->info->type !=  NET_CLIENT_DRIVER_TAP) {
7476e790746SPaolo Bonzini         return 0;
7486e790746SPaolo Bonzini     }
7496e790746SPaolo Bonzini 
7506e790746SPaolo Bonzini     return tap_disable(nc->peer);
7516e790746SPaolo Bonzini }
7526e790746SPaolo Bonzini 
753441537f1SJason Wang static void virtio_net_set_queue_pairs(VirtIONet *n)
7546e790746SPaolo Bonzini {
7556e790746SPaolo Bonzini     int i;
756ddfa83eaSJoel Stanley     int r;
7576e790746SPaolo Bonzini 
75868b5f314SYuri Benditovich     if (n->nic->peer_deleted) {
75968b5f314SYuri Benditovich         return;
76068b5f314SYuri Benditovich     }
76168b5f314SYuri Benditovich 
762441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
763441537f1SJason Wang         if (i < n->curr_queue_pairs) {
764ddfa83eaSJoel Stanley             r = peer_attach(n, i);
765ddfa83eaSJoel Stanley             assert(!r);
7666e790746SPaolo Bonzini         } else {
767ddfa83eaSJoel Stanley             r = peer_detach(n, i);
768ddfa83eaSJoel Stanley             assert(!r);
7696e790746SPaolo Bonzini         }
7706e790746SPaolo Bonzini     }
7716e790746SPaolo Bonzini }
7726e790746SPaolo Bonzini 
773ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
7746e790746SPaolo Bonzini 
7759d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features,
7769d5b731dSJason Wang                                         Error **errp)
7776e790746SPaolo Bonzini {
77817a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
7796e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
7806e790746SPaolo Bonzini 
781da3e8a23SShannon Zhao     /* Firstly sync all virtio-net possible supported features */
782da3e8a23SShannon Zhao     features |= n->host_features;
783da3e8a23SShannon Zhao 
7840cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7856e790746SPaolo Bonzini 
7866e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n)) {
7870cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_CSUM);
7880cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7890cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7900cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN);
7916e790746SPaolo Bonzini 
7920cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM);
7930cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4);
7940cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6);
7950cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN);
796e22f0603SYuri Benditovich 
797e22f0603SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
7986e790746SPaolo Bonzini     }
7996e790746SPaolo Bonzini 
8006e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
8010cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO);
8020cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO);
8036e790746SPaolo Bonzini     }
8046e790746SPaolo Bonzini 
805ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
80693a97dc5SXuan Zhuo         virtio_add_feature(&features, VIRTIO_F_RING_RESET);
8076e790746SPaolo Bonzini         return features;
8086e790746SPaolo Bonzini     }
8092974e916SYuri Benditovich 
8100145c393SAndrew Melnychenko     if (!ebpf_rss_is_loaded(&n->ebpf_rss)) {
81159079029SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_RSS);
8120145c393SAndrew Melnychenko     }
81375ebec11SMaxime Coquelin     features = vhost_net_get_features(get_vhost_net(nc->peer), features);
81475ebec11SMaxime Coquelin     vdev->backend_features = features;
81575ebec11SMaxime Coquelin 
81675ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
81775ebec11SMaxime Coquelin             (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) {
81875ebec11SMaxime Coquelin         features |= (1ULL << VIRTIO_NET_F_MTU);
81975ebec11SMaxime Coquelin     }
82075ebec11SMaxime Coquelin 
82175ebec11SMaxime Coquelin     return features;
8226e790746SPaolo Bonzini }
8236e790746SPaolo Bonzini 
824019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev)
8256e790746SPaolo Bonzini {
826019a3edbSGerd Hoffmann     uint64_t features = 0;
8276e790746SPaolo Bonzini 
8286e790746SPaolo Bonzini     /* Linux kernel 2.6.25.  It understood MAC (as everyone must),
8296e790746SPaolo Bonzini      * but also these: */
8300cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
8310cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_CSUM);
8320cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4);
8330cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6);
8340cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN);
8356e790746SPaolo Bonzini 
8366e790746SPaolo Bonzini     return features;
8376e790746SPaolo Bonzini }
8386e790746SPaolo Bonzini 
839644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n)
840644c9858SDmitry Fleytman {
841ad37bb3bSStefan Hajnoczi     qemu_set_offload(qemu_get_queue(n->nic)->peer,
842644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
843644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
844644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
845644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
846644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
847644c9858SDmitry Fleytman }
848644c9858SDmitry Fleytman 
849644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
850644c9858SDmitry Fleytman {
851644c9858SDmitry Fleytman     static const uint64_t guest_offloads_mask =
852644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
853644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
854644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
855644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_ECN)  |
856644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_UFO);
857644c9858SDmitry Fleytman 
858644c9858SDmitry Fleytman     return guest_offloads_mask & features;
859644c9858SDmitry Fleytman }
860644c9858SDmitry Fleytman 
861644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
862644c9858SDmitry Fleytman {
863644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
864644c9858SDmitry Fleytman     return virtio_net_guest_offloads_by_features(vdev->guest_features);
865644c9858SDmitry Fleytman }
866644c9858SDmitry Fleytman 
867f5e1847bSJuan Quintela typedef struct {
868f5e1847bSJuan Quintela     VirtIONet *n;
86912b2fad7SKevin Wolf     DeviceState *dev;
87012b2fad7SKevin Wolf } FailoverDevice;
871f5e1847bSJuan Quintela 
872f5e1847bSJuan Quintela /**
87312b2fad7SKevin Wolf  * Set the failover primary device
874f5e1847bSJuan Quintela  *
875f5e1847bSJuan Quintela  * @opaque: FailoverId to setup
876f5e1847bSJuan Quintela  * @opts: opts for device we are handling
877f5e1847bSJuan Quintela  * @errp: returns an error if this function fails
878f5e1847bSJuan Quintela  */
87912b2fad7SKevin Wolf static int failover_set_primary(DeviceState *dev, void *opaque)
880f5e1847bSJuan Quintela {
88112b2fad7SKevin Wolf     FailoverDevice *fdev = opaque;
88212b2fad7SKevin Wolf     PCIDevice *pci_dev = (PCIDevice *)
88312b2fad7SKevin Wolf         object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE);
884f5e1847bSJuan Quintela 
88512b2fad7SKevin Wolf     if (!pci_dev) {
88612b2fad7SKevin Wolf         return 0;
88712b2fad7SKevin Wolf     }
88812b2fad7SKevin Wolf 
88912b2fad7SKevin Wolf     if (!g_strcmp0(pci_dev->failover_pair_id, fdev->n->netclient_name)) {
89012b2fad7SKevin Wolf         fdev->dev = dev;
891f5e1847bSJuan Quintela         return 1;
892f5e1847bSJuan Quintela     }
893f5e1847bSJuan Quintela 
894f5e1847bSJuan Quintela     return 0;
895f5e1847bSJuan Quintela }
896f5e1847bSJuan Quintela 
897f5e1847bSJuan Quintela /**
89885d3b931SJuan Quintela  * Find the primary device for this failover virtio-net
89985d3b931SJuan Quintela  *
90085d3b931SJuan Quintela  * @n: VirtIONet device
90185d3b931SJuan Quintela  * @errp: returns an error if this function fails
90285d3b931SJuan Quintela  */
9030a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n)
9049711cd0dSJens Freimann {
90512b2fad7SKevin Wolf     FailoverDevice fdev = {
90612b2fad7SKevin Wolf         .n = n,
90712b2fad7SKevin Wolf     };
9089711cd0dSJens Freimann 
90912b2fad7SKevin Wolf     qbus_walk_children(sysbus_get_default(), failover_set_primary, NULL,
91012b2fad7SKevin Wolf                        NULL, NULL, &fdev);
91112b2fad7SKevin Wolf     return fdev.dev;
9129711cd0dSJens Freimann }
9139711cd0dSJens Freimann 
91421e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp)
91521e8709bSJuan Quintela {
91621e8709bSJuan Quintela     Error *err = NULL;
91721e8709bSJuan Quintela     DeviceState *dev = failover_find_primary_device(n);
91821e8709bSJuan Quintela 
91921e8709bSJuan Quintela     if (dev) {
92021e8709bSJuan Quintela         return;
92121e8709bSJuan Quintela     }
92221e8709bSJuan Quintela 
923259a10dbSKevin Wolf     if (!n->primary_opts) {
92497ca9c59SLaurent Vivier         error_setg(errp, "Primary device not found");
92597ca9c59SLaurent Vivier         error_append_hint(errp, "Virtio-net failover will not work. Make "
92697ca9c59SLaurent Vivier                           "sure primary device has parameter"
92797ca9c59SLaurent Vivier                           " failover_pair_id=%s\n", n->netclient_name);
92821e8709bSJuan Quintela         return;
92921e8709bSJuan Quintela     }
930259a10dbSKevin Wolf 
931f3558b1bSKevin Wolf     dev = qdev_device_add_from_qdict(n->primary_opts,
932f3558b1bSKevin Wolf                                      n->primary_opts_from_json,
933f3558b1bSKevin Wolf                                      &err);
93421e8709bSJuan Quintela     if (err) {
935f3558b1bSKevin Wolf         qobject_unref(n->primary_opts);
936259a10dbSKevin Wolf         n->primary_opts = NULL;
93700e7b129SLaurent Vivier     } else {
93800e7b129SLaurent Vivier         object_unref(OBJECT(dev));
93921e8709bSJuan Quintela     }
94021e8709bSJuan Quintela     error_propagate(errp, err);
94121e8709bSJuan Quintela }
94221e8709bSJuan Quintela 
943d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features)
9446e790746SPaolo Bonzini {
94517a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
9469711cd0dSJens Freimann     Error *err = NULL;
9476e790746SPaolo Bonzini     int i;
9486e790746SPaolo Bonzini 
94975ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
95075ebec11SMaxime Coquelin             !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) {
95175ebec11SMaxime Coquelin         features &= ~(1ULL << VIRTIO_NET_F_MTU);
95275ebec11SMaxime Coquelin     }
95375ebec11SMaxime Coquelin 
954ef546f12SCornelia Huck     virtio_net_set_multiqueue(n,
95559079029SYuri Benditovich                               virtio_has_feature(features, VIRTIO_NET_F_RSS) ||
95695129d6fSCornelia Huck                               virtio_has_feature(features, VIRTIO_NET_F_MQ));
9576e790746SPaolo Bonzini 
958ef546f12SCornelia Huck     virtio_net_set_mrg_rx_bufs(n,
95995129d6fSCornelia Huck                                virtio_has_feature(features,
960bb9d17f8SCornelia Huck                                                   VIRTIO_NET_F_MRG_RXBUF),
96195129d6fSCornelia Huck                                virtio_has_feature(features,
962e22f0603SYuri Benditovich                                                   VIRTIO_F_VERSION_1),
963e22f0603SYuri Benditovich                                virtio_has_feature(features,
964e22f0603SYuri Benditovich                                                   VIRTIO_NET_F_HASH_REPORT));
9656e790746SPaolo Bonzini 
9662974e916SYuri Benditovich     n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9672974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4);
9682974e916SYuri Benditovich     n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9692974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6);
970e22f0603SYuri Benditovich     n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS);
9712974e916SYuri Benditovich 
9726e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
973644c9858SDmitry Fleytman         n->curr_guest_offloads =
974644c9858SDmitry Fleytman             virtio_net_guest_offloads_by_features(features);
975644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
9766e790746SPaolo Bonzini     }
9776e790746SPaolo Bonzini 
978441537f1SJason Wang     for (i = 0;  i < n->max_queue_pairs; i++) {
9796e790746SPaolo Bonzini         NetClientState *nc = qemu_get_subqueue(n->nic, i);
9806e790746SPaolo Bonzini 
981ed8b4afeSNikolay Nikolaev         if (!get_vhost_net(nc->peer)) {
9826e790746SPaolo Bonzini             continue;
9836e790746SPaolo Bonzini         }
984ed8b4afeSNikolay Nikolaev         vhost_net_ack_features(get_vhost_net(nc->peer), features);
9856e790746SPaolo Bonzini     }
9860b1eaa88SStefan Fritsch 
98795129d6fSCornelia Huck     if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) {
9880b1eaa88SStefan Fritsch         memset(n->vlans, 0, MAX_VLAN >> 3);
9890b1eaa88SStefan Fritsch     } else {
9900b1eaa88SStefan Fritsch         memset(n->vlans, 0xff, MAX_VLAN >> 3);
9910b1eaa88SStefan Fritsch     }
9929711cd0dSJens Freimann 
9939711cd0dSJens Freimann     if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) {
9949711cd0dSJens Freimann         qapi_event_send_failover_negotiated(n->netclient_name);
995e2bde83eSJuan Quintela         qatomic_set(&n->failover_primary_hidden, false);
9969711cd0dSJens Freimann         failover_add_primary(n, &err);
9979711cd0dSJens Freimann         if (err) {
9981b529d90SLaurent Vivier             if (!qtest_enabled()) {
9999711cd0dSJens Freimann                 warn_report_err(err);
10001b529d90SLaurent Vivier             } else {
10011b529d90SLaurent Vivier                 error_free(err);
10021b529d90SLaurent Vivier             }
10039711cd0dSJens Freimann         }
10046e790746SPaolo Bonzini     }
100521e8709bSJuan Quintela }
10066e790746SPaolo Bonzini 
10076e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
10086e790746SPaolo Bonzini                                      struct iovec *iov, unsigned int iov_cnt)
10096e790746SPaolo Bonzini {
10106e790746SPaolo Bonzini     uint8_t on;
10116e790746SPaolo Bonzini     size_t s;
1012b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
10136e790746SPaolo Bonzini 
10146e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
10156e790746SPaolo Bonzini     if (s != sizeof(on)) {
10166e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
10176e790746SPaolo Bonzini     }
10186e790746SPaolo Bonzini 
10196e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
10206e790746SPaolo Bonzini         n->promisc = on;
10216e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
10226e790746SPaolo Bonzini         n->allmulti = on;
10236e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
10246e790746SPaolo Bonzini         n->alluni = on;
10256e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
10266e790746SPaolo Bonzini         n->nomulti = on;
10276e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
10286e790746SPaolo Bonzini         n->nouni = on;
10296e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
10306e790746SPaolo Bonzini         n->nobcast = on;
10316e790746SPaolo Bonzini     } else {
10326e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
10336e790746SPaolo Bonzini     }
10346e790746SPaolo Bonzini 
1035b1be4280SAmos Kong     rxfilter_notify(nc);
1036b1be4280SAmos Kong 
10376e790746SPaolo Bonzini     return VIRTIO_NET_OK;
10386e790746SPaolo Bonzini }
10396e790746SPaolo Bonzini 
1040644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
1041644c9858SDmitry Fleytman                                      struct iovec *iov, unsigned int iov_cnt)
1042644c9858SDmitry Fleytman {
1043644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1044644c9858SDmitry Fleytman     uint64_t offloads;
1045644c9858SDmitry Fleytman     size_t s;
1046644c9858SDmitry Fleytman 
104795129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
1048644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1049644c9858SDmitry Fleytman     }
1050644c9858SDmitry Fleytman 
1051644c9858SDmitry Fleytman     s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
1052644c9858SDmitry Fleytman     if (s != sizeof(offloads)) {
1053644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1054644c9858SDmitry Fleytman     }
1055644c9858SDmitry Fleytman 
1056644c9858SDmitry Fleytman     if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
1057644c9858SDmitry Fleytman         uint64_t supported_offloads;
1058644c9858SDmitry Fleytman 
1059189ae6bbSJason Wang         offloads = virtio_ldq_p(vdev, &offloads);
1060189ae6bbSJason Wang 
1061644c9858SDmitry Fleytman         if (!n->has_vnet_hdr) {
1062644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1063644c9858SDmitry Fleytman         }
1064644c9858SDmitry Fleytman 
10652974e916SYuri Benditovich         n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10662974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4);
10672974e916SYuri Benditovich         n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10682974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6);
10692974e916SYuri Benditovich         virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT);
10702974e916SYuri Benditovich 
1071644c9858SDmitry Fleytman         supported_offloads = virtio_net_supported_guest_offloads(n);
1072644c9858SDmitry Fleytman         if (offloads & ~supported_offloads) {
1073644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1074644c9858SDmitry Fleytman         }
1075644c9858SDmitry Fleytman 
1076644c9858SDmitry Fleytman         n->curr_guest_offloads = offloads;
1077644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
1078644c9858SDmitry Fleytman 
1079644c9858SDmitry Fleytman         return VIRTIO_NET_OK;
1080644c9858SDmitry Fleytman     } else {
1081644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1082644c9858SDmitry Fleytman     }
1083644c9858SDmitry Fleytman }
1084644c9858SDmitry Fleytman 
10856e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
10866e790746SPaolo Bonzini                                  struct iovec *iov, unsigned int iov_cnt)
10876e790746SPaolo Bonzini {
10881399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
10896e790746SPaolo Bonzini     struct virtio_net_ctrl_mac mac_data;
10906e790746SPaolo Bonzini     size_t s;
1091b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
10926e790746SPaolo Bonzini 
10936e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
10946e790746SPaolo Bonzini         if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
10956e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
10966e790746SPaolo Bonzini         }
10976e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
10986e790746SPaolo Bonzini         assert(s == sizeof(n->mac));
10996e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1100b1be4280SAmos Kong         rxfilter_notify(nc);
1101b1be4280SAmos Kong 
11026e790746SPaolo Bonzini         return VIRTIO_NET_OK;
11036e790746SPaolo Bonzini     }
11046e790746SPaolo Bonzini 
11056e790746SPaolo Bonzini     if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
11066e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11076e790746SPaolo Bonzini     }
11086e790746SPaolo Bonzini 
1109cae2e556SAmos Kong     int in_use = 0;
1110cae2e556SAmos Kong     int first_multi = 0;
1111cae2e556SAmos Kong     uint8_t uni_overflow = 0;
1112cae2e556SAmos Kong     uint8_t multi_overflow = 0;
1113cae2e556SAmos Kong     uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
11146e790746SPaolo Bonzini 
11156e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
11166e790746SPaolo Bonzini                    sizeof(mac_data.entries));
11171399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
11186e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1119b1be4280SAmos Kong         goto error;
11206e790746SPaolo Bonzini     }
11216e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
11226e790746SPaolo Bonzini 
11236e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
1124b1be4280SAmos Kong         goto error;
11256e790746SPaolo Bonzini     }
11266e790746SPaolo Bonzini 
11276e790746SPaolo Bonzini     if (mac_data.entries <= MAC_TABLE_ENTRIES) {
1128cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, macs,
11296e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
11306e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1131b1be4280SAmos Kong             goto error;
11326e790746SPaolo Bonzini         }
1133cae2e556SAmos Kong         in_use += mac_data.entries;
11346e790746SPaolo Bonzini     } else {
1135cae2e556SAmos Kong         uni_overflow = 1;
11366e790746SPaolo Bonzini     }
11376e790746SPaolo Bonzini 
11386e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
11396e790746SPaolo Bonzini 
1140cae2e556SAmos Kong     first_multi = in_use;
11416e790746SPaolo Bonzini 
11426e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
11436e790746SPaolo Bonzini                    sizeof(mac_data.entries));
11441399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
11456e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1146b1be4280SAmos Kong         goto error;
11476e790746SPaolo Bonzini     }
11486e790746SPaolo Bonzini 
11496e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
11506e790746SPaolo Bonzini 
11516e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
1152b1be4280SAmos Kong         goto error;
11536e790746SPaolo Bonzini     }
11546e790746SPaolo Bonzini 
1155edc24385SMichael S. Tsirkin     if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
1156cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
11576e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
11586e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1159b1be4280SAmos Kong             goto error;
11606e790746SPaolo Bonzini         }
1161cae2e556SAmos Kong         in_use += mac_data.entries;
11626e790746SPaolo Bonzini     } else {
1163cae2e556SAmos Kong         multi_overflow = 1;
11646e790746SPaolo Bonzini     }
11656e790746SPaolo Bonzini 
1166cae2e556SAmos Kong     n->mac_table.in_use = in_use;
1167cae2e556SAmos Kong     n->mac_table.first_multi = first_multi;
1168cae2e556SAmos Kong     n->mac_table.uni_overflow = uni_overflow;
1169cae2e556SAmos Kong     n->mac_table.multi_overflow = multi_overflow;
1170cae2e556SAmos Kong     memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
1171cae2e556SAmos Kong     g_free(macs);
1172b1be4280SAmos Kong     rxfilter_notify(nc);
1173b1be4280SAmos Kong 
11746e790746SPaolo Bonzini     return VIRTIO_NET_OK;
1175b1be4280SAmos Kong 
1176b1be4280SAmos Kong error:
1177cae2e556SAmos Kong     g_free(macs);
1178b1be4280SAmos Kong     return VIRTIO_NET_ERR;
11796e790746SPaolo Bonzini }
11806e790746SPaolo Bonzini 
11816e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
11826e790746SPaolo Bonzini                                         struct iovec *iov, unsigned int iov_cnt)
11836e790746SPaolo Bonzini {
11841399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
11856e790746SPaolo Bonzini     uint16_t vid;
11866e790746SPaolo Bonzini     size_t s;
1187b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
11886e790746SPaolo Bonzini 
11896e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
11901399c60dSRusty Russell     vid = virtio_lduw_p(vdev, &vid);
11916e790746SPaolo Bonzini     if (s != sizeof(vid)) {
11926e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11936e790746SPaolo Bonzini     }
11946e790746SPaolo Bonzini 
11956e790746SPaolo Bonzini     if (vid >= MAX_VLAN)
11966e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11976e790746SPaolo Bonzini 
11986e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
11996e790746SPaolo Bonzini         n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
12006e790746SPaolo Bonzini     else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
12016e790746SPaolo Bonzini         n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
12026e790746SPaolo Bonzini     else
12036e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
12046e790746SPaolo Bonzini 
1205b1be4280SAmos Kong     rxfilter_notify(nc);
1206b1be4280SAmos Kong 
12076e790746SPaolo Bonzini     return VIRTIO_NET_OK;
12086e790746SPaolo Bonzini }
12096e790746SPaolo Bonzini 
1210f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd,
1211f57fcf70SJason Wang                                       struct iovec *iov, unsigned int iov_cnt)
1212f57fcf70SJason Wang {
12139d8c6a25SDr. David Alan Gilbert     trace_virtio_net_handle_announce(n->announce_timer.round);
1214f57fcf70SJason Wang     if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK &&
1215f57fcf70SJason Wang         n->status & VIRTIO_NET_S_ANNOUNCE) {
1216f57fcf70SJason Wang         n->status &= ~VIRTIO_NET_S_ANNOUNCE;
12179d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
12189d8c6a25SDr. David Alan Gilbert             qemu_announce_timer_step(&n->announce_timer);
1219f57fcf70SJason Wang         }
1220f57fcf70SJason Wang         return VIRTIO_NET_OK;
1221f57fcf70SJason Wang     } else {
1222f57fcf70SJason Wang         return VIRTIO_NET_ERR;
1223f57fcf70SJason Wang     }
1224f57fcf70SJason Wang }
1225f57fcf70SJason Wang 
12260145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n);
12270145c393SAndrew Melnychenko 
122859079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n)
122959079029SYuri Benditovich {
123059079029SYuri Benditovich     if (n->rss_data.enabled) {
123159079029SYuri Benditovich         trace_virtio_net_rss_disable();
123259079029SYuri Benditovich     }
123359079029SYuri Benditovich     n->rss_data.enabled = false;
12340145c393SAndrew Melnychenko 
12350145c393SAndrew Melnychenko     virtio_net_detach_epbf_rss(n);
12360145c393SAndrew Melnychenko }
12370145c393SAndrew Melnychenko 
12380145c393SAndrew Melnychenko static bool virtio_net_attach_ebpf_to_backend(NICState *nic, int prog_fd)
12390145c393SAndrew Melnychenko {
12400145c393SAndrew Melnychenko     NetClientState *nc = qemu_get_peer(qemu_get_queue(nic), 0);
12410145c393SAndrew Melnychenko     if (nc == NULL || nc->info->set_steering_ebpf == NULL) {
12420145c393SAndrew Melnychenko         return false;
12430145c393SAndrew Melnychenko     }
12440145c393SAndrew Melnychenko 
12450145c393SAndrew Melnychenko     return nc->info->set_steering_ebpf(nc, prog_fd);
12460145c393SAndrew Melnychenko }
12470145c393SAndrew Melnychenko 
12480145c393SAndrew Melnychenko static void rss_data_to_rss_config(struct VirtioNetRssData *data,
12490145c393SAndrew Melnychenko                                    struct EBPFRSSConfig *config)
12500145c393SAndrew Melnychenko {
12510145c393SAndrew Melnychenko     config->redirect = data->redirect;
12520145c393SAndrew Melnychenko     config->populate_hash = data->populate_hash;
12530145c393SAndrew Melnychenko     config->hash_types = data->hash_types;
12540145c393SAndrew Melnychenko     config->indirections_len = data->indirections_len;
12550145c393SAndrew Melnychenko     config->default_queue = data->default_queue;
12560145c393SAndrew Melnychenko }
12570145c393SAndrew Melnychenko 
12580145c393SAndrew Melnychenko static bool virtio_net_attach_epbf_rss(VirtIONet *n)
12590145c393SAndrew Melnychenko {
12600145c393SAndrew Melnychenko     struct EBPFRSSConfig config = {};
12610145c393SAndrew Melnychenko 
12620145c393SAndrew Melnychenko     if (!ebpf_rss_is_loaded(&n->ebpf_rss)) {
12630145c393SAndrew Melnychenko         return false;
12640145c393SAndrew Melnychenko     }
12650145c393SAndrew Melnychenko 
12660145c393SAndrew Melnychenko     rss_data_to_rss_config(&n->rss_data, &config);
12670145c393SAndrew Melnychenko 
12680145c393SAndrew Melnychenko     if (!ebpf_rss_set_all(&n->ebpf_rss, &config,
12690145c393SAndrew Melnychenko                           n->rss_data.indirections_table, n->rss_data.key)) {
12700145c393SAndrew Melnychenko         return false;
12710145c393SAndrew Melnychenko     }
12720145c393SAndrew Melnychenko 
12730145c393SAndrew Melnychenko     if (!virtio_net_attach_ebpf_to_backend(n->nic, n->ebpf_rss.program_fd)) {
12740145c393SAndrew Melnychenko         return false;
12750145c393SAndrew Melnychenko     }
12760145c393SAndrew Melnychenko 
12770145c393SAndrew Melnychenko     return true;
12780145c393SAndrew Melnychenko }
12790145c393SAndrew Melnychenko 
12800145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n)
12810145c393SAndrew Melnychenko {
12820145c393SAndrew Melnychenko     virtio_net_attach_ebpf_to_backend(n->nic, -1);
12830145c393SAndrew Melnychenko }
12840145c393SAndrew Melnychenko 
12850145c393SAndrew Melnychenko static bool virtio_net_load_ebpf(VirtIONet *n)
12860145c393SAndrew Melnychenko {
12870145c393SAndrew Melnychenko     if (!virtio_net_attach_ebpf_to_backend(n->nic, -1)) {
12880145c393SAndrew Melnychenko         /* backend does't support steering ebpf */
12890145c393SAndrew Melnychenko         return false;
12900145c393SAndrew Melnychenko     }
12910145c393SAndrew Melnychenko 
12920145c393SAndrew Melnychenko     return ebpf_rss_load(&n->ebpf_rss);
12930145c393SAndrew Melnychenko }
12940145c393SAndrew Melnychenko 
12950145c393SAndrew Melnychenko static void virtio_net_unload_ebpf(VirtIONet *n)
12960145c393SAndrew Melnychenko {
12970145c393SAndrew Melnychenko     virtio_net_attach_ebpf_to_backend(n->nic, -1);
12980145c393SAndrew Melnychenko     ebpf_rss_unload(&n->ebpf_rss);
129959079029SYuri Benditovich }
130059079029SYuri Benditovich 
130159079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n,
1302e22f0603SYuri Benditovich                                       struct iovec *iov,
1303e22f0603SYuri Benditovich                                       unsigned int iov_cnt,
1304e22f0603SYuri Benditovich                                       bool do_rss)
130559079029SYuri Benditovich {
130659079029SYuri Benditovich     VirtIODevice *vdev = VIRTIO_DEVICE(n);
130759079029SYuri Benditovich     struct virtio_net_rss_config cfg;
130859079029SYuri Benditovich     size_t s, offset = 0, size_get;
1309441537f1SJason Wang     uint16_t queue_pairs, i;
131059079029SYuri Benditovich     struct {
131159079029SYuri Benditovich         uint16_t us;
131259079029SYuri Benditovich         uint8_t b;
131359079029SYuri Benditovich     } QEMU_PACKED temp;
131459079029SYuri Benditovich     const char *err_msg = "";
131559079029SYuri Benditovich     uint32_t err_value = 0;
131659079029SYuri Benditovich 
1317e22f0603SYuri Benditovich     if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) {
131859079029SYuri Benditovich         err_msg = "RSS is not negotiated";
131959079029SYuri Benditovich         goto error;
132059079029SYuri Benditovich     }
1321e22f0603SYuri Benditovich     if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) {
1322e22f0603SYuri Benditovich         err_msg = "Hash report is not negotiated";
1323e22f0603SYuri Benditovich         goto error;
1324e22f0603SYuri Benditovich     }
132559079029SYuri Benditovich     size_get = offsetof(struct virtio_net_rss_config, indirection_table);
132659079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get);
132759079029SYuri Benditovich     if (s != size_get) {
132859079029SYuri Benditovich         err_msg = "Short command buffer";
132959079029SYuri Benditovich         err_value = (uint32_t)s;
133059079029SYuri Benditovich         goto error;
133159079029SYuri Benditovich     }
133259079029SYuri Benditovich     n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types);
133359079029SYuri Benditovich     n->rss_data.indirections_len =
133459079029SYuri Benditovich         virtio_lduw_p(vdev, &cfg.indirection_table_mask);
133559079029SYuri Benditovich     n->rss_data.indirections_len++;
1336e22f0603SYuri Benditovich     if (!do_rss) {
1337e22f0603SYuri Benditovich         n->rss_data.indirections_len = 1;
1338e22f0603SYuri Benditovich     }
133959079029SYuri Benditovich     if (!is_power_of_2(n->rss_data.indirections_len)) {
134059079029SYuri Benditovich         err_msg = "Invalid size of indirection table";
134159079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
134259079029SYuri Benditovich         goto error;
134359079029SYuri Benditovich     }
134459079029SYuri Benditovich     if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) {
134559079029SYuri Benditovich         err_msg = "Too large indirection table";
134659079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
134759079029SYuri Benditovich         goto error;
134859079029SYuri Benditovich     }
1349e22f0603SYuri Benditovich     n->rss_data.default_queue = do_rss ?
1350e22f0603SYuri Benditovich         virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0;
1351441537f1SJason Wang     if (n->rss_data.default_queue >= n->max_queue_pairs) {
135259079029SYuri Benditovich         err_msg = "Invalid default queue";
135359079029SYuri Benditovich         err_value = n->rss_data.default_queue;
135459079029SYuri Benditovich         goto error;
135559079029SYuri Benditovich     }
135659079029SYuri Benditovich     offset += size_get;
135759079029SYuri Benditovich     size_get = sizeof(uint16_t) * n->rss_data.indirections_len;
135859079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
135959079029SYuri Benditovich     n->rss_data.indirections_table = g_malloc(size_get);
136059079029SYuri Benditovich     if (!n->rss_data.indirections_table) {
136159079029SYuri Benditovich         err_msg = "Can't allocate indirections table";
136259079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
136359079029SYuri Benditovich         goto error;
136459079029SYuri Benditovich     }
136559079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset,
136659079029SYuri Benditovich                    n->rss_data.indirections_table, size_get);
136759079029SYuri Benditovich     if (s != size_get) {
136859079029SYuri Benditovich         err_msg = "Short indirection table buffer";
136959079029SYuri Benditovich         err_value = (uint32_t)s;
137059079029SYuri Benditovich         goto error;
137159079029SYuri Benditovich     }
137259079029SYuri Benditovich     for (i = 0; i < n->rss_data.indirections_len; ++i) {
137359079029SYuri Benditovich         uint16_t val = n->rss_data.indirections_table[i];
137459079029SYuri Benditovich         n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val);
137559079029SYuri Benditovich     }
137659079029SYuri Benditovich     offset += size_get;
137759079029SYuri Benditovich     size_get = sizeof(temp);
137859079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get);
137959079029SYuri Benditovich     if (s != size_get) {
1380441537f1SJason Wang         err_msg = "Can't get queue_pairs";
138159079029SYuri Benditovich         err_value = (uint32_t)s;
138259079029SYuri Benditovich         goto error;
138359079029SYuri Benditovich     }
1384441537f1SJason Wang     queue_pairs = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queue_pairs;
1385441537f1SJason Wang     if (queue_pairs == 0 || queue_pairs > n->max_queue_pairs) {
1386441537f1SJason Wang         err_msg = "Invalid number of queue_pairs";
1387441537f1SJason Wang         err_value = queue_pairs;
138859079029SYuri Benditovich         goto error;
138959079029SYuri Benditovich     }
139059079029SYuri Benditovich     if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) {
139159079029SYuri Benditovich         err_msg = "Invalid key size";
139259079029SYuri Benditovich         err_value = temp.b;
139359079029SYuri Benditovich         goto error;
139459079029SYuri Benditovich     }
139559079029SYuri Benditovich     if (!temp.b && n->rss_data.hash_types) {
139659079029SYuri Benditovich         err_msg = "No key provided";
139759079029SYuri Benditovich         err_value = 0;
139859079029SYuri Benditovich         goto error;
139959079029SYuri Benditovich     }
140059079029SYuri Benditovich     if (!temp.b && !n->rss_data.hash_types) {
140159079029SYuri Benditovich         virtio_net_disable_rss(n);
1402441537f1SJason Wang         return queue_pairs;
140359079029SYuri Benditovich     }
140459079029SYuri Benditovich     offset += size_get;
140559079029SYuri Benditovich     size_get = temp.b;
140659079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get);
140759079029SYuri Benditovich     if (s != size_get) {
140859079029SYuri Benditovich         err_msg = "Can get key buffer";
140959079029SYuri Benditovich         err_value = (uint32_t)s;
141059079029SYuri Benditovich         goto error;
141159079029SYuri Benditovich     }
141259079029SYuri Benditovich     n->rss_data.enabled = true;
14130145c393SAndrew Melnychenko 
14140145c393SAndrew Melnychenko     if (!n->rss_data.populate_hash) {
14150145c393SAndrew Melnychenko         if (!virtio_net_attach_epbf_rss(n)) {
14160145c393SAndrew Melnychenko             /* EBPF must be loaded for vhost */
14170145c393SAndrew Melnychenko             if (get_vhost_net(qemu_get_queue(n->nic)->peer)) {
14180145c393SAndrew Melnychenko                 warn_report("Can't load eBPF RSS for vhost");
14190145c393SAndrew Melnychenko                 goto error;
14200145c393SAndrew Melnychenko             }
14210145c393SAndrew Melnychenko             /* fallback to software RSS */
14220145c393SAndrew Melnychenko             warn_report("Can't load eBPF RSS - fallback to software RSS");
14230145c393SAndrew Melnychenko             n->rss_data.enabled_software_rss = true;
14240145c393SAndrew Melnychenko         }
14250145c393SAndrew Melnychenko     } else {
14260145c393SAndrew Melnychenko         /* use software RSS for hash populating */
14270145c393SAndrew Melnychenko         /* and detach eBPF if was loaded before */
14280145c393SAndrew Melnychenko         virtio_net_detach_epbf_rss(n);
14290145c393SAndrew Melnychenko         n->rss_data.enabled_software_rss = true;
14300145c393SAndrew Melnychenko     }
14310145c393SAndrew Melnychenko 
143259079029SYuri Benditovich     trace_virtio_net_rss_enable(n->rss_data.hash_types,
143359079029SYuri Benditovich                                 n->rss_data.indirections_len,
143459079029SYuri Benditovich                                 temp.b);
1435441537f1SJason Wang     return queue_pairs;
143659079029SYuri Benditovich error:
143759079029SYuri Benditovich     trace_virtio_net_rss_error(err_msg, err_value);
143859079029SYuri Benditovich     virtio_net_disable_rss(n);
143959079029SYuri Benditovich     return 0;
144059079029SYuri Benditovich }
144159079029SYuri Benditovich 
14426e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
14436e790746SPaolo Bonzini                                 struct iovec *iov, unsigned int iov_cnt)
14446e790746SPaolo Bonzini {
144517a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1446441537f1SJason Wang     uint16_t queue_pairs;
14472a7888ccSSi-Wei Liu     NetClientState *nc = qemu_get_queue(n->nic);
14486e790746SPaolo Bonzini 
144959079029SYuri Benditovich     virtio_net_disable_rss(n);
1450e22f0603SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) {
1451441537f1SJason Wang         queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, false);
1452441537f1SJason Wang         return queue_pairs ? VIRTIO_NET_OK : VIRTIO_NET_ERR;
1453e22f0603SYuri Benditovich     }
145459079029SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) {
1455441537f1SJason Wang         queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, true);
145659079029SYuri Benditovich     } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
145759079029SYuri Benditovich         struct virtio_net_ctrl_mq mq;
145859079029SYuri Benditovich         size_t s;
145959079029SYuri Benditovich         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) {
146059079029SYuri Benditovich             return VIRTIO_NET_ERR;
146159079029SYuri Benditovich         }
14626e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
14636e790746SPaolo Bonzini         if (s != sizeof(mq)) {
14646e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
14656e790746SPaolo Bonzini         }
1466441537f1SJason Wang         queue_pairs = virtio_lduw_p(vdev, &mq.virtqueue_pairs);
14676e790746SPaolo Bonzini 
146859079029SYuri Benditovich     } else {
14696e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
14706e790746SPaolo Bonzini     }
14716e790746SPaolo Bonzini 
1472441537f1SJason Wang     if (queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
1473441537f1SJason Wang         queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
1474441537f1SJason Wang         queue_pairs > n->max_queue_pairs ||
14756e790746SPaolo Bonzini         !n->multiqueue) {
14766e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
14776e790746SPaolo Bonzini     }
14786e790746SPaolo Bonzini 
1479441537f1SJason Wang     n->curr_queue_pairs = queue_pairs;
1480ca8717f9SEugenio Pérez     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
1481ca8717f9SEugenio Pérez         /*
1482ca8717f9SEugenio Pérez          * Avoid updating the backend for a vdpa device: We're only interested
1483ca8717f9SEugenio Pérez          * in updating the device model queues.
1484ca8717f9SEugenio Pérez          */
1485ca8717f9SEugenio Pérez         return VIRTIO_NET_OK;
1486ca8717f9SEugenio Pérez     }
1487441537f1SJason Wang     /* stop the backend before changing the number of queue_pairs to avoid handling a
14886e790746SPaolo Bonzini      * disabled queue */
148917a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
1490441537f1SJason Wang     virtio_net_set_queue_pairs(n);
14916e790746SPaolo Bonzini 
14926e790746SPaolo Bonzini     return VIRTIO_NET_OK;
14936e790746SPaolo Bonzini }
1494ba7eadb5SGreg Kurz 
1495640b8a1cSEugenio Pérez size_t virtio_net_handle_ctrl_iov(VirtIODevice *vdev,
1496640b8a1cSEugenio Pérez                                   const struct iovec *in_sg, unsigned in_num,
1497640b8a1cSEugenio Pérez                                   const struct iovec *out_sg,
1498640b8a1cSEugenio Pérez                                   unsigned out_num)
14996e790746SPaolo Bonzini {
150017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
15016e790746SPaolo Bonzini     struct virtio_net_ctrl_hdr ctrl;
15026e790746SPaolo Bonzini     virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
15036e790746SPaolo Bonzini     size_t s;
1504771b6ed3SJason Wang     struct iovec *iov, *iov2;
1505640b8a1cSEugenio Pérez 
1506640b8a1cSEugenio Pérez     if (iov_size(in_sg, in_num) < sizeof(status) ||
1507640b8a1cSEugenio Pérez         iov_size(out_sg, out_num) < sizeof(ctrl)) {
1508640b8a1cSEugenio Pérez         virtio_error(vdev, "virtio-net ctrl missing headers");
1509640b8a1cSEugenio Pérez         return 0;
1510640b8a1cSEugenio Pérez     }
1511640b8a1cSEugenio Pérez 
1512640b8a1cSEugenio Pérez     iov2 = iov = g_memdup2(out_sg, sizeof(struct iovec) * out_num);
1513640b8a1cSEugenio Pérez     s = iov_to_buf(iov, out_num, 0, &ctrl, sizeof(ctrl));
1514640b8a1cSEugenio Pérez     iov_discard_front(&iov, &out_num, sizeof(ctrl));
1515640b8a1cSEugenio Pérez     if (s != sizeof(ctrl)) {
1516640b8a1cSEugenio Pérez         status = VIRTIO_NET_ERR;
1517640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
1518640b8a1cSEugenio Pérez         status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, out_num);
1519640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
1520640b8a1cSEugenio Pérez         status = virtio_net_handle_mac(n, ctrl.cmd, iov, out_num);
1521640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
1522640b8a1cSEugenio Pérez         status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, out_num);
1523640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) {
1524640b8a1cSEugenio Pérez         status = virtio_net_handle_announce(n, ctrl.cmd, iov, out_num);
1525640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
1526640b8a1cSEugenio Pérez         status = virtio_net_handle_mq(n, ctrl.cmd, iov, out_num);
1527640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
1528640b8a1cSEugenio Pérez         status = virtio_net_handle_offloads(n, ctrl.cmd, iov, out_num);
1529640b8a1cSEugenio Pérez     }
1530640b8a1cSEugenio Pérez 
1531640b8a1cSEugenio Pérez     s = iov_from_buf(in_sg, in_num, 0, &status, sizeof(status));
1532640b8a1cSEugenio Pérez     assert(s == sizeof(status));
1533640b8a1cSEugenio Pérez 
1534640b8a1cSEugenio Pérez     g_free(iov2);
1535640b8a1cSEugenio Pérez     return sizeof(status);
1536640b8a1cSEugenio Pérez }
1537640b8a1cSEugenio Pérez 
1538640b8a1cSEugenio Pérez static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
1539640b8a1cSEugenio Pérez {
1540640b8a1cSEugenio Pérez     VirtQueueElement *elem;
15416e790746SPaolo Bonzini 
154251b19ebeSPaolo Bonzini     for (;;) {
1543640b8a1cSEugenio Pérez         size_t written;
154451b19ebeSPaolo Bonzini         elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
154551b19ebeSPaolo Bonzini         if (!elem) {
154651b19ebeSPaolo Bonzini             break;
154751b19ebeSPaolo Bonzini         }
1548640b8a1cSEugenio Pérez 
1549640b8a1cSEugenio Pérez         written = virtio_net_handle_ctrl_iov(vdev, elem->in_sg, elem->in_num,
1550640b8a1cSEugenio Pérez                                              elem->out_sg, elem->out_num);
1551640b8a1cSEugenio Pérez         if (written > 0) {
1552640b8a1cSEugenio Pérez             virtqueue_push(vq, elem, written);
1553640b8a1cSEugenio Pérez             virtio_notify(vdev, vq);
1554640b8a1cSEugenio Pérez             g_free(elem);
1555640b8a1cSEugenio Pérez         } else {
1556ba7eadb5SGreg Kurz             virtqueue_detach_element(vq, elem, 0);
1557ba7eadb5SGreg Kurz             g_free(elem);
1558ba7eadb5SGreg Kurz             break;
15596e790746SPaolo Bonzini         }
15606e790746SPaolo Bonzini     }
15616e790746SPaolo Bonzini }
15626e790746SPaolo Bonzini 
15636e790746SPaolo Bonzini /* RX */
15646e790746SPaolo Bonzini 
15656e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
15666e790746SPaolo Bonzini {
156717a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
15686e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(vq));
15696e790746SPaolo Bonzini 
15706e790746SPaolo Bonzini     qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
15716e790746SPaolo Bonzini }
15726e790746SPaolo Bonzini 
1573b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc)
15746e790746SPaolo Bonzini {
15756e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
157617a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
15776e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
15786e790746SPaolo Bonzini 
157917a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
1580b8c4b67eSPhilippe Mathieu-Daudé         return false;
15816e790746SPaolo Bonzini     }
15826e790746SPaolo Bonzini 
1583441537f1SJason Wang     if (nc->queue_index >= n->curr_queue_pairs) {
1584b8c4b67eSPhilippe Mathieu-Daudé         return false;
15856e790746SPaolo Bonzini     }
15866e790746SPaolo Bonzini 
15876e790746SPaolo Bonzini     if (!virtio_queue_ready(q->rx_vq) ||
158817a0ca55SKONRAD Frederic         !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
1589b8c4b67eSPhilippe Mathieu-Daudé         return false;
15906e790746SPaolo Bonzini     }
15916e790746SPaolo Bonzini 
1592b8c4b67eSPhilippe Mathieu-Daudé     return true;
15936e790746SPaolo Bonzini }
15946e790746SPaolo Bonzini 
15956e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
15966e790746SPaolo Bonzini {
15976e790746SPaolo Bonzini     VirtIONet *n = q->n;
15986e790746SPaolo Bonzini     if (virtio_queue_empty(q->rx_vq) ||
15996e790746SPaolo Bonzini         (n->mergeable_rx_bufs &&
16006e790746SPaolo Bonzini          !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
16016e790746SPaolo Bonzini         virtio_queue_set_notification(q->rx_vq, 1);
16026e790746SPaolo Bonzini 
16036e790746SPaolo Bonzini         /* To avoid a race condition where the guest has made some buffers
16046e790746SPaolo Bonzini          * available after the above check but before notification was
16056e790746SPaolo Bonzini          * enabled, check for available buffers again.
16066e790746SPaolo Bonzini          */
16076e790746SPaolo Bonzini         if (virtio_queue_empty(q->rx_vq) ||
16086e790746SPaolo Bonzini             (n->mergeable_rx_bufs &&
16096e790746SPaolo Bonzini              !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
16106e790746SPaolo Bonzini             return 0;
16116e790746SPaolo Bonzini         }
16126e790746SPaolo Bonzini     }
16136e790746SPaolo Bonzini 
16146e790746SPaolo Bonzini     virtio_queue_set_notification(q->rx_vq, 0);
16156e790746SPaolo Bonzini     return 1;
16166e790746SPaolo Bonzini }
16176e790746SPaolo Bonzini 
16181399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr)
1619032a74a1SCédric Le Goater {
16201399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->hdr_len);
16211399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->gso_size);
16221399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_start);
16231399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_offset);
1624032a74a1SCédric Le Goater }
1625032a74a1SCédric Le Goater 
16266e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
16276e790746SPaolo Bonzini  * it never finds out that the packets don't have valid checksums.  This
16286e790746SPaolo Bonzini  * causes dhclient to get upset.  Fedora's carried a patch for ages to
16296e790746SPaolo Bonzini  * fix this with Xen but it hasn't appeared in an upstream release of
16306e790746SPaolo Bonzini  * dhclient yet.
16316e790746SPaolo Bonzini  *
16326e790746SPaolo Bonzini  * To avoid breaking existing guests, we catch udp packets and add
16336e790746SPaolo Bonzini  * checksums.  This is terrible but it's better than hacking the guest
16346e790746SPaolo Bonzini  * kernels.
16356e790746SPaolo Bonzini  *
16366e790746SPaolo Bonzini  * N.B. if we introduce a zero-copy API, this operation is no longer free so
16376e790746SPaolo Bonzini  * we should provide a mechanism to disable it to avoid polluting the host
16386e790746SPaolo Bonzini  * cache.
16396e790746SPaolo Bonzini  */
16406e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
16416e790746SPaolo Bonzini                                         uint8_t *buf, size_t size)
16426e790746SPaolo Bonzini {
16436e790746SPaolo Bonzini     if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
16446e790746SPaolo Bonzini         (size > 27 && size < 1500) && /* normal sized MTU */
16456e790746SPaolo Bonzini         (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
16466e790746SPaolo Bonzini         (buf[23] == 17) && /* ip.protocol == UDP */
16476e790746SPaolo Bonzini         (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
1648f5746335SBin Meng         net_checksum_calculate(buf, size, CSUM_UDP);
16496e790746SPaolo Bonzini         hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
16506e790746SPaolo Bonzini     }
16516e790746SPaolo Bonzini }
16526e790746SPaolo Bonzini 
16536e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
16546e790746SPaolo Bonzini                            const void *buf, size_t size)
16556e790746SPaolo Bonzini {
16566e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
16576e790746SPaolo Bonzini         /* FIXME this cast is evil */
16586e790746SPaolo Bonzini         void *wbuf = (void *)buf;
16596e790746SPaolo Bonzini         work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
16606e790746SPaolo Bonzini                                     size - n->host_hdr_len);
16611bfa316cSGreg Kurz 
16621bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
16631399c60dSRusty Russell             virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf);
16641bfa316cSGreg Kurz         }
16656e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
16666e790746SPaolo Bonzini     } else {
16676e790746SPaolo Bonzini         struct virtio_net_hdr hdr = {
16686e790746SPaolo Bonzini             .flags = 0,
16696e790746SPaolo Bonzini             .gso_type = VIRTIO_NET_HDR_GSO_NONE
16706e790746SPaolo Bonzini         };
16716e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
16726e790746SPaolo Bonzini     }
16736e790746SPaolo Bonzini }
16746e790746SPaolo Bonzini 
16756e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
16766e790746SPaolo Bonzini {
16776e790746SPaolo Bonzini     static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
16786e790746SPaolo Bonzini     static const uint8_t vlan[] = {0x81, 0x00};
16796e790746SPaolo Bonzini     uint8_t *ptr = (uint8_t *)buf;
16806e790746SPaolo Bonzini     int i;
16816e790746SPaolo Bonzini 
16826e790746SPaolo Bonzini     if (n->promisc)
16836e790746SPaolo Bonzini         return 1;
16846e790746SPaolo Bonzini 
16856e790746SPaolo Bonzini     ptr += n->host_hdr_len;
16866e790746SPaolo Bonzini 
16876e790746SPaolo Bonzini     if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
16887542d3e7SPeter Maydell         int vid = lduw_be_p(ptr + 14) & 0xfff;
16896e790746SPaolo Bonzini         if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
16906e790746SPaolo Bonzini             return 0;
16916e790746SPaolo Bonzini     }
16926e790746SPaolo Bonzini 
16936e790746SPaolo Bonzini     if (ptr[0] & 1) { // multicast
16946e790746SPaolo Bonzini         if (!memcmp(ptr, bcast, sizeof(bcast))) {
16956e790746SPaolo Bonzini             return !n->nobcast;
16966e790746SPaolo Bonzini         } else if (n->nomulti) {
16976e790746SPaolo Bonzini             return 0;
16986e790746SPaolo Bonzini         } else if (n->allmulti || n->mac_table.multi_overflow) {
16996e790746SPaolo Bonzini             return 1;
17006e790746SPaolo Bonzini         }
17016e790746SPaolo Bonzini 
17026e790746SPaolo Bonzini         for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
17036e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
17046e790746SPaolo Bonzini                 return 1;
17056e790746SPaolo Bonzini             }
17066e790746SPaolo Bonzini         }
17076e790746SPaolo Bonzini     } else { // unicast
17086e790746SPaolo Bonzini         if (n->nouni) {
17096e790746SPaolo Bonzini             return 0;
17106e790746SPaolo Bonzini         } else if (n->alluni || n->mac_table.uni_overflow) {
17116e790746SPaolo Bonzini             return 1;
17126e790746SPaolo Bonzini         } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
17136e790746SPaolo Bonzini             return 1;
17146e790746SPaolo Bonzini         }
17156e790746SPaolo Bonzini 
17166e790746SPaolo Bonzini         for (i = 0; i < n->mac_table.first_multi; i++) {
17176e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
17186e790746SPaolo Bonzini                 return 1;
17196e790746SPaolo Bonzini             }
17206e790746SPaolo Bonzini         }
17216e790746SPaolo Bonzini     }
17226e790746SPaolo Bonzini 
17236e790746SPaolo Bonzini     return 0;
17246e790746SPaolo Bonzini }
17256e790746SPaolo Bonzini 
17264474e37aSYuri Benditovich static uint8_t virtio_net_get_hash_type(bool isip4,
17274474e37aSYuri Benditovich                                         bool isip6,
17284474e37aSYuri Benditovich                                         bool isudp,
17294474e37aSYuri Benditovich                                         bool istcp,
17304474e37aSYuri Benditovich                                         uint32_t types)
17314474e37aSYuri Benditovich {
17324474e37aSYuri Benditovich     if (isip4) {
17334474e37aSYuri Benditovich         if (istcp && (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4)) {
17344474e37aSYuri Benditovich             return NetPktRssIpV4Tcp;
17354474e37aSYuri Benditovich         }
17364474e37aSYuri Benditovich         if (isudp && (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4)) {
17374474e37aSYuri Benditovich             return NetPktRssIpV4Udp;
17384474e37aSYuri Benditovich         }
17394474e37aSYuri Benditovich         if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) {
17404474e37aSYuri Benditovich             return NetPktRssIpV4;
17414474e37aSYuri Benditovich         }
17424474e37aSYuri Benditovich     } else if (isip6) {
17434474e37aSYuri Benditovich         uint32_t mask = VIRTIO_NET_RSS_HASH_TYPE_TCP_EX |
17444474e37aSYuri Benditovich                         VIRTIO_NET_RSS_HASH_TYPE_TCPv6;
17454474e37aSYuri Benditovich 
17464474e37aSYuri Benditovich         if (istcp && (types & mask)) {
17474474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) ?
17484474e37aSYuri Benditovich                 NetPktRssIpV6TcpEx : NetPktRssIpV6Tcp;
17494474e37aSYuri Benditovich         }
17504474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_UDP_EX | VIRTIO_NET_RSS_HASH_TYPE_UDPv6;
17514474e37aSYuri Benditovich         if (isudp && (types & mask)) {
17524474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) ?
17534474e37aSYuri Benditovich                 NetPktRssIpV6UdpEx : NetPktRssIpV6Udp;
17544474e37aSYuri Benditovich         }
17554474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_IP_EX | VIRTIO_NET_RSS_HASH_TYPE_IPv6;
17564474e37aSYuri Benditovich         if (types & mask) {
17574474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) ?
17584474e37aSYuri Benditovich                 NetPktRssIpV6Ex : NetPktRssIpV6;
17594474e37aSYuri Benditovich         }
17604474e37aSYuri Benditovich     }
17614474e37aSYuri Benditovich     return 0xff;
17624474e37aSYuri Benditovich }
17634474e37aSYuri Benditovich 
1764e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report,
1765e22f0603SYuri Benditovich                                    uint32_t hash)
1766e22f0603SYuri Benditovich {
1767e22f0603SYuri Benditovich     struct virtio_net_hdr_v1_hash *hdr = (void *)buf;
1768e22f0603SYuri Benditovich     hdr->hash_value = hash;
1769e22f0603SYuri Benditovich     hdr->hash_report = report;
1770e22f0603SYuri Benditovich }
1771e22f0603SYuri Benditovich 
17724474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf,
177397cd965cSPaolo Bonzini                                   size_t size)
17746e790746SPaolo Bonzini {
17756e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1776e22f0603SYuri Benditovich     unsigned int index = nc->queue_index, new_index = index;
17774474e37aSYuri Benditovich     struct NetRxPkt *pkt = n->rx_pkt;
17784474e37aSYuri Benditovich     uint8_t net_hash_type;
17794474e37aSYuri Benditovich     uint32_t hash;
17804474e37aSYuri Benditovich     bool isip4, isip6, isudp, istcp;
1781e22f0603SYuri Benditovich     static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = {
1782e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv4,
1783e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv4,
1784e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6,
1785e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6,
1786e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6_EX,
1787e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6_EX,
1788e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv4,
1789e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6,
1790e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6_EX
1791e22f0603SYuri Benditovich     };
17924474e37aSYuri Benditovich 
17934474e37aSYuri Benditovich     net_rx_pkt_set_protocols(pkt, buf + n->host_hdr_len,
17944474e37aSYuri Benditovich                              size - n->host_hdr_len);
17954474e37aSYuri Benditovich     net_rx_pkt_get_protocols(pkt, &isip4, &isip6, &isudp, &istcp);
17964474e37aSYuri Benditovich     if (isip4 && (net_rx_pkt_get_ip4_info(pkt)->fragment)) {
17974474e37aSYuri Benditovich         istcp = isudp = false;
17984474e37aSYuri Benditovich     }
17994474e37aSYuri Benditovich     if (isip6 && (net_rx_pkt_get_ip6_info(pkt)->fragment)) {
18004474e37aSYuri Benditovich         istcp = isudp = false;
18014474e37aSYuri Benditovich     }
18024474e37aSYuri Benditovich     net_hash_type = virtio_net_get_hash_type(isip4, isip6, isudp, istcp,
18034474e37aSYuri Benditovich                                              n->rss_data.hash_types);
18044474e37aSYuri Benditovich     if (net_hash_type > NetPktRssIpV6UdpEx) {
1805e22f0603SYuri Benditovich         if (n->rss_data.populate_hash) {
1806e22f0603SYuri Benditovich             virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0);
1807e22f0603SYuri Benditovich         }
1808e22f0603SYuri Benditovich         return n->rss_data.redirect ? n->rss_data.default_queue : -1;
18094474e37aSYuri Benditovich     }
18104474e37aSYuri Benditovich 
18114474e37aSYuri Benditovich     hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key);
1812e22f0603SYuri Benditovich 
1813e22f0603SYuri Benditovich     if (n->rss_data.populate_hash) {
1814e22f0603SYuri Benditovich         virtio_set_packet_hash(buf, reports[net_hash_type], hash);
1815e22f0603SYuri Benditovich     }
1816e22f0603SYuri Benditovich 
1817e22f0603SYuri Benditovich     if (n->rss_data.redirect) {
18184474e37aSYuri Benditovich         new_index = hash & (n->rss_data.indirections_len - 1);
18194474e37aSYuri Benditovich         new_index = n->rss_data.indirections_table[new_index];
18204474e37aSYuri Benditovich     }
1821e22f0603SYuri Benditovich 
1822e22f0603SYuri Benditovich     return (index == new_index) ? -1 : new_index;
18234474e37aSYuri Benditovich }
18244474e37aSYuri Benditovich 
18254474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf,
18264474e37aSYuri Benditovich                                       size_t size, bool no_rss)
18274474e37aSYuri Benditovich {
18284474e37aSYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
18296e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
183017a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1831bedd7e93SJason Wang     VirtQueueElement *elems[VIRTQUEUE_MAX_SIZE];
1832bedd7e93SJason Wang     size_t lens[VIRTQUEUE_MAX_SIZE];
18336e790746SPaolo Bonzini     struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
18346e790746SPaolo Bonzini     struct virtio_net_hdr_mrg_rxbuf mhdr;
18356e790746SPaolo Bonzini     unsigned mhdr_cnt = 0;
1836bedd7e93SJason Wang     size_t offset, i, guest_offset, j;
1837bedd7e93SJason Wang     ssize_t err;
18386e790746SPaolo Bonzini 
18396e790746SPaolo Bonzini     if (!virtio_net_can_receive(nc)) {
18406e790746SPaolo Bonzini         return -1;
18416e790746SPaolo Bonzini     }
18426e790746SPaolo Bonzini 
18430145c393SAndrew Melnychenko     if (!no_rss && n->rss_data.enabled && n->rss_data.enabled_software_rss) {
18444474e37aSYuri Benditovich         int index = virtio_net_process_rss(nc, buf, size);
18454474e37aSYuri Benditovich         if (index >= 0) {
18464474e37aSYuri Benditovich             NetClientState *nc2 = qemu_get_subqueue(n->nic, index);
18474474e37aSYuri Benditovich             return virtio_net_receive_rcu(nc2, buf, size, true);
18484474e37aSYuri Benditovich         }
18494474e37aSYuri Benditovich     }
18504474e37aSYuri Benditovich 
18516e790746SPaolo Bonzini     /* hdr_len refers to the header we supply to the guest */
18526e790746SPaolo Bonzini     if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
18536e790746SPaolo Bonzini         return 0;
18546e790746SPaolo Bonzini     }
18556e790746SPaolo Bonzini 
18566e790746SPaolo Bonzini     if (!receive_filter(n, buf, size))
18576e790746SPaolo Bonzini         return size;
18586e790746SPaolo Bonzini 
18596e790746SPaolo Bonzini     offset = i = 0;
18606e790746SPaolo Bonzini 
18616e790746SPaolo Bonzini     while (offset < size) {
186251b19ebeSPaolo Bonzini         VirtQueueElement *elem;
18636e790746SPaolo Bonzini         int len, total;
186451b19ebeSPaolo Bonzini         const struct iovec *sg;
18656e790746SPaolo Bonzini 
18666e790746SPaolo Bonzini         total = 0;
18676e790746SPaolo Bonzini 
1868bedd7e93SJason Wang         if (i == VIRTQUEUE_MAX_SIZE) {
1869bedd7e93SJason Wang             virtio_error(vdev, "virtio-net unexpected long buffer chain");
1870bedd7e93SJason Wang             err = size;
1871bedd7e93SJason Wang             goto err;
1872bedd7e93SJason Wang         }
1873bedd7e93SJason Wang 
187451b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement));
187551b19ebeSPaolo Bonzini         if (!elem) {
1876ba10b9c0SGreg Kurz             if (i) {
1877ba10b9c0SGreg Kurz                 virtio_error(vdev, "virtio-net unexpected empty queue: "
18786e790746SPaolo Bonzini                              "i %zd mergeable %d offset %zd, size %zd, "
1879019a3edbSGerd Hoffmann                              "guest hdr len %zd, host hdr len %zd "
1880019a3edbSGerd Hoffmann                              "guest features 0x%" PRIx64,
18816e790746SPaolo Bonzini                              i, n->mergeable_rx_bufs, offset, size,
1882019a3edbSGerd Hoffmann                              n->guest_hdr_len, n->host_hdr_len,
1883019a3edbSGerd Hoffmann                              vdev->guest_features);
1884ba10b9c0SGreg Kurz             }
1885bedd7e93SJason Wang             err = -1;
1886bedd7e93SJason Wang             goto err;
18876e790746SPaolo Bonzini         }
18886e790746SPaolo Bonzini 
188951b19ebeSPaolo Bonzini         if (elem->in_num < 1) {
1890ba10b9c0SGreg Kurz             virtio_error(vdev,
1891ba10b9c0SGreg Kurz                          "virtio-net receive queue contains no in buffers");
1892ba10b9c0SGreg Kurz             virtqueue_detach_element(q->rx_vq, elem, 0);
1893ba10b9c0SGreg Kurz             g_free(elem);
1894bedd7e93SJason Wang             err = -1;
1895bedd7e93SJason Wang             goto err;
18966e790746SPaolo Bonzini         }
18976e790746SPaolo Bonzini 
189851b19ebeSPaolo Bonzini         sg = elem->in_sg;
18996e790746SPaolo Bonzini         if (i == 0) {
19006e790746SPaolo Bonzini             assert(offset == 0);
19016e790746SPaolo Bonzini             if (n->mergeable_rx_bufs) {
19026e790746SPaolo Bonzini                 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
190351b19ebeSPaolo Bonzini                                     sg, elem->in_num,
19046e790746SPaolo Bonzini                                     offsetof(typeof(mhdr), num_buffers),
19056e790746SPaolo Bonzini                                     sizeof(mhdr.num_buffers));
19066e790746SPaolo Bonzini             }
19076e790746SPaolo Bonzini 
190851b19ebeSPaolo Bonzini             receive_header(n, sg, elem->in_num, buf, size);
1909e22f0603SYuri Benditovich             if (n->rss_data.populate_hash) {
1910e22f0603SYuri Benditovich                 offset = sizeof(mhdr);
1911e22f0603SYuri Benditovich                 iov_from_buf(sg, elem->in_num, offset,
1912e22f0603SYuri Benditovich                              buf + offset, n->host_hdr_len - sizeof(mhdr));
1913e22f0603SYuri Benditovich             }
19146e790746SPaolo Bonzini             offset = n->host_hdr_len;
19156e790746SPaolo Bonzini             total += n->guest_hdr_len;
19166e790746SPaolo Bonzini             guest_offset = n->guest_hdr_len;
19176e790746SPaolo Bonzini         } else {
19186e790746SPaolo Bonzini             guest_offset = 0;
19196e790746SPaolo Bonzini         }
19206e790746SPaolo Bonzini 
19216e790746SPaolo Bonzini         /* copy in packet.  ugh */
192251b19ebeSPaolo Bonzini         len = iov_from_buf(sg, elem->in_num, guest_offset,
19236e790746SPaolo Bonzini                            buf + offset, size - offset);
19246e790746SPaolo Bonzini         total += len;
19256e790746SPaolo Bonzini         offset += len;
19266e790746SPaolo Bonzini         /* If buffers can't be merged, at this point we
19276e790746SPaolo Bonzini          * must have consumed the complete packet.
19286e790746SPaolo Bonzini          * Otherwise, drop it. */
19296e790746SPaolo Bonzini         if (!n->mergeable_rx_bufs && offset < size) {
193027e57efeSLadi Prosek             virtqueue_unpop(q->rx_vq, elem, total);
193151b19ebeSPaolo Bonzini             g_free(elem);
1932bedd7e93SJason Wang             err = size;
1933bedd7e93SJason Wang             goto err;
19346e790746SPaolo Bonzini         }
19356e790746SPaolo Bonzini 
1936bedd7e93SJason Wang         elems[i] = elem;
1937bedd7e93SJason Wang         lens[i] = total;
1938bedd7e93SJason Wang         i++;
19396e790746SPaolo Bonzini     }
19406e790746SPaolo Bonzini 
19416e790746SPaolo Bonzini     if (mhdr_cnt) {
19421399c60dSRusty Russell         virtio_stw_p(vdev, &mhdr.num_buffers, i);
19436e790746SPaolo Bonzini         iov_from_buf(mhdr_sg, mhdr_cnt,
19446e790746SPaolo Bonzini                      0,
19456e790746SPaolo Bonzini                      &mhdr.num_buffers, sizeof mhdr.num_buffers);
19466e790746SPaolo Bonzini     }
19476e790746SPaolo Bonzini 
1948bedd7e93SJason Wang     for (j = 0; j < i; j++) {
1949bedd7e93SJason Wang         /* signal other side */
1950bedd7e93SJason Wang         virtqueue_fill(q->rx_vq, elems[j], lens[j], j);
1951bedd7e93SJason Wang         g_free(elems[j]);
1952bedd7e93SJason Wang     }
1953bedd7e93SJason Wang 
19546e790746SPaolo Bonzini     virtqueue_flush(q->rx_vq, i);
195517a0ca55SKONRAD Frederic     virtio_notify(vdev, q->rx_vq);
19566e790746SPaolo Bonzini 
19576e790746SPaolo Bonzini     return size;
1958bedd7e93SJason Wang 
1959bedd7e93SJason Wang err:
1960bedd7e93SJason Wang     for (j = 0; j < i; j++) {
1961abe300d9SJason Wang         virtqueue_detach_element(q->rx_vq, elems[j], lens[j]);
1962bedd7e93SJason Wang         g_free(elems[j]);
1963bedd7e93SJason Wang     }
1964bedd7e93SJason Wang 
1965bedd7e93SJason Wang     return err;
19666e790746SPaolo Bonzini }
19676e790746SPaolo Bonzini 
19682974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf,
196997cd965cSPaolo Bonzini                                   size_t size)
197097cd965cSPaolo Bonzini {
1971068ddfa9SDr. David Alan Gilbert     RCU_READ_LOCK_GUARD();
197297cd965cSPaolo Bonzini 
19734474e37aSYuri Benditovich     return virtio_net_receive_rcu(nc, buf, size, false);
197497cd965cSPaolo Bonzini }
197597cd965cSPaolo Bonzini 
19762974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain,
19772974e916SYuri Benditovich                                          const uint8_t *buf,
19782974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
19792974e916SYuri Benditovich {
19802974e916SYuri Benditovich     uint16_t ip_hdrlen;
19812974e916SYuri Benditovich     struct ip_header *ip;
19822974e916SYuri Benditovich 
19832974e916SYuri Benditovich     ip = (struct ip_header *)(buf + chain->n->guest_hdr_len
19842974e916SYuri Benditovich                               + sizeof(struct eth_header));
19852974e916SYuri Benditovich     unit->ip = (void *)ip;
19862974e916SYuri Benditovich     ip_hdrlen = (ip->ip_ver_len & 0xF) << 2;
19872974e916SYuri Benditovich     unit->ip_plen = &ip->ip_len;
19882974e916SYuri Benditovich     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen);
19892974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
19902974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen;
19912974e916SYuri Benditovich }
19922974e916SYuri Benditovich 
19932974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain,
19942974e916SYuri Benditovich                                          const uint8_t *buf,
19952974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
19962974e916SYuri Benditovich {
19972974e916SYuri Benditovich     struct ip6_header *ip6;
19982974e916SYuri Benditovich 
19992974e916SYuri Benditovich     ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len
20002974e916SYuri Benditovich                                  + sizeof(struct eth_header));
20012974e916SYuri Benditovich     unit->ip = ip6;
20022974e916SYuri Benditovich     unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
200378ee6bd0SPhilippe Mathieu-Daudé     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip)
20042974e916SYuri Benditovich                                         + sizeof(struct ip6_header));
20052974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
20062974e916SYuri Benditovich 
20072974e916SYuri Benditovich     /* There is a difference between payload lenght in ipv4 and v6,
20082974e916SYuri Benditovich        ip header is excluded in ipv6 */
20092974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen;
20102974e916SYuri Benditovich }
20112974e916SYuri Benditovich 
20122974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain,
20132974e916SYuri Benditovich                                        VirtioNetRscSeg *seg)
20142974e916SYuri Benditovich {
20152974e916SYuri Benditovich     int ret;
2016dd3d85e8SYuri Benditovich     struct virtio_net_hdr_v1 *h;
20172974e916SYuri Benditovich 
2018dd3d85e8SYuri Benditovich     h = (struct virtio_net_hdr_v1 *)seg->buf;
20192974e916SYuri Benditovich     h->flags = 0;
20202974e916SYuri Benditovich     h->gso_type = VIRTIO_NET_HDR_GSO_NONE;
20212974e916SYuri Benditovich 
20222974e916SYuri Benditovich     if (seg->is_coalesced) {
2023dd3d85e8SYuri Benditovich         h->rsc.segments = seg->packets;
2024dd3d85e8SYuri Benditovich         h->rsc.dup_acks = seg->dup_ack;
20252974e916SYuri Benditovich         h->flags = VIRTIO_NET_HDR_F_RSC_INFO;
20262974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
20272974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
20282974e916SYuri Benditovich         } else {
20292974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
20302974e916SYuri Benditovich         }
20312974e916SYuri Benditovich     }
20322974e916SYuri Benditovich 
20332974e916SYuri Benditovich     ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size);
20342974e916SYuri Benditovich     QTAILQ_REMOVE(&chain->buffers, seg, next);
20352974e916SYuri Benditovich     g_free(seg->buf);
20362974e916SYuri Benditovich     g_free(seg);
20372974e916SYuri Benditovich 
20382974e916SYuri Benditovich     return ret;
20392974e916SYuri Benditovich }
20402974e916SYuri Benditovich 
20412974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq)
20422974e916SYuri Benditovich {
20432974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn;
20442974e916SYuri Benditovich     VirtioNetRscChain *chain = (VirtioNetRscChain *)opq;
20452974e916SYuri Benditovich 
20462974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) {
20472974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
20482974e916SYuri Benditovich             chain->stat.purge_failed++;
20492974e916SYuri Benditovich             continue;
20502974e916SYuri Benditovich         }
20512974e916SYuri Benditovich     }
20522974e916SYuri Benditovich 
20532974e916SYuri Benditovich     chain->stat.timer++;
20542974e916SYuri Benditovich     if (!QTAILQ_EMPTY(&chain->buffers)) {
20552974e916SYuri Benditovich         timer_mod(chain->drain_timer,
20562974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
20572974e916SYuri Benditovich     }
20582974e916SYuri Benditovich }
20592974e916SYuri Benditovich 
20602974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n)
20612974e916SYuri Benditovich {
20622974e916SYuri Benditovich     VirtioNetRscChain *chain, *rn_chain;
20632974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn_seg;
20642974e916SYuri Benditovich 
20652974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) {
20662974e916SYuri Benditovich         QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) {
20672974e916SYuri Benditovich             QTAILQ_REMOVE(&chain->buffers, seg, next);
20682974e916SYuri Benditovich             g_free(seg->buf);
20692974e916SYuri Benditovich             g_free(seg);
20702974e916SYuri Benditovich         }
20712974e916SYuri Benditovich 
20722974e916SYuri Benditovich         timer_free(chain->drain_timer);
20732974e916SYuri Benditovich         QTAILQ_REMOVE(&n->rsc_chains, chain, next);
20742974e916SYuri Benditovich         g_free(chain);
20752974e916SYuri Benditovich     }
20762974e916SYuri Benditovich }
20772974e916SYuri Benditovich 
20782974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain,
20792974e916SYuri Benditovich                                      NetClientState *nc,
20802974e916SYuri Benditovich                                      const uint8_t *buf, size_t size)
20812974e916SYuri Benditovich {
20822974e916SYuri Benditovich     uint16_t hdr_len;
20832974e916SYuri Benditovich     VirtioNetRscSeg *seg;
20842974e916SYuri Benditovich 
20852974e916SYuri Benditovich     hdr_len = chain->n->guest_hdr_len;
2086b21e2380SMarkus Armbruster     seg = g_new(VirtioNetRscSeg, 1);
20872974e916SYuri Benditovich     seg->buf = g_malloc(hdr_len + sizeof(struct eth_header)
20882974e916SYuri Benditovich         + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD);
20892974e916SYuri Benditovich     memcpy(seg->buf, buf, size);
20902974e916SYuri Benditovich     seg->size = size;
20912974e916SYuri Benditovich     seg->packets = 1;
20922974e916SYuri Benditovich     seg->dup_ack = 0;
20932974e916SYuri Benditovich     seg->is_coalesced = 0;
20942974e916SYuri Benditovich     seg->nc = nc;
20952974e916SYuri Benditovich 
20962974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&chain->buffers, seg, next);
20972974e916SYuri Benditovich     chain->stat.cache++;
20982974e916SYuri Benditovich 
20992974e916SYuri Benditovich     switch (chain->proto) {
21002974e916SYuri Benditovich     case ETH_P_IP:
21012974e916SYuri Benditovich         virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit);
21022974e916SYuri Benditovich         break;
21032974e916SYuri Benditovich     case ETH_P_IPV6:
21042974e916SYuri Benditovich         virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit);
21052974e916SYuri Benditovich         break;
21062974e916SYuri Benditovich     default:
21072974e916SYuri Benditovich         g_assert_not_reached();
21082974e916SYuri Benditovich     }
21092974e916SYuri Benditovich }
21102974e916SYuri Benditovich 
21112974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain,
21122974e916SYuri Benditovich                                          VirtioNetRscSeg *seg,
21132974e916SYuri Benditovich                                          const uint8_t *buf,
21142974e916SYuri Benditovich                                          struct tcp_header *n_tcp,
21152974e916SYuri Benditovich                                          struct tcp_header *o_tcp)
21162974e916SYuri Benditovich {
21172974e916SYuri Benditovich     uint32_t nack, oack;
21182974e916SYuri Benditovich     uint16_t nwin, owin;
21192974e916SYuri Benditovich 
21202974e916SYuri Benditovich     nack = htonl(n_tcp->th_ack);
21212974e916SYuri Benditovich     nwin = htons(n_tcp->th_win);
21222974e916SYuri Benditovich     oack = htonl(o_tcp->th_ack);
21232974e916SYuri Benditovich     owin = htons(o_tcp->th_win);
21242974e916SYuri Benditovich 
21252974e916SYuri Benditovich     if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) {
21262974e916SYuri Benditovich         chain->stat.ack_out_of_win++;
21272974e916SYuri Benditovich         return RSC_FINAL;
21282974e916SYuri Benditovich     } else if (nack == oack) {
21292974e916SYuri Benditovich         /* duplicated ack or window probe */
21302974e916SYuri Benditovich         if (nwin == owin) {
21312974e916SYuri Benditovich             /* duplicated ack, add dup ack count due to whql test up to 1 */
21322974e916SYuri Benditovich             chain->stat.dup_ack++;
21332974e916SYuri Benditovich             return RSC_FINAL;
21342974e916SYuri Benditovich         } else {
21352974e916SYuri Benditovich             /* Coalesce window update */
21362974e916SYuri Benditovich             o_tcp->th_win = n_tcp->th_win;
21372974e916SYuri Benditovich             chain->stat.win_update++;
21382974e916SYuri Benditovich             return RSC_COALESCE;
21392974e916SYuri Benditovich         }
21402974e916SYuri Benditovich     } else {
21412974e916SYuri Benditovich         /* pure ack, go to 'C', finalize*/
21422974e916SYuri Benditovich         chain->stat.pure_ack++;
21432974e916SYuri Benditovich         return RSC_FINAL;
21442974e916SYuri Benditovich     }
21452974e916SYuri Benditovich }
21462974e916SYuri Benditovich 
21472974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain,
21482974e916SYuri Benditovich                                             VirtioNetRscSeg *seg,
21492974e916SYuri Benditovich                                             const uint8_t *buf,
21502974e916SYuri Benditovich                                             VirtioNetRscUnit *n_unit)
21512974e916SYuri Benditovich {
21522974e916SYuri Benditovich     void *data;
21532974e916SYuri Benditovich     uint16_t o_ip_len;
21542974e916SYuri Benditovich     uint32_t nseq, oseq;
21552974e916SYuri Benditovich     VirtioNetRscUnit *o_unit;
21562974e916SYuri Benditovich 
21572974e916SYuri Benditovich     o_unit = &seg->unit;
21582974e916SYuri Benditovich     o_ip_len = htons(*o_unit->ip_plen);
21592974e916SYuri Benditovich     nseq = htonl(n_unit->tcp->th_seq);
21602974e916SYuri Benditovich     oseq = htonl(o_unit->tcp->th_seq);
21612974e916SYuri Benditovich 
21622974e916SYuri Benditovich     /* out of order or retransmitted. */
21632974e916SYuri Benditovich     if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) {
21642974e916SYuri Benditovich         chain->stat.data_out_of_win++;
21652974e916SYuri Benditovich         return RSC_FINAL;
21662974e916SYuri Benditovich     }
21672974e916SYuri Benditovich 
21682974e916SYuri Benditovich     data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen;
21692974e916SYuri Benditovich     if (nseq == oseq) {
21702974e916SYuri Benditovich         if ((o_unit->payload == 0) && n_unit->payload) {
21712974e916SYuri Benditovich             /* From no payload to payload, normal case, not a dup ack or etc */
21722974e916SYuri Benditovich             chain->stat.data_after_pure_ack++;
21732974e916SYuri Benditovich             goto coalesce;
21742974e916SYuri Benditovich         } else {
21752974e916SYuri Benditovich             return virtio_net_rsc_handle_ack(chain, seg, buf,
21762974e916SYuri Benditovich                                              n_unit->tcp, o_unit->tcp);
21772974e916SYuri Benditovich         }
21782974e916SYuri Benditovich     } else if ((nseq - oseq) != o_unit->payload) {
21792974e916SYuri Benditovich         /* Not a consistent packet, out of order */
21802974e916SYuri Benditovich         chain->stat.data_out_of_order++;
21812974e916SYuri Benditovich         return RSC_FINAL;
21822974e916SYuri Benditovich     } else {
21832974e916SYuri Benditovich coalesce:
21842974e916SYuri Benditovich         if ((o_ip_len + n_unit->payload) > chain->max_payload) {
21852974e916SYuri Benditovich             chain->stat.over_size++;
21862974e916SYuri Benditovich             return RSC_FINAL;
21872974e916SYuri Benditovich         }
21882974e916SYuri Benditovich 
21892974e916SYuri Benditovich         /* Here comes the right data, the payload length in v4/v6 is different,
21902974e916SYuri Benditovich            so use the field value to update and record the new data len */
21912974e916SYuri Benditovich         o_unit->payload += n_unit->payload; /* update new data len */
21922974e916SYuri Benditovich 
21932974e916SYuri Benditovich         /* update field in ip header */
21942974e916SYuri Benditovich         *o_unit->ip_plen = htons(o_ip_len + n_unit->payload);
21952974e916SYuri Benditovich 
21962974e916SYuri Benditovich         /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced
21972974e916SYuri Benditovich            for windows guest, while this may change the behavior for linux
21982974e916SYuri Benditovich            guest (only if it uses RSC feature). */
21992974e916SYuri Benditovich         o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags;
22002974e916SYuri Benditovich 
22012974e916SYuri Benditovich         o_unit->tcp->th_ack = n_unit->tcp->th_ack;
22022974e916SYuri Benditovich         o_unit->tcp->th_win = n_unit->tcp->th_win;
22032974e916SYuri Benditovich 
22042974e916SYuri Benditovich         memmove(seg->buf + seg->size, data, n_unit->payload);
22052974e916SYuri Benditovich         seg->size += n_unit->payload;
22062974e916SYuri Benditovich         seg->packets++;
22072974e916SYuri Benditovich         chain->stat.coalesced++;
22082974e916SYuri Benditovich         return RSC_COALESCE;
22092974e916SYuri Benditovich     }
22102974e916SYuri Benditovich }
22112974e916SYuri Benditovich 
22122974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain,
22132974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
22142974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
22152974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
22162974e916SYuri Benditovich {
22172974e916SYuri Benditovich     struct ip_header *ip1, *ip2;
22182974e916SYuri Benditovich 
22192974e916SYuri Benditovich     ip1 = (struct ip_header *)(unit->ip);
22202974e916SYuri Benditovich     ip2 = (struct ip_header *)(seg->unit.ip);
22212974e916SYuri Benditovich     if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst)
22222974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
22232974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
22242974e916SYuri Benditovich         chain->stat.no_match++;
22252974e916SYuri Benditovich         return RSC_NO_MATCH;
22262974e916SYuri Benditovich     }
22272974e916SYuri Benditovich 
22282974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
22292974e916SYuri Benditovich }
22302974e916SYuri Benditovich 
22312974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain,
22322974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
22332974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
22342974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
22352974e916SYuri Benditovich {
22362974e916SYuri Benditovich     struct ip6_header *ip1, *ip2;
22372974e916SYuri Benditovich 
22382974e916SYuri Benditovich     ip1 = (struct ip6_header *)(unit->ip);
22392974e916SYuri Benditovich     ip2 = (struct ip6_header *)(seg->unit.ip);
22402974e916SYuri Benditovich     if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address))
22412974e916SYuri Benditovich         || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address))
22422974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
22432974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
22442974e916SYuri Benditovich             chain->stat.no_match++;
22452974e916SYuri Benditovich             return RSC_NO_MATCH;
22462974e916SYuri Benditovich     }
22472974e916SYuri Benditovich 
22482974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
22492974e916SYuri Benditovich }
22502974e916SYuri Benditovich 
22512974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain
22522974e916SYuri Benditovich  * to prevent out of order */
22532974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain,
22542974e916SYuri Benditovich                                          struct tcp_header *tcp)
22552974e916SYuri Benditovich {
22562974e916SYuri Benditovich     uint16_t tcp_hdr;
22572974e916SYuri Benditovich     uint16_t tcp_flag;
22582974e916SYuri Benditovich 
22592974e916SYuri Benditovich     tcp_flag = htons(tcp->th_offset_flags);
22602974e916SYuri Benditovich     tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10;
22612974e916SYuri Benditovich     tcp_flag &= VIRTIO_NET_TCP_FLAG;
22622974e916SYuri Benditovich     if (tcp_flag & TH_SYN) {
22632974e916SYuri Benditovich         chain->stat.tcp_syn++;
22642974e916SYuri Benditovich         return RSC_BYPASS;
22652974e916SYuri Benditovich     }
22662974e916SYuri Benditovich 
22672974e916SYuri Benditovich     if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) {
22682974e916SYuri Benditovich         chain->stat.tcp_ctrl_drain++;
22692974e916SYuri Benditovich         return RSC_FINAL;
22702974e916SYuri Benditovich     }
22712974e916SYuri Benditovich 
22722974e916SYuri Benditovich     if (tcp_hdr > sizeof(struct tcp_header)) {
22732974e916SYuri Benditovich         chain->stat.tcp_all_opt++;
22742974e916SYuri Benditovich         return RSC_FINAL;
22752974e916SYuri Benditovich     }
22762974e916SYuri Benditovich 
22772974e916SYuri Benditovich     return RSC_CANDIDATE;
22782974e916SYuri Benditovich }
22792974e916SYuri Benditovich 
22802974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain,
22812974e916SYuri Benditovich                                          NetClientState *nc,
22822974e916SYuri Benditovich                                          const uint8_t *buf, size_t size,
22832974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
22842974e916SYuri Benditovich {
22852974e916SYuri Benditovich     int ret;
22862974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
22872974e916SYuri Benditovich 
22882974e916SYuri Benditovich     if (QTAILQ_EMPTY(&chain->buffers)) {
22892974e916SYuri Benditovich         chain->stat.empty_cache++;
22902974e916SYuri Benditovich         virtio_net_rsc_cache_buf(chain, nc, buf, size);
22912974e916SYuri Benditovich         timer_mod(chain->drain_timer,
22922974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
22932974e916SYuri Benditovich         return size;
22942974e916SYuri Benditovich     }
22952974e916SYuri Benditovich 
22962974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
22972974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
22982974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit);
22992974e916SYuri Benditovich         } else {
23002974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit);
23012974e916SYuri Benditovich         }
23022974e916SYuri Benditovich 
23032974e916SYuri Benditovich         if (ret == RSC_FINAL) {
23042974e916SYuri Benditovich             if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
23052974e916SYuri Benditovich                 /* Send failed */
23062974e916SYuri Benditovich                 chain->stat.final_failed++;
23072974e916SYuri Benditovich                 return 0;
23082974e916SYuri Benditovich             }
23092974e916SYuri Benditovich 
23102974e916SYuri Benditovich             /* Send current packet */
23112974e916SYuri Benditovich             return virtio_net_do_receive(nc, buf, size);
23122974e916SYuri Benditovich         } else if (ret == RSC_NO_MATCH) {
23132974e916SYuri Benditovich             continue;
23142974e916SYuri Benditovich         } else {
23152974e916SYuri Benditovich             /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */
23162974e916SYuri Benditovich             seg->is_coalesced = 1;
23172974e916SYuri Benditovich             return size;
23182974e916SYuri Benditovich         }
23192974e916SYuri Benditovich     }
23202974e916SYuri Benditovich 
23212974e916SYuri Benditovich     chain->stat.no_match_cache++;
23222974e916SYuri Benditovich     virtio_net_rsc_cache_buf(chain, nc, buf, size);
23232974e916SYuri Benditovich     return size;
23242974e916SYuri Benditovich }
23252974e916SYuri Benditovich 
23262974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */
23272974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain,
23282974e916SYuri Benditovich                                         NetClientState *nc,
23292974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
23302974e916SYuri Benditovich                                         uint16_t ip_start, uint16_t ip_size,
23312974e916SYuri Benditovich                                         uint16_t tcp_port)
23322974e916SYuri Benditovich {
23332974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
23342974e916SYuri Benditovich     uint32_t ppair1, ppair2;
23352974e916SYuri Benditovich 
23362974e916SYuri Benditovich     ppair1 = *(uint32_t *)(buf + tcp_port);
23372974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
23382974e916SYuri Benditovich         ppair2 = *(uint32_t *)(seg->buf + tcp_port);
23392974e916SYuri Benditovich         if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size)
23402974e916SYuri Benditovich             || (ppair1 != ppair2)) {
23412974e916SYuri Benditovich             continue;
23422974e916SYuri Benditovich         }
23432974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
23442974e916SYuri Benditovich             chain->stat.drain_failed++;
23452974e916SYuri Benditovich         }
23462974e916SYuri Benditovich 
23472974e916SYuri Benditovich         break;
23482974e916SYuri Benditovich     }
23492974e916SYuri Benditovich 
23502974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
23512974e916SYuri Benditovich }
23522974e916SYuri Benditovich 
23532974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain,
23542974e916SYuri Benditovich                                             struct ip_header *ip,
23552974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
23562974e916SYuri Benditovich {
23572974e916SYuri Benditovich     uint16_t ip_len;
23582974e916SYuri Benditovich 
23592974e916SYuri Benditovich     /* Not an ipv4 packet */
23602974e916SYuri Benditovich     if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) {
23612974e916SYuri Benditovich         chain->stat.ip_option++;
23622974e916SYuri Benditovich         return RSC_BYPASS;
23632974e916SYuri Benditovich     }
23642974e916SYuri Benditovich 
23652974e916SYuri Benditovich     /* Don't handle packets with ip option */
23662974e916SYuri Benditovich     if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) {
23672974e916SYuri Benditovich         chain->stat.ip_option++;
23682974e916SYuri Benditovich         return RSC_BYPASS;
23692974e916SYuri Benditovich     }
23702974e916SYuri Benditovich 
23712974e916SYuri Benditovich     if (ip->ip_p != IPPROTO_TCP) {
23722974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
23732974e916SYuri Benditovich         return RSC_BYPASS;
23742974e916SYuri Benditovich     }
23752974e916SYuri Benditovich 
23762974e916SYuri Benditovich     /* Don't handle packets with ip fragment */
23772974e916SYuri Benditovich     if (!(htons(ip->ip_off) & IP_DF)) {
23782974e916SYuri Benditovich         chain->stat.ip_frag++;
23792974e916SYuri Benditovich         return RSC_BYPASS;
23802974e916SYuri Benditovich     }
23812974e916SYuri Benditovich 
23822974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
23832974e916SYuri Benditovich     if (IPTOS_ECN(ip->ip_tos)) {
23842974e916SYuri Benditovich         chain->stat.ip_ecn++;
23852974e916SYuri Benditovich         return RSC_BYPASS;
23862974e916SYuri Benditovich     }
23872974e916SYuri Benditovich 
23882974e916SYuri Benditovich     ip_len = htons(ip->ip_len);
23892974e916SYuri Benditovich     if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header))
23902974e916SYuri Benditovich         || ip_len > (size - chain->n->guest_hdr_len -
23912974e916SYuri Benditovich                      sizeof(struct eth_header))) {
23922974e916SYuri Benditovich         chain->stat.ip_hacked++;
23932974e916SYuri Benditovich         return RSC_BYPASS;
23942974e916SYuri Benditovich     }
23952974e916SYuri Benditovich 
23962974e916SYuri Benditovich     return RSC_CANDIDATE;
23972974e916SYuri Benditovich }
23982974e916SYuri Benditovich 
23992974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain,
24002974e916SYuri Benditovich                                       NetClientState *nc,
24012974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
24022974e916SYuri Benditovich {
24032974e916SYuri Benditovich     int32_t ret;
24042974e916SYuri Benditovich     uint16_t hdr_len;
24052974e916SYuri Benditovich     VirtioNetRscUnit unit;
24062974e916SYuri Benditovich 
24072974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
24082974e916SYuri Benditovich 
24092974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)
24102974e916SYuri Benditovich         + sizeof(struct tcp_header))) {
24112974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
24122974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24132974e916SYuri Benditovich     }
24142974e916SYuri Benditovich 
24152974e916SYuri Benditovich     virtio_net_rsc_extract_unit4(chain, buf, &unit);
24162974e916SYuri Benditovich     if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size)
24172974e916SYuri Benditovich         != RSC_CANDIDATE) {
24182974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24192974e916SYuri Benditovich     }
24202974e916SYuri Benditovich 
24212974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
24222974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
24232974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24242974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
24252974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
24262974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 12),
24272974e916SYuri Benditovich                 VIRTIO_NET_IP4_ADDR_SIZE,
24282974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header));
24292974e916SYuri Benditovich     }
24302974e916SYuri Benditovich 
24312974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
24322974e916SYuri Benditovich }
24332974e916SYuri Benditovich 
24342974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain,
24352974e916SYuri Benditovich                                             struct ip6_header *ip6,
24362974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
24372974e916SYuri Benditovich {
24382974e916SYuri Benditovich     uint16_t ip_len;
24392974e916SYuri Benditovich 
24402974e916SYuri Benditovich     if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4)
24412974e916SYuri Benditovich         != IP_HEADER_VERSION_6) {
24422974e916SYuri Benditovich         return RSC_BYPASS;
24432974e916SYuri Benditovich     }
24442974e916SYuri Benditovich 
24452974e916SYuri Benditovich     /* Both option and protocol is checked in this */
24462974e916SYuri Benditovich     if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) {
24472974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
24482974e916SYuri Benditovich         return RSC_BYPASS;
24492974e916SYuri Benditovich     }
24502974e916SYuri Benditovich 
24512974e916SYuri Benditovich     ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
24522974e916SYuri Benditovich     if (ip_len < sizeof(struct tcp_header) ||
24532974e916SYuri Benditovich         ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header)
24542974e916SYuri Benditovich                   - sizeof(struct ip6_header))) {
24552974e916SYuri Benditovich         chain->stat.ip_hacked++;
24562974e916SYuri Benditovich         return RSC_BYPASS;
24572974e916SYuri Benditovich     }
24582974e916SYuri Benditovich 
24592974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
24602974e916SYuri Benditovich     if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) {
24612974e916SYuri Benditovich         chain->stat.ip_ecn++;
24622974e916SYuri Benditovich         return RSC_BYPASS;
24632974e916SYuri Benditovich     }
24642974e916SYuri Benditovich 
24652974e916SYuri Benditovich     return RSC_CANDIDATE;
24662974e916SYuri Benditovich }
24672974e916SYuri Benditovich 
24682974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc,
24692974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
24702974e916SYuri Benditovich {
24712974e916SYuri Benditovich     int32_t ret;
24722974e916SYuri Benditovich     uint16_t hdr_len;
24732974e916SYuri Benditovich     VirtioNetRscChain *chain;
24742974e916SYuri Benditovich     VirtioNetRscUnit unit;
24752974e916SYuri Benditovich 
24763d558330SMarkus Armbruster     chain = opq;
24772974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
24782974e916SYuri Benditovich 
24792974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header)
24802974e916SYuri Benditovich         + sizeof(tcp_header))) {
24812974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24822974e916SYuri Benditovich     }
24832974e916SYuri Benditovich 
24842974e916SYuri Benditovich     virtio_net_rsc_extract_unit6(chain, buf, &unit);
24852974e916SYuri Benditovich     if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain,
24862974e916SYuri Benditovich                                                  unit.ip, buf, size)) {
24872974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24882974e916SYuri Benditovich     }
24892974e916SYuri Benditovich 
24902974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
24912974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
24922974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24932974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
24942974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
24952974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 8),
24962974e916SYuri Benditovich                 VIRTIO_NET_IP6_ADDR_SIZE,
24972974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header)
24982974e916SYuri Benditovich                 + sizeof(struct ip6_header));
24992974e916SYuri Benditovich     }
25002974e916SYuri Benditovich 
25012974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
25022974e916SYuri Benditovich }
25032974e916SYuri Benditovich 
25042974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n,
25052974e916SYuri Benditovich                                                       NetClientState *nc,
25062974e916SYuri Benditovich                                                       uint16_t proto)
25072974e916SYuri Benditovich {
25082974e916SYuri Benditovich     VirtioNetRscChain *chain;
25092974e916SYuri Benditovich 
25102974e916SYuri Benditovich     if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) {
25112974e916SYuri Benditovich         return NULL;
25122974e916SYuri Benditovich     }
25132974e916SYuri Benditovich 
25142974e916SYuri Benditovich     QTAILQ_FOREACH(chain, &n->rsc_chains, next) {
25152974e916SYuri Benditovich         if (chain->proto == proto) {
25162974e916SYuri Benditovich             return chain;
25172974e916SYuri Benditovich         }
25182974e916SYuri Benditovich     }
25192974e916SYuri Benditovich 
25202974e916SYuri Benditovich     chain = g_malloc(sizeof(*chain));
25212974e916SYuri Benditovich     chain->n = n;
25222974e916SYuri Benditovich     chain->proto = proto;
25232974e916SYuri Benditovich     if (proto == (uint16_t)ETH_P_IP) {
25242974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD;
25252974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
25262974e916SYuri Benditovich     } else {
25272974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD;
25282974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
25292974e916SYuri Benditovich     }
25302974e916SYuri Benditovich     chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST,
25312974e916SYuri Benditovich                                       virtio_net_rsc_purge, chain);
25322974e916SYuri Benditovich     memset(&chain->stat, 0, sizeof(chain->stat));
25332974e916SYuri Benditovich 
25342974e916SYuri Benditovich     QTAILQ_INIT(&chain->buffers);
25352974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next);
25362974e916SYuri Benditovich 
25372974e916SYuri Benditovich     return chain;
25382974e916SYuri Benditovich }
25392974e916SYuri Benditovich 
25402974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc,
25412974e916SYuri Benditovich                                       const uint8_t *buf,
25422974e916SYuri Benditovich                                       size_t size)
25432974e916SYuri Benditovich {
25442974e916SYuri Benditovich     uint16_t proto;
25452974e916SYuri Benditovich     VirtioNetRscChain *chain;
25462974e916SYuri Benditovich     struct eth_header *eth;
25472974e916SYuri Benditovich     VirtIONet *n;
25482974e916SYuri Benditovich 
25492974e916SYuri Benditovich     n = qemu_get_nic_opaque(nc);
25502974e916SYuri Benditovich     if (size < (n->host_hdr_len + sizeof(struct eth_header))) {
25512974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
25522974e916SYuri Benditovich     }
25532974e916SYuri Benditovich 
25542974e916SYuri Benditovich     eth = (struct eth_header *)(buf + n->guest_hdr_len);
25552974e916SYuri Benditovich     proto = htons(eth->h_proto);
25562974e916SYuri Benditovich 
25572974e916SYuri Benditovich     chain = virtio_net_rsc_lookup_chain(n, nc, proto);
25582974e916SYuri Benditovich     if (chain) {
25592974e916SYuri Benditovich         chain->stat.received++;
25602974e916SYuri Benditovich         if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) {
25612974e916SYuri Benditovich             return virtio_net_rsc_receive4(chain, nc, buf, size);
25622974e916SYuri Benditovich         } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) {
25632974e916SYuri Benditovich             return virtio_net_rsc_receive6(chain, nc, buf, size);
25642974e916SYuri Benditovich         }
25652974e916SYuri Benditovich     }
25662974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
25672974e916SYuri Benditovich }
25682974e916SYuri Benditovich 
25692974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf,
25702974e916SYuri Benditovich                                   size_t size)
25712974e916SYuri Benditovich {
25722974e916SYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
25732974e916SYuri Benditovich     if ((n->rsc4_enabled || n->rsc6_enabled)) {
25742974e916SYuri Benditovich         return virtio_net_rsc_receive(nc, buf, size);
25752974e916SYuri Benditovich     } else {
25762974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
25772974e916SYuri Benditovich     }
25782974e916SYuri Benditovich }
25792974e916SYuri Benditovich 
25806e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
25816e790746SPaolo Bonzini 
25826e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
25836e790746SPaolo Bonzini {
25846e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
25856e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
258617a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2587df8d0708SLaurent Vivier     int ret;
25886e790746SPaolo Bonzini 
258951b19ebeSPaolo Bonzini     virtqueue_push(q->tx_vq, q->async_tx.elem, 0);
259017a0ca55SKONRAD Frederic     virtio_notify(vdev, q->tx_vq);
25916e790746SPaolo Bonzini 
259251b19ebeSPaolo Bonzini     g_free(q->async_tx.elem);
259351b19ebeSPaolo Bonzini     q->async_tx.elem = NULL;
25946e790746SPaolo Bonzini 
25956e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2596df8d0708SLaurent Vivier     ret = virtio_net_flush_tx(q);
25977550a822SLaurent Vivier     if (ret >= n->tx_burst) {
2598df8d0708SLaurent Vivier         /*
2599df8d0708SLaurent Vivier          * the flush has been stopped by tx_burst
2600df8d0708SLaurent Vivier          * we will not receive notification for the
2601df8d0708SLaurent Vivier          * remainining part, so re-schedule
2602df8d0708SLaurent Vivier          */
2603df8d0708SLaurent Vivier         virtio_queue_set_notification(q->tx_vq, 0);
26047550a822SLaurent Vivier         if (q->tx_bh) {
2605df8d0708SLaurent Vivier             qemu_bh_schedule(q->tx_bh);
26067550a822SLaurent Vivier         } else {
26077550a822SLaurent Vivier             timer_mod(q->tx_timer,
26087550a822SLaurent Vivier                       qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
26097550a822SLaurent Vivier         }
2610df8d0708SLaurent Vivier         q->tx_waiting = 1;
2611df8d0708SLaurent Vivier     }
26126e790746SPaolo Bonzini }
26136e790746SPaolo Bonzini 
26146e790746SPaolo Bonzini /* TX */
26156e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
26166e790746SPaolo Bonzini {
26176e790746SPaolo Bonzini     VirtIONet *n = q->n;
261817a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
261951b19ebeSPaolo Bonzini     VirtQueueElement *elem;
26206e790746SPaolo Bonzini     int32_t num_packets = 0;
26216e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
262217a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
26236e790746SPaolo Bonzini         return num_packets;
26246e790746SPaolo Bonzini     }
26256e790746SPaolo Bonzini 
262651b19ebeSPaolo Bonzini     if (q->async_tx.elem) {
26276e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
26286e790746SPaolo Bonzini         return num_packets;
26296e790746SPaolo Bonzini     }
26306e790746SPaolo Bonzini 
263151b19ebeSPaolo Bonzini     for (;;) {
2632bd89dd98SJason Wang         ssize_t ret;
263351b19ebeSPaolo Bonzini         unsigned int out_num;
263451b19ebeSPaolo Bonzini         struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg;
2635feb93f36SJason Wang         struct virtio_net_hdr_mrg_rxbuf mhdr;
26366e790746SPaolo Bonzini 
263751b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement));
263851b19ebeSPaolo Bonzini         if (!elem) {
263951b19ebeSPaolo Bonzini             break;
264051b19ebeSPaolo Bonzini         }
264151b19ebeSPaolo Bonzini 
264251b19ebeSPaolo Bonzini         out_num = elem->out_num;
264351b19ebeSPaolo Bonzini         out_sg = elem->out_sg;
26446e790746SPaolo Bonzini         if (out_num < 1) {
2645fa5e56c2SGreg Kurz             virtio_error(vdev, "virtio-net header not in first element");
2646fa5e56c2SGreg Kurz             virtqueue_detach_element(q->tx_vq, elem, 0);
2647fa5e56c2SGreg Kurz             g_free(elem);
2648fa5e56c2SGreg Kurz             return -EINVAL;
26496e790746SPaolo Bonzini         }
26506e790746SPaolo Bonzini 
2651032a74a1SCédric Le Goater         if (n->has_vnet_hdr) {
2652feb93f36SJason Wang             if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) <
2653feb93f36SJason Wang                 n->guest_hdr_len) {
2654fa5e56c2SGreg Kurz                 virtio_error(vdev, "virtio-net header incorrect");
2655fa5e56c2SGreg Kurz                 virtqueue_detach_element(q->tx_vq, elem, 0);
2656fa5e56c2SGreg Kurz                 g_free(elem);
2657fa5e56c2SGreg Kurz                 return -EINVAL;
2658032a74a1SCédric Le Goater             }
26591bfa316cSGreg Kurz             if (n->needs_vnet_hdr_swap) {
2660feb93f36SJason Wang                 virtio_net_hdr_swap(vdev, (void *) &mhdr);
2661feb93f36SJason Wang                 sg2[0].iov_base = &mhdr;
2662feb93f36SJason Wang                 sg2[0].iov_len = n->guest_hdr_len;
2663feb93f36SJason Wang                 out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1,
2664feb93f36SJason Wang                                    out_sg, out_num,
2665feb93f36SJason Wang                                    n->guest_hdr_len, -1);
2666feb93f36SJason Wang                 if (out_num == VIRTQUEUE_MAX_SIZE) {
2667feb93f36SJason Wang                     goto drop;
2668032a74a1SCédric Le Goater                 }
2669feb93f36SJason Wang                 out_num += 1;
2670feb93f36SJason Wang                 out_sg = sg2;
2671feb93f36SJason Wang             }
2672feb93f36SJason Wang         }
26736e790746SPaolo Bonzini         /*
26746e790746SPaolo Bonzini          * If host wants to see the guest header as is, we can
26756e790746SPaolo Bonzini          * pass it on unchanged. Otherwise, copy just the parts
26766e790746SPaolo Bonzini          * that host is interested in.
26776e790746SPaolo Bonzini          */
26786e790746SPaolo Bonzini         assert(n->host_hdr_len <= n->guest_hdr_len);
26796e790746SPaolo Bonzini         if (n->host_hdr_len != n->guest_hdr_len) {
26806e790746SPaolo Bonzini             unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
26816e790746SPaolo Bonzini                                        out_sg, out_num,
26826e790746SPaolo Bonzini                                        0, n->host_hdr_len);
26836e790746SPaolo Bonzini             sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
26846e790746SPaolo Bonzini                              out_sg, out_num,
26856e790746SPaolo Bonzini                              n->guest_hdr_len, -1);
26866e790746SPaolo Bonzini             out_num = sg_num;
26876e790746SPaolo Bonzini             out_sg = sg;
26886e790746SPaolo Bonzini         }
26896e790746SPaolo Bonzini 
26906e790746SPaolo Bonzini         ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
26916e790746SPaolo Bonzini                                       out_sg, out_num, virtio_net_tx_complete);
26926e790746SPaolo Bonzini         if (ret == 0) {
26936e790746SPaolo Bonzini             virtio_queue_set_notification(q->tx_vq, 0);
26946e790746SPaolo Bonzini             q->async_tx.elem = elem;
26956e790746SPaolo Bonzini             return -EBUSY;
26966e790746SPaolo Bonzini         }
26976e790746SPaolo Bonzini 
2698feb93f36SJason Wang drop:
269951b19ebeSPaolo Bonzini         virtqueue_push(q->tx_vq, elem, 0);
270017a0ca55SKONRAD Frederic         virtio_notify(vdev, q->tx_vq);
270151b19ebeSPaolo Bonzini         g_free(elem);
27026e790746SPaolo Bonzini 
27036e790746SPaolo Bonzini         if (++num_packets >= n->tx_burst) {
27046e790746SPaolo Bonzini             break;
27056e790746SPaolo Bonzini         }
27066e790746SPaolo Bonzini     }
27076e790746SPaolo Bonzini     return num_packets;
27086e790746SPaolo Bonzini }
27096e790746SPaolo Bonzini 
27107550a822SLaurent Vivier static void virtio_net_tx_timer(void *opaque);
27117550a822SLaurent Vivier 
27126e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
27136e790746SPaolo Bonzini {
271417a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
27156e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
27166e790746SPaolo Bonzini 
2717283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2718283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2719283e2c2aSYuri Benditovich         return;
2720283e2c2aSYuri Benditovich     }
2721283e2c2aSYuri Benditovich 
27226e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
272317a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
27246e790746SPaolo Bonzini         q->tx_waiting = 1;
27256e790746SPaolo Bonzini         return;
27266e790746SPaolo Bonzini     }
27276e790746SPaolo Bonzini 
27286e790746SPaolo Bonzini     if (q->tx_waiting) {
27297550a822SLaurent Vivier         /* We already have queued packets, immediately flush */
2730bc72ad67SAlex Bligh         timer_del(q->tx_timer);
27317550a822SLaurent Vivier         virtio_net_tx_timer(q);
27326e790746SPaolo Bonzini     } else {
27337550a822SLaurent Vivier         /* re-arm timer to flush it (and more) on next tick */
2734bc72ad67SAlex Bligh         timer_mod(q->tx_timer,
2735bc72ad67SAlex Bligh                   qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
27366e790746SPaolo Bonzini         q->tx_waiting = 1;
27376e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 0);
27386e790746SPaolo Bonzini     }
27396e790746SPaolo Bonzini }
27406e790746SPaolo Bonzini 
27416e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
27426e790746SPaolo Bonzini {
274317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
27446e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
27456e790746SPaolo Bonzini 
2746283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2747283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2748283e2c2aSYuri Benditovich         return;
2749283e2c2aSYuri Benditovich     }
2750283e2c2aSYuri Benditovich 
27516e790746SPaolo Bonzini     if (unlikely(q->tx_waiting)) {
27526e790746SPaolo Bonzini         return;
27536e790746SPaolo Bonzini     }
27546e790746SPaolo Bonzini     q->tx_waiting = 1;
27556e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
275617a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
27576e790746SPaolo Bonzini         return;
27586e790746SPaolo Bonzini     }
27596e790746SPaolo Bonzini     virtio_queue_set_notification(vq, 0);
27606e790746SPaolo Bonzini     qemu_bh_schedule(q->tx_bh);
27616e790746SPaolo Bonzini }
27626e790746SPaolo Bonzini 
27636e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque)
27646e790746SPaolo Bonzini {
27656e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
27666e790746SPaolo Bonzini     VirtIONet *n = q->n;
276717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
27687550a822SLaurent Vivier     int ret;
27697550a822SLaurent Vivier 
2770e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2771e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2772e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2773e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2774e8bcf842SMichael S. Tsirkin         return;
2775e8bcf842SMichael S. Tsirkin     }
27766e790746SPaolo Bonzini 
27776e790746SPaolo Bonzini     q->tx_waiting = 0;
27786e790746SPaolo Bonzini 
27796e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
278017a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
27816e790746SPaolo Bonzini         return;
278217a0ca55SKONRAD Frederic     }
27836e790746SPaolo Bonzini 
27847550a822SLaurent Vivier     ret = virtio_net_flush_tx(q);
27857550a822SLaurent Vivier     if (ret == -EBUSY || ret == -EINVAL) {
27867550a822SLaurent Vivier         return;
27877550a822SLaurent Vivier     }
27887550a822SLaurent Vivier     /*
27897550a822SLaurent Vivier      * If we flush a full burst of packets, assume there are
27907550a822SLaurent Vivier      * more coming and immediately rearm
27917550a822SLaurent Vivier      */
27927550a822SLaurent Vivier     if (ret >= n->tx_burst) {
27937550a822SLaurent Vivier         q->tx_waiting = 1;
27947550a822SLaurent Vivier         timer_mod(q->tx_timer,
27957550a822SLaurent Vivier                   qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
27967550a822SLaurent Vivier         return;
27977550a822SLaurent Vivier     }
27987550a822SLaurent Vivier     /*
27997550a822SLaurent Vivier      * If less than a full burst, re-enable notification and flush
28007550a822SLaurent Vivier      * anything that may have come in while we weren't looking.  If
28017550a822SLaurent Vivier      * we find something, assume the guest is still active and rearm
28027550a822SLaurent Vivier      */
28036e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
28047550a822SLaurent Vivier     ret = virtio_net_flush_tx(q);
28057550a822SLaurent Vivier     if (ret > 0) {
28067550a822SLaurent Vivier         virtio_queue_set_notification(q->tx_vq, 0);
28077550a822SLaurent Vivier         q->tx_waiting = 1;
28087550a822SLaurent Vivier         timer_mod(q->tx_timer,
28097550a822SLaurent Vivier                   qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
28107550a822SLaurent Vivier     }
28116e790746SPaolo Bonzini }
28126e790746SPaolo Bonzini 
28136e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque)
28146e790746SPaolo Bonzini {
28156e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
28166e790746SPaolo Bonzini     VirtIONet *n = q->n;
281717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
28186e790746SPaolo Bonzini     int32_t ret;
28196e790746SPaolo Bonzini 
2820e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2821e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2822e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2823e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2824e8bcf842SMichael S. Tsirkin         return;
2825e8bcf842SMichael S. Tsirkin     }
28266e790746SPaolo Bonzini 
28276e790746SPaolo Bonzini     q->tx_waiting = 0;
28286e790746SPaolo Bonzini 
28296e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
283017a0ca55SKONRAD Frederic     if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
28316e790746SPaolo Bonzini         return;
283217a0ca55SKONRAD Frederic     }
28336e790746SPaolo Bonzini 
28346e790746SPaolo Bonzini     ret = virtio_net_flush_tx(q);
2835fa5e56c2SGreg Kurz     if (ret == -EBUSY || ret == -EINVAL) {
2836fa5e56c2SGreg Kurz         return; /* Notification re-enable handled by tx_complete or device
2837fa5e56c2SGreg Kurz                  * broken */
28386e790746SPaolo Bonzini     }
28396e790746SPaolo Bonzini 
28406e790746SPaolo Bonzini     /* If we flush a full burst of packets, assume there are
28416e790746SPaolo Bonzini      * more coming and immediately reschedule */
28426e790746SPaolo Bonzini     if (ret >= n->tx_burst) {
28436e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
28446e790746SPaolo Bonzini         q->tx_waiting = 1;
28456e790746SPaolo Bonzini         return;
28466e790746SPaolo Bonzini     }
28476e790746SPaolo Bonzini 
28486e790746SPaolo Bonzini     /* If less than a full burst, re-enable notification and flush
28496e790746SPaolo Bonzini      * anything that may have come in while we weren't looking.  If
28506e790746SPaolo Bonzini      * we find something, assume the guest is still active and reschedule */
28516e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2852fa5e56c2SGreg Kurz     ret = virtio_net_flush_tx(q);
2853fa5e56c2SGreg Kurz     if (ret == -EINVAL) {
2854fa5e56c2SGreg Kurz         return;
2855fa5e56c2SGreg Kurz     } else if (ret > 0) {
28566e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
28576e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
28586e790746SPaolo Bonzini         q->tx_waiting = 1;
28596e790746SPaolo Bonzini     }
28606e790746SPaolo Bonzini }
28616e790746SPaolo Bonzini 
2862f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index)
2863f9d6dbf0SWen Congyang {
2864f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2865f9d6dbf0SWen Congyang 
28661c0fbfa3SMichael S. Tsirkin     n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size,
28671c0fbfa3SMichael S. Tsirkin                                            virtio_net_handle_rx);
28689b02e161SWei Wang 
2869f9d6dbf0SWen Congyang     if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
2870f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
28719b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
28729b02e161SWei Wang                              virtio_net_handle_tx_timer);
2873f9d6dbf0SWen Congyang         n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
2874f9d6dbf0SWen Congyang                                               virtio_net_tx_timer,
2875f9d6dbf0SWen Congyang                                               &n->vqs[index]);
2876f9d6dbf0SWen Congyang     } else {
2877f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
28789b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
28799b02e161SWei Wang                              virtio_net_handle_tx_bh);
2880f9d6dbf0SWen Congyang         n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]);
2881f9d6dbf0SWen Congyang     }
2882f9d6dbf0SWen Congyang 
2883f9d6dbf0SWen Congyang     n->vqs[index].tx_waiting = 0;
2884f9d6dbf0SWen Congyang     n->vqs[index].n = n;
2885f9d6dbf0SWen Congyang }
2886f9d6dbf0SWen Congyang 
2887f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index)
2888f9d6dbf0SWen Congyang {
2889f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2890f9d6dbf0SWen Congyang     VirtIONetQueue *q = &n->vqs[index];
2891f9d6dbf0SWen Congyang     NetClientState *nc = qemu_get_subqueue(n->nic, index);
2892f9d6dbf0SWen Congyang 
2893f9d6dbf0SWen Congyang     qemu_purge_queued_packets(nc);
2894f9d6dbf0SWen Congyang 
2895f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2);
2896f9d6dbf0SWen Congyang     if (q->tx_timer) {
2897f9d6dbf0SWen Congyang         timer_free(q->tx_timer);
2898f989c30cSYunjian Wang         q->tx_timer = NULL;
2899f9d6dbf0SWen Congyang     } else {
2900f9d6dbf0SWen Congyang         qemu_bh_delete(q->tx_bh);
2901f989c30cSYunjian Wang         q->tx_bh = NULL;
2902f9d6dbf0SWen Congyang     }
2903f989c30cSYunjian Wang     q->tx_waiting = 0;
2904f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2 + 1);
2905f9d6dbf0SWen Congyang }
2906f9d6dbf0SWen Congyang 
2907441537f1SJason Wang static void virtio_net_change_num_queue_pairs(VirtIONet *n, int new_max_queue_pairs)
2908f9d6dbf0SWen Congyang {
2909f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2910f9d6dbf0SWen Congyang     int old_num_queues = virtio_get_num_queues(vdev);
2911441537f1SJason Wang     int new_num_queues = new_max_queue_pairs * 2 + 1;
2912f9d6dbf0SWen Congyang     int i;
2913f9d6dbf0SWen Congyang 
2914f9d6dbf0SWen Congyang     assert(old_num_queues >= 3);
2915f9d6dbf0SWen Congyang     assert(old_num_queues % 2 == 1);
2916f9d6dbf0SWen Congyang 
2917f9d6dbf0SWen Congyang     if (old_num_queues == new_num_queues) {
2918f9d6dbf0SWen Congyang         return;
2919f9d6dbf0SWen Congyang     }
2920f9d6dbf0SWen Congyang 
2921f9d6dbf0SWen Congyang     /*
2922f9d6dbf0SWen Congyang      * We always need to remove and add ctrl vq if
2923f9d6dbf0SWen Congyang      * old_num_queues != new_num_queues. Remove ctrl_vq first,
292420f86a75SYuval Shaia      * and then we only enter one of the following two loops.
2925f9d6dbf0SWen Congyang      */
2926f9d6dbf0SWen Congyang     virtio_del_queue(vdev, old_num_queues - 1);
2927f9d6dbf0SWen Congyang 
2928f9d6dbf0SWen Congyang     for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) {
2929f9d6dbf0SWen Congyang         /* new_num_queues < old_num_queues */
2930f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i / 2);
2931f9d6dbf0SWen Congyang     }
2932f9d6dbf0SWen Congyang 
2933f9d6dbf0SWen Congyang     for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) {
2934f9d6dbf0SWen Congyang         /* new_num_queues > old_num_queues */
2935f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i / 2);
2936f9d6dbf0SWen Congyang     }
2937f9d6dbf0SWen Congyang 
2938f9d6dbf0SWen Congyang     /* add ctrl_vq last */
2939f9d6dbf0SWen Congyang     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
2940f9d6dbf0SWen Congyang }
2941f9d6dbf0SWen Congyang 
2942ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
29436e790746SPaolo Bonzini {
2944441537f1SJason Wang     int max = multiqueue ? n->max_queue_pairs : 1;
2945f9d6dbf0SWen Congyang 
29466e790746SPaolo Bonzini     n->multiqueue = multiqueue;
2947441537f1SJason Wang     virtio_net_change_num_queue_pairs(n, max);
29486e790746SPaolo Bonzini 
2949441537f1SJason Wang     virtio_net_set_queue_pairs(n);
29506e790746SPaolo Bonzini }
29516e790746SPaolo Bonzini 
2952982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id)
2953037dab2fSGreg Kurz {
2954982b78c5SDr. David Alan Gilbert     VirtIONet *n = opaque;
2955982b78c5SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2956037dab2fSGreg Kurz     int i, link_down;
2957037dab2fSGreg Kurz 
29589d8c6a25SDr. David Alan Gilbert     trace_virtio_net_post_load_device();
2959982b78c5SDr. David Alan Gilbert     virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs,
296095129d6fSCornelia Huck                                virtio_vdev_has_feature(vdev,
2961e22f0603SYuri Benditovich                                                        VIRTIO_F_VERSION_1),
2962e22f0603SYuri Benditovich                                virtio_vdev_has_feature(vdev,
2963e22f0603SYuri Benditovich                                                        VIRTIO_NET_F_HASH_REPORT));
29646e790746SPaolo Bonzini 
29656e790746SPaolo Bonzini     /* MAC_TABLE_ENTRIES may be different from the saved image */
2966982b78c5SDr. David Alan Gilbert     if (n->mac_table.in_use > MAC_TABLE_ENTRIES) {
29676e790746SPaolo Bonzini         n->mac_table.in_use = 0;
29686e790746SPaolo Bonzini     }
29696e790746SPaolo Bonzini 
2970982b78c5SDr. David Alan Gilbert     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
29716c666823SMichael S. Tsirkin         n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
29726c666823SMichael S. Tsirkin     }
29736c666823SMichael S. Tsirkin 
29747788c3f2SMikhail Sennikovsky     /*
29757788c3f2SMikhail Sennikovsky      * curr_guest_offloads will be later overwritten by the
29767788c3f2SMikhail Sennikovsky      * virtio_set_features_nocheck call done from the virtio_load.
29777788c3f2SMikhail Sennikovsky      * Here we make sure it is preserved and restored accordingly
29787788c3f2SMikhail Sennikovsky      * in the virtio_net_post_load_virtio callback.
29797788c3f2SMikhail Sennikovsky      */
29807788c3f2SMikhail Sennikovsky     n->saved_guest_offloads = n->curr_guest_offloads;
29816c666823SMichael S. Tsirkin 
2982441537f1SJason Wang     virtio_net_set_queue_pairs(n);
29836e790746SPaolo Bonzini 
29846e790746SPaolo Bonzini     /* Find the first multicast entry in the saved MAC filter */
29856e790746SPaolo Bonzini     for (i = 0; i < n->mac_table.in_use; i++) {
29866e790746SPaolo Bonzini         if (n->mac_table.macs[i * ETH_ALEN] & 1) {
29876e790746SPaolo Bonzini             break;
29886e790746SPaolo Bonzini         }
29896e790746SPaolo Bonzini     }
29906e790746SPaolo Bonzini     n->mac_table.first_multi = i;
29916e790746SPaolo Bonzini 
29926e790746SPaolo Bonzini     /* nc.link_down can't be migrated, so infer link_down according
29936e790746SPaolo Bonzini      * to link status bit in n->status */
29946e790746SPaolo Bonzini     link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
2995441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
29966e790746SPaolo Bonzini         qemu_get_subqueue(n->nic, i)->link_down = link_down;
29976e790746SPaolo Bonzini     }
29986e790746SPaolo Bonzini 
29996c666823SMichael S. Tsirkin     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
30006c666823SMichael S. Tsirkin         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
30019d8c6a25SDr. David Alan Gilbert         qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
30029d8c6a25SDr. David Alan Gilbert                                   QEMU_CLOCK_VIRTUAL,
30039d8c6a25SDr. David Alan Gilbert                                   virtio_net_announce_timer, n);
30049d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
30059d8c6a25SDr. David Alan Gilbert             timer_mod(n->announce_timer.tm,
30069d8c6a25SDr. David Alan Gilbert                       qemu_clock_get_ms(n->announce_timer.type));
30079d8c6a25SDr. David Alan Gilbert         } else {
3008944458b6SDr. David Alan Gilbert             qemu_announce_timer_del(&n->announce_timer, false);
30099d8c6a25SDr. David Alan Gilbert         }
30106c666823SMichael S. Tsirkin     }
30116c666823SMichael S. Tsirkin 
3012e41b7114SYuri Benditovich     if (n->rss_data.enabled) {
30130145c393SAndrew Melnychenko         n->rss_data.enabled_software_rss = n->rss_data.populate_hash;
30140145c393SAndrew Melnychenko         if (!n->rss_data.populate_hash) {
30150145c393SAndrew Melnychenko             if (!virtio_net_attach_epbf_rss(n)) {
30160145c393SAndrew Melnychenko                 if (get_vhost_net(qemu_get_queue(n->nic)->peer)) {
30170145c393SAndrew Melnychenko                     warn_report("Can't post-load eBPF RSS for vhost");
30180145c393SAndrew Melnychenko                 } else {
30190145c393SAndrew Melnychenko                     warn_report("Can't post-load eBPF RSS - "
30200145c393SAndrew Melnychenko                                 "fallback to software RSS");
30210145c393SAndrew Melnychenko                     n->rss_data.enabled_software_rss = true;
30220145c393SAndrew Melnychenko                 }
30230145c393SAndrew Melnychenko             }
30240145c393SAndrew Melnychenko         }
30250145c393SAndrew Melnychenko 
3026e41b7114SYuri Benditovich         trace_virtio_net_rss_enable(n->rss_data.hash_types,
3027e41b7114SYuri Benditovich                                     n->rss_data.indirections_len,
3028e41b7114SYuri Benditovich                                     sizeof(n->rss_data.key));
3029e41b7114SYuri Benditovich     } else {
3030e41b7114SYuri Benditovich         trace_virtio_net_rss_disable();
3031e41b7114SYuri Benditovich     }
30326e790746SPaolo Bonzini     return 0;
30336e790746SPaolo Bonzini }
30346e790746SPaolo Bonzini 
30357788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev)
30367788c3f2SMikhail Sennikovsky {
30377788c3f2SMikhail Sennikovsky     VirtIONet *n = VIRTIO_NET(vdev);
30387788c3f2SMikhail Sennikovsky     /*
30397788c3f2SMikhail Sennikovsky      * The actual needed state is now in saved_guest_offloads,
30407788c3f2SMikhail Sennikovsky      * see virtio_net_post_load_device for detail.
30417788c3f2SMikhail Sennikovsky      * Restore it back and apply the desired offloads.
30427788c3f2SMikhail Sennikovsky      */
30437788c3f2SMikhail Sennikovsky     n->curr_guest_offloads = n->saved_guest_offloads;
30447788c3f2SMikhail Sennikovsky     if (peer_has_vnet_hdr(n)) {
30457788c3f2SMikhail Sennikovsky         virtio_net_apply_guest_offloads(n);
30467788c3f2SMikhail Sennikovsky     }
30477788c3f2SMikhail Sennikovsky 
30487788c3f2SMikhail Sennikovsky     return 0;
30497788c3f2SMikhail Sennikovsky }
30507788c3f2SMikhail Sennikovsky 
3051982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */
3052982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = {
3053982b78c5SDr. David Alan Gilbert     .name = "virtio-net-queue-tx_waiting",
3054982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
3055982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(tx_waiting, VirtIONetQueue),
3056982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3057982b78c5SDr. David Alan Gilbert    },
3058982b78c5SDr. David Alan Gilbert };
3059982b78c5SDr. David Alan Gilbert 
3060441537f1SJason Wang static bool max_queue_pairs_gt_1(void *opaque, int version_id)
3061982b78c5SDr. David Alan Gilbert {
3062441537f1SJason Wang     return VIRTIO_NET(opaque)->max_queue_pairs > 1;
3063982b78c5SDr. David Alan Gilbert }
3064982b78c5SDr. David Alan Gilbert 
3065982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id)
3066982b78c5SDr. David Alan Gilbert {
3067982b78c5SDr. David Alan Gilbert     return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque),
3068982b78c5SDr. David Alan Gilbert                                    VIRTIO_NET_F_CTRL_GUEST_OFFLOADS);
3069982b78c5SDr. David Alan Gilbert }
3070982b78c5SDr. David Alan Gilbert 
3071982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id)
3072982b78c5SDr. David Alan Gilbert {
3073982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES;
3074982b78c5SDr. David Alan Gilbert }
3075982b78c5SDr. David Alan Gilbert 
/* vmstate field predicate: the exact negation of mac_table_fits(). */
static bool mac_table_doesnt_fit(void *opaque, int version_id)
{
    if (mac_table_fits(opaque, version_id)) {
        return false;
    }
    return true;
}
3080982b78c5SDr. David Alan Gilbert 
3081982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods
3082982b78c5SDr. David Alan Gilbert  * although only some fields are used by each.
3083982b78c5SDr. David Alan Gilbert  */
3084982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp {
3085982b78c5SDr. David Alan Gilbert     VirtIONet      *parent;
3086982b78c5SDr. David Alan Gilbert     VirtIONetQueue *vqs_1;
3087441537f1SJason Wang     uint16_t        curr_queue_pairs_1;
3088982b78c5SDr. David Alan Gilbert     uint8_t         has_ufo;
3089982b78c5SDr. David Alan Gilbert     uint32_t        has_vnet_hdr;
3090982b78c5SDr. David Alan Gilbert };
3091982b78c5SDr. David Alan Gilbert 
3092982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than
3093441537f1SJason Wang  * the 1st entry in the queue_pairs and only if there's more than one
3094982b78c5SDr. David Alan Gilbert  * entry.  We use the tmp mechanism to calculate a temporary
3095982b78c5SDr. David Alan Gilbert  * pointer and count and also validate the count.
3096982b78c5SDr. David Alan Gilbert  */
3097982b78c5SDr. David Alan Gilbert 
309844b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque)
3099982b78c5SDr. David Alan Gilbert {
3100982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3101982b78c5SDr. David Alan Gilbert 
3102982b78c5SDr. David Alan Gilbert     tmp->vqs_1 = tmp->parent->vqs + 1;
3103441537f1SJason Wang     tmp->curr_queue_pairs_1 = tmp->parent->curr_queue_pairs - 1;
3104441537f1SJason Wang     if (tmp->parent->curr_queue_pairs == 0) {
3105441537f1SJason Wang         tmp->curr_queue_pairs_1 = 0;
3106982b78c5SDr. David Alan Gilbert     }
310744b1ff31SDr. David Alan Gilbert 
310844b1ff31SDr. David Alan Gilbert     return 0;
3109982b78c5SDr. David Alan Gilbert }
3110982b78c5SDr. David Alan Gilbert 
3111982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque)
3112982b78c5SDr. David Alan Gilbert {
3113982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3114982b78c5SDr. David Alan Gilbert 
3115982b78c5SDr. David Alan Gilbert     /* Reuse the pointer setup from save */
3116982b78c5SDr. David Alan Gilbert     virtio_net_tx_waiting_pre_save(opaque);
3117982b78c5SDr. David Alan Gilbert 
3118441537f1SJason Wang     if (tmp->parent->curr_queue_pairs > tmp->parent->max_queue_pairs) {
3119441537f1SJason Wang         error_report("virtio-net: curr_queue_pairs %x > max_queue_pairs %x",
3120441537f1SJason Wang             tmp->parent->curr_queue_pairs, tmp->parent->max_queue_pairs);
3121982b78c5SDr. David Alan Gilbert 
3122982b78c5SDr. David Alan Gilbert         return -EINVAL;
3123982b78c5SDr. David Alan Gilbert     }
3124982b78c5SDr. David Alan Gilbert 
3125982b78c5SDr. David Alan Gilbert     return 0; /* all good */
3126982b78c5SDr. David Alan Gilbert }
3127982b78c5SDr. David Alan Gilbert 
3128982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = {
3129982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-tx_waiting",
3130982b78c5SDr. David Alan Gilbert     .pre_load  = virtio_net_tx_waiting_pre_load,
3131982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_tx_waiting_pre_save,
3132982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3133982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp,
3134441537f1SJason Wang                                      curr_queue_pairs_1,
3135982b78c5SDr. David Alan Gilbert                                      vmstate_virtio_net_queue_tx_waiting,
3136982b78c5SDr. David Alan Gilbert                                      struct VirtIONetQueue),
3137982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3138982b78c5SDr. David Alan Gilbert     },
3139982b78c5SDr. David Alan Gilbert };
3140982b78c5SDr. David Alan Gilbert 
3141982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the
3142982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
3143982b78c5SDr. David Alan Gilbert  */
3144982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id)
3145982b78c5SDr. David Alan Gilbert {
3146982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3147982b78c5SDr. David Alan Gilbert 
3148982b78c5SDr. David Alan Gilbert     if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) {
3149982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires TUN_F_UFO support");
3150982b78c5SDr. David Alan Gilbert         return -EINVAL;
3151982b78c5SDr. David Alan Gilbert     }
3152982b78c5SDr. David Alan Gilbert 
3153982b78c5SDr. David Alan Gilbert     return 0;
3154982b78c5SDr. David Alan Gilbert }
3155982b78c5SDr. David Alan Gilbert 
315644b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque)
3157982b78c5SDr. David Alan Gilbert {
3158982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3159982b78c5SDr. David Alan Gilbert 
3160982b78c5SDr. David Alan Gilbert     tmp->has_ufo = tmp->parent->has_ufo;
316144b1ff31SDr. David Alan Gilbert 
316244b1ff31SDr. David Alan Gilbert     return 0;
3163982b78c5SDr. David Alan Gilbert }
3164982b78c5SDr. David Alan Gilbert 
3165982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = {
3166982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-ufo",
3167982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_ufo_post_load,
3168982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_ufo_pre_save,
3169982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3170982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp),
3171982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3172982b78c5SDr. David Alan Gilbert     },
3173982b78c5SDr. David Alan Gilbert };
3174982b78c5SDr. David Alan Gilbert 
3175982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the
3176982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
3177982b78c5SDr. David Alan Gilbert  */
3178982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id)
3179982b78c5SDr. David Alan Gilbert {
3180982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3181982b78c5SDr. David Alan Gilbert 
3182982b78c5SDr. David Alan Gilbert     if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) {
3183982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires vnet_hdr=on");
3184982b78c5SDr. David Alan Gilbert         return -EINVAL;
3185982b78c5SDr. David Alan Gilbert     }
3186982b78c5SDr. David Alan Gilbert 
3187982b78c5SDr. David Alan Gilbert     return 0;
3188982b78c5SDr. David Alan Gilbert }
3189982b78c5SDr. David Alan Gilbert 
319044b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque)
3191982b78c5SDr. David Alan Gilbert {
3192982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3193982b78c5SDr. David Alan Gilbert 
3194982b78c5SDr. David Alan Gilbert     tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr;
319544b1ff31SDr. David Alan Gilbert 
319644b1ff31SDr. David Alan Gilbert     return 0;
3197982b78c5SDr. David Alan Gilbert }
3198982b78c5SDr. David Alan Gilbert 
3199982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = {
3200982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-vnet",
3201982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_vnet_post_load,
3202982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_vnet_pre_save,
3203982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3204982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp),
3205982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3206982b78c5SDr. David Alan Gilbert     },
3207982b78c5SDr. David Alan Gilbert };
3208982b78c5SDr. David Alan Gilbert 
3209e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque)
3210e41b7114SYuri Benditovich {
3211e41b7114SYuri Benditovich     return VIRTIO_NET(opaque)->rss_data.enabled;
3212e41b7114SYuri Benditovich }
3213e41b7114SYuri Benditovich 
3214e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = {
3215e41b7114SYuri Benditovich     .name      = "virtio-net-device/rss",
3216e41b7114SYuri Benditovich     .version_id = 1,
3217e41b7114SYuri Benditovich     .minimum_version_id = 1,
3218e41b7114SYuri Benditovich     .needed = virtio_net_rss_needed,
3219e41b7114SYuri Benditovich     .fields = (VMStateField[]) {
3220e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.enabled, VirtIONet),
3221e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.redirect, VirtIONet),
3222e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.populate_hash, VirtIONet),
3223e41b7114SYuri Benditovich         VMSTATE_UINT32(rss_data.hash_types, VirtIONet),
3224e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.indirections_len, VirtIONet),
3225e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.default_queue, VirtIONet),
3226e41b7114SYuri Benditovich         VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet,
3227e41b7114SYuri Benditovich                             VIRTIO_NET_RSS_MAX_KEY_SIZE),
3228e41b7114SYuri Benditovich         VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet,
3229e41b7114SYuri Benditovich                                     rss_data.indirections_len, 0,
3230e41b7114SYuri Benditovich                                     vmstate_info_uint16, uint16_t),
3231e41b7114SYuri Benditovich         VMSTATE_END_OF_LIST()
3232e41b7114SYuri Benditovich     },
3233e41b7114SYuri Benditovich };
3234e41b7114SYuri Benditovich 
/*
 * Main migration description of the virtio-net device state
 * ("virtio-net-device").
 *
 * Both version_id and minimum_version_id are VIRTIO_NET_VM_VERSION, and
 * virtio_net_post_load_device() runs as the post_load hook.  Several
 * entries are conditional on test callbacks (mac_table_fits,
 * mac_table_doesnt_fit, max_queue_pairs_gt_1, has_ctrl_guest_offloads),
 * and the RSS state is attached as the only subsection.
 *
 * NOTE(review): the order of the entries presumably defines the stream
 * layout, so they should not be reordered - confirm before touching.
 */
3235982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = {
3236982b78c5SDr. David Alan Gilbert     .name = "virtio-net-device",
3237982b78c5SDr. David Alan Gilbert     .version_id = VIRTIO_NET_VM_VERSION,
3238982b78c5SDr. David Alan Gilbert     .minimum_version_id = VIRTIO_NET_VM_VERSION,
3239982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_post_load_device,
3240982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
3241982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN),
3242982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_POINTER(vqs, VirtIONet,
3243982b78c5SDr. David Alan Gilbert                                vmstate_virtio_net_queue_tx_waiting,
3244982b78c5SDr. David Alan Gilbert                                VirtIONetQueue),
3245982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet),
3246982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16(status, VirtIONet),
3247982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(promisc, VirtIONet),
3248982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(allmulti, VirtIONet),
3249982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mac_table.in_use, VirtIONet),
3250982b78c5SDr. David Alan Gilbert 
3251982b78c5SDr. David Alan Gilbert         /* Guarded pair: If it fits we load it, else we throw it away
3252982b78c5SDr. David Alan Gilbert          * - can happen if source has a larger MAC table.; post-load
3253982b78c5SDr. David Alan Gilbert          *  sets flags in this case.
3254982b78c5SDr. David Alan Gilbert          */
3255982b78c5SDr. David Alan Gilbert         VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet,
3256982b78c5SDr. David Alan Gilbert                                 0, mac_table_fits, mac_table.in_use,
3257982b78c5SDr. David Alan Gilbert                                  ETH_ALEN),
3258982b78c5SDr. David Alan Gilbert         VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0,
3259982b78c5SDr. David Alan Gilbert                                      mac_table.in_use, ETH_ALEN),
3260982b78c5SDr. David Alan Gilbert 
3261982b78c5SDr. David Alan Gilbert         /* Note: This is an array of uint32's that's always been saved as a
3262982b78c5SDr. David Alan Gilbert          * buffer; hold onto your endiannesses; it's actually used as a bitmap
3263982b78c5SDr. David Alan Gilbert          * but based on the uint.
3264982b78c5SDr. David Alan Gilbert          */
3265982b78c5SDr. David Alan Gilbert         VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3),
3266982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3267982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_vnet),
3268982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet),
3269982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet),
3270982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(alluni, VirtIONet),
3271982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nomulti, VirtIONet),
3272982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nouni, VirtIONet),
3273982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nobcast, VirtIONet),
3274982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3275982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_ufo),
3276441537f1SJason Wang         VMSTATE_SINGLE_TEST(max_queue_pairs, VirtIONet, max_queue_pairs_gt_1, 0,
3277982b78c5SDr. David Alan Gilbert                             vmstate_info_uint16_equal, uint16_t),
3278441537f1SJason Wang         VMSTATE_UINT16_TEST(curr_queue_pairs, VirtIONet, max_queue_pairs_gt_1),
3279982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3280982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_tx_waiting),
3281982b78c5SDr. David Alan Gilbert         VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet,
3282982b78c5SDr. David Alan Gilbert                             has_ctrl_guest_offloads),
3283982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3284982b78c5SDr. David Alan Gilbert    },
3285e41b7114SYuri Benditovich     .subsections = (const VMStateDescription * []) {
3286e41b7114SYuri Benditovich         &vmstate_virtio_net_rss,
3287e41b7114SYuri Benditovich         NULL
3288e41b7114SYuri Benditovich     }
3289982b78c5SDr. David Alan Gilbert };
3290982b78c5SDr. David Alan Gilbert 
/*
 * Net client callbacks for the virtio-net NIC.  This table is handed to
 * qemu_new_nic() when the device is realized; it declares the client as
 * a NIC whose per-client state is a NICState and wires up the receive
 * path, link status changes, rx-filter queries and announcements.
 */
32916e790746SPaolo Bonzini static NetClientInfo net_virtio_info = {
3292f394b2e2SEric Blake     .type = NET_CLIENT_DRIVER_NIC,
32936e790746SPaolo Bonzini     .size = sizeof(NICState),
32946e790746SPaolo Bonzini     .can_receive = virtio_net_can_receive,
32956e790746SPaolo Bonzini     .receive = virtio_net_receive,
32966e790746SPaolo Bonzini     .link_status_changed = virtio_net_set_link_status,
3297b1be4280SAmos Kong     .query_rx_filter = virtio_net_query_rxfilter,
3298b2c929f0SDr. David Alan Gilbert     .announce = virtio_net_announce,
32996e790746SPaolo Bonzini };
33006e790746SPaolo Bonzini 
33016e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
33026e790746SPaolo Bonzini {
330317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
330468b0a639SSi-Wei Liu     NetClientState *nc;
33056e790746SPaolo Bonzini     assert(n->vhost_started);
330668b0a639SSi-Wei Liu     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ) && idx == 2) {
330768b0a639SSi-Wei Liu         /* Must guard against invalid features and bogus queue index
330868b0a639SSi-Wei Liu          * from being set by malicious guest, or penetrated through
330968b0a639SSi-Wei Liu          * buggy migration stream.
331068b0a639SSi-Wei Liu          */
331168b0a639SSi-Wei Liu         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
331268b0a639SSi-Wei Liu             qemu_log_mask(LOG_GUEST_ERROR,
331368b0a639SSi-Wei Liu                           "%s: bogus vq index ignored\n", __func__);
331468b0a639SSi-Wei Liu             return false;
331568b0a639SSi-Wei Liu         }
331668b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, n->max_queue_pairs);
331768b0a639SSi-Wei Liu     } else {
331868b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, vq2q(idx));
331968b0a639SSi-Wei Liu     }
3320ed8b4afeSNikolay Nikolaev     return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx);
33216e790746SPaolo Bonzini }
33226e790746SPaolo Bonzini 
33236e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
33246e790746SPaolo Bonzini                                            bool mask)
33256e790746SPaolo Bonzini {
332617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
332768b0a639SSi-Wei Liu     NetClientState *nc;
33286e790746SPaolo Bonzini     assert(n->vhost_started);
332968b0a639SSi-Wei Liu     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ) && idx == 2) {
333068b0a639SSi-Wei Liu         /* Must guard against invalid features and bogus queue index
333168b0a639SSi-Wei Liu          * from being set by malicious guest, or penetrated through
333268b0a639SSi-Wei Liu          * buggy migration stream.
333368b0a639SSi-Wei Liu          */
333468b0a639SSi-Wei Liu         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
333568b0a639SSi-Wei Liu             qemu_log_mask(LOG_GUEST_ERROR,
333668b0a639SSi-Wei Liu                           "%s: bogus vq index ignored\n", __func__);
333768b0a639SSi-Wei Liu             return;
333868b0a639SSi-Wei Liu         }
333968b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, n->max_queue_pairs);
334068b0a639SSi-Wei Liu     } else {
334168b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, vq2q(idx));
334268b0a639SSi-Wei Liu     }
3343a882b571SMichael S. Tsirkin     vhost_net_virtqueue_mask(get_vhost_net(nc->peer),
3344a882b571SMichael S. Tsirkin                              vdev, idx, mask);
33456e790746SPaolo Bonzini }
33466e790746SPaolo Bonzini 
3347019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features)
33486e790746SPaolo Bonzini {
33490cd09c3aSCornelia Huck     virtio_add_feature(&host_features, VIRTIO_NET_F_MAC);
3350a93e599dSMaxime Coquelin 
3351d74c30c8SDaniil Tatianin     n->config_size = virtio_get_config_size(&cfg_size_params, host_features);
335217ec5a86SKONRAD Frederic }
33536e790746SPaolo Bonzini 
33548a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
33558a253ec2SKONRAD Frederic                                    const char *type)
33568a253ec2SKONRAD Frederic {
33578a253ec2SKONRAD Frederic     /*
33588a253ec2SKONRAD Frederic      * The name can be NULL, the netclient name will be type.x.
33598a253ec2SKONRAD Frederic      */
33608a253ec2SKONRAD Frederic     assert(type != NULL);
33618a253ec2SKONRAD Frederic 
33628a253ec2SKONRAD Frederic     g_free(n->netclient_name);
33638a253ec2SKONRAD Frederic     g_free(n->netclient_type);
33648a253ec2SKONRAD Frederic     n->netclient_name = g_strdup(name);
33658a253ec2SKONRAD Frederic     n->netclient_type = g_strdup(type);
33668a253ec2SKONRAD Frederic }
33678a253ec2SKONRAD Frederic 
33680e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev)
33699711cd0dSJens Freimann {
33709711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
33719711cd0dSJens Freimann     PCIDevice *pci_dev;
33729711cd0dSJens Freimann     Error *err = NULL;
33739711cd0dSJens Freimann 
33740e9a65c5SJuan Quintela     hotplug_ctrl = qdev_get_hotplug_handler(dev);
33759711cd0dSJens Freimann     if (hotplug_ctrl) {
33760e9a65c5SJuan Quintela         pci_dev = PCI_DEVICE(dev);
33779711cd0dSJens Freimann         pci_dev->partially_hotplugged = true;
33780e9a65c5SJuan Quintela         hotplug_handler_unplug_request(hotplug_ctrl, dev, &err);
33799711cd0dSJens Freimann         if (err) {
33809711cd0dSJens Freimann             error_report_err(err);
33819711cd0dSJens Freimann             return false;
33829711cd0dSJens Freimann         }
33839711cd0dSJens Freimann     } else {
33849711cd0dSJens Freimann         return false;
33859711cd0dSJens Freimann     }
33869711cd0dSJens Freimann     return true;
33879711cd0dSJens Freimann }
33889711cd0dSJens Freimann 
33890e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev,
33900e9a65c5SJuan Quintela                                     Error **errp)
33919711cd0dSJens Freimann {
33925a0948d3SMarkus Armbruster     Error *err = NULL;
33939711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
33940e9a65c5SJuan Quintela     PCIDevice *pdev = PCI_DEVICE(dev);
339578274682SJuan Quintela     BusState *primary_bus;
33969711cd0dSJens Freimann 
33979711cd0dSJens Freimann     if (!pdev->partially_hotplugged) {
33989711cd0dSJens Freimann         return true;
33999711cd0dSJens Freimann     }
34000e9a65c5SJuan Quintela     primary_bus = dev->parent_bus;
340178274682SJuan Quintela     if (!primary_bus) {
3402150ab54aSJens Freimann         error_setg(errp, "virtio_net: couldn't find primary bus");
34035a0948d3SMarkus Armbruster         return false;
34049711cd0dSJens Freimann     }
34050e9a65c5SJuan Quintela     qdev_set_parent_bus(dev, primary_bus, &error_abort);
3406e2bde83eSJuan Quintela     qatomic_set(&n->failover_primary_hidden, false);
34070e9a65c5SJuan Quintela     hotplug_ctrl = qdev_get_hotplug_handler(dev);
34089711cd0dSJens Freimann     if (hotplug_ctrl) {
34090e9a65c5SJuan Quintela         hotplug_handler_pre_plug(hotplug_ctrl, dev, &err);
34105a0948d3SMarkus Armbruster         if (err) {
34115a0948d3SMarkus Armbruster             goto out;
34125a0948d3SMarkus Armbruster         }
34130e9a65c5SJuan Quintela         hotplug_handler_plug(hotplug_ctrl, dev, &err);
34149711cd0dSJens Freimann     }
3415109c20eaSLaurent Vivier     pdev->partially_hotplugged = false;
3416150ab54aSJens Freimann 
3417150ab54aSJens Freimann out:
34185a0948d3SMarkus Armbruster     error_propagate(errp, err);
34195a0948d3SMarkus Armbruster     return !err;
34209711cd0dSJens Freimann }
34219711cd0dSJens Freimann 
342207a5d816SJuan Quintela static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationState *s)
34239711cd0dSJens Freimann {
34249711cd0dSJens Freimann     bool should_be_hidden;
34259711cd0dSJens Freimann     Error *err = NULL;
342607a5d816SJuan Quintela     DeviceState *dev = failover_find_primary_device(n);
342707a5d816SJuan Quintela 
342807a5d816SJuan Quintela     if (!dev) {
342907a5d816SJuan Quintela         return;
343007a5d816SJuan Quintela     }
34319711cd0dSJens Freimann 
3432e2bde83eSJuan Quintela     should_be_hidden = qatomic_read(&n->failover_primary_hidden);
34339711cd0dSJens Freimann 
34344dbac1aeSMarkus Armbruster     if (migration_in_setup(s) && !should_be_hidden) {
343507a5d816SJuan Quintela         if (failover_unplug_primary(n, dev)) {
343607a5d816SJuan Quintela             vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev);
343707a5d816SJuan Quintela             qapi_event_send_unplug_primary(dev->id);
3438e2bde83eSJuan Quintela             qatomic_set(&n->failover_primary_hidden, true);
34399711cd0dSJens Freimann         } else {
34409711cd0dSJens Freimann             warn_report("couldn't unplug primary device");
34419711cd0dSJens Freimann         }
34429711cd0dSJens Freimann     } else if (migration_has_failed(s)) {
3443150ab54aSJens Freimann         /* We already unplugged the device let's plug it back */
344407a5d816SJuan Quintela         if (!failover_replug_primary(n, dev, &err)) {
34459711cd0dSJens Freimann             if (err) {
34469711cd0dSJens Freimann                 error_report_err(err);
34479711cd0dSJens Freimann             }
34489711cd0dSJens Freimann         }
34499711cd0dSJens Freimann     }
34509711cd0dSJens Freimann }
34519711cd0dSJens Freimann 
34529711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data)
34539711cd0dSJens Freimann {
34549711cd0dSJens Freimann     MigrationState *s = data;
34559711cd0dSJens Freimann     VirtIONet *n = container_of(notifier, VirtIONet, migration_state);
34569711cd0dSJens Freimann     virtio_net_handle_migration_primary(n, s);
34579711cd0dSJens Freimann }
34589711cd0dSJens Freimann 
3459b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener,
3460f3558b1bSKevin Wolf                                          const QDict *device_opts,
3461f3558b1bSKevin Wolf                                          bool from_json,
3462f3558b1bSKevin Wolf                                          Error **errp)
34639711cd0dSJens Freimann {
34649711cd0dSJens Freimann     VirtIONet *n = container_of(listener, VirtIONet, primary_listener);
34654f0303aeSJuan Quintela     const char *standby_id;
34669711cd0dSJens Freimann 
34674d0e59acSJens Freimann     if (!device_opts) {
346889631fedSJuan Quintela         return false;
34694d0e59acSJens Freimann     }
3470bcfc906bSLaurent Vivier 
3471bcfc906bSLaurent Vivier     if (!qdict_haskey(device_opts, "failover_pair_id")) {
3472bcfc906bSLaurent Vivier         return false;
3473bcfc906bSLaurent Vivier     }
3474bcfc906bSLaurent Vivier 
3475bcfc906bSLaurent Vivier     if (!qdict_haskey(device_opts, "id")) {
3476bcfc906bSLaurent Vivier         error_setg(errp, "Device with failover_pair_id needs to have id");
3477bcfc906bSLaurent Vivier         return false;
3478bcfc906bSLaurent Vivier     }
3479bcfc906bSLaurent Vivier 
3480bcfc906bSLaurent Vivier     standby_id = qdict_get_str(device_opts, "failover_pair_id");
348189631fedSJuan Quintela     if (g_strcmp0(standby_id, n->netclient_name) != 0) {
348289631fedSJuan Quintela         return false;
34839711cd0dSJens Freimann     }
34849711cd0dSJens Freimann 
34857fe7791eSLaurent Vivier     /*
34867fe7791eSLaurent Vivier      * The hide helper can be called several times for a given device.
34877fe7791eSLaurent Vivier      * Check there is only one primary for a virtio-net device but
34887fe7791eSLaurent Vivier      * don't duplicate the qdict several times if it's called for the same
34897fe7791eSLaurent Vivier      * device.
34907fe7791eSLaurent Vivier      */
3491259a10dbSKevin Wolf     if (n->primary_opts) {
34927fe7791eSLaurent Vivier         const char *old, *new;
34937fe7791eSLaurent Vivier         /* devices with failover_pair_id always have an id */
34947fe7791eSLaurent Vivier         old = qdict_get_str(n->primary_opts, "id");
34957fe7791eSLaurent Vivier         new = qdict_get_str(device_opts, "id");
34967fe7791eSLaurent Vivier         if (strcmp(old, new) != 0) {
34977fe7791eSLaurent Vivier             error_setg(errp, "Cannot attach more than one primary device to "
34987fe7791eSLaurent Vivier                        "'%s': '%s' and '%s'", n->netclient_name, old, new);
3499259a10dbSKevin Wolf             return false;
3500259a10dbSKevin Wolf         }
35017fe7791eSLaurent Vivier     } else {
3502f3558b1bSKevin Wolf         n->primary_opts = qdict_clone_shallow(device_opts);
3503f3558b1bSKevin Wolf         n->primary_opts_from_json = from_json;
35047fe7791eSLaurent Vivier     }
3505259a10dbSKevin Wolf 
3506e2bde83eSJuan Quintela     /* failover_primary_hidden is set during feature negotiation */
35073abad4a2SJuan Quintela     return qatomic_read(&n->failover_primary_hidden);
35089711cd0dSJens Freimann }
35099711cd0dSJens Freimann 
3510e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp)
351117ec5a86SKONRAD Frederic {
3512e6f746b3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3513284a32f0SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3514284a32f0SAndreas Färber     NetClientState *nc;
35151773d9eeSKONRAD Frederic     int i;
351617ec5a86SKONRAD Frederic 
3517a93e599dSMaxime Coquelin     if (n->net_conf.mtu) {
3518127833eeSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_MTU);
3519a93e599dSMaxime Coquelin     }
3520a93e599dSMaxime Coquelin 
35219473939eSJason Baron     if (n->net_conf.duplex_str) {
35229473939eSJason Baron         if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) {
35239473939eSJason Baron             n->net_conf.duplex = DUPLEX_HALF;
35249473939eSJason Baron         } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) {
35259473939eSJason Baron             n->net_conf.duplex = DUPLEX_FULL;
35269473939eSJason Baron         } else {
35279473939eSJason Baron             error_setg(errp, "'duplex' must be 'half' or 'full'");
3528843c4cfcSMarkus Armbruster             return;
35299473939eSJason Baron         }
35309473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
35319473939eSJason Baron     } else {
35329473939eSJason Baron         n->net_conf.duplex = DUPLEX_UNKNOWN;
35339473939eSJason Baron     }
35349473939eSJason Baron 
35359473939eSJason Baron     if (n->net_conf.speed < SPEED_UNKNOWN) {
35369473939eSJason Baron         error_setg(errp, "'speed' must be between 0 and INT_MAX");
3537843c4cfcSMarkus Armbruster         return;
3538843c4cfcSMarkus Armbruster     }
3539843c4cfcSMarkus Armbruster     if (n->net_conf.speed >= 0) {
35409473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
35419473939eSJason Baron     }
35429473939eSJason Baron 
35439711cd0dSJens Freimann     if (n->failover) {
3544b91ad981SJuan Quintela         n->primary_listener.hide_device = failover_hide_primary_device;
3545e2bde83eSJuan Quintela         qatomic_set(&n->failover_primary_hidden, true);
35469711cd0dSJens Freimann         device_listener_register(&n->primary_listener);
35479711cd0dSJens Freimann         n->migration_state.notify = virtio_net_migration_state_notifier;
35489711cd0dSJens Freimann         add_migration_state_change_notifier(&n->migration_state);
35499711cd0dSJens Freimann         n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY);
35509711cd0dSJens Freimann     }
35519711cd0dSJens Freimann 
3552da3e8a23SShannon Zhao     virtio_net_set_config_size(n, n->host_features);
35533857cd5cSJonah Palmer     virtio_init(vdev, VIRTIO_ID_NET, n->config_size);
355417ec5a86SKONRAD Frederic 
35551c0fbfa3SMichael S. Tsirkin     /*
35561c0fbfa3SMichael S. Tsirkin      * We set a lower limit on RX queue size to what it always was.
35571c0fbfa3SMichael S. Tsirkin      * Guests that want a smaller ring can always resize it without
35581c0fbfa3SMichael S. Tsirkin      * help from us (using virtio 1 and up).
35591c0fbfa3SMichael S. Tsirkin      */
35601c0fbfa3SMichael S. Tsirkin     if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE ||
35611c0fbfa3SMichael S. Tsirkin         n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE ||
35625f997fd1SMichal Privoznik         !is_power_of_2(n->net_conf.rx_queue_size)) {
35631c0fbfa3SMichael S. Tsirkin         error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), "
35641c0fbfa3SMichael S. Tsirkin                    "must be a power of 2 between %d and %d.",
35651c0fbfa3SMichael S. Tsirkin                    n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE,
35661c0fbfa3SMichael S. Tsirkin                    VIRTQUEUE_MAX_SIZE);
35671c0fbfa3SMichael S. Tsirkin         virtio_cleanup(vdev);
35681c0fbfa3SMichael S. Tsirkin         return;
35691c0fbfa3SMichael S. Tsirkin     }
35701c0fbfa3SMichael S. Tsirkin 
35719b02e161SWei Wang     if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE ||
35729b02e161SWei Wang         n->net_conf.tx_queue_size > VIRTQUEUE_MAX_SIZE ||
35739b02e161SWei Wang         !is_power_of_2(n->net_conf.tx_queue_size)) {
35749b02e161SWei Wang         error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), "
35759b02e161SWei Wang                    "must be a power of 2 between %d and %d",
35769b02e161SWei Wang                    n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE,
35779b02e161SWei Wang                    VIRTQUEUE_MAX_SIZE);
35789b02e161SWei Wang         virtio_cleanup(vdev);
35799b02e161SWei Wang         return;
35809b02e161SWei Wang     }
35819b02e161SWei Wang 
358222288fe5SJason Wang     n->max_ncs = MAX(n->nic_conf.peers.queues, 1);
358322288fe5SJason Wang 
358422288fe5SJason Wang     /*
358522288fe5SJason Wang      * Figure out the datapath queue pairs since the backend could
358622288fe5SJason Wang      * provide control queue via peers as well.
358722288fe5SJason Wang      */
358822288fe5SJason Wang     if (n->nic_conf.peers.queues) {
358922288fe5SJason Wang         for (i = 0; i < n->max_ncs; i++) {
359022288fe5SJason Wang             if (n->nic_conf.peers.ncs[i]->is_datapath) {
359122288fe5SJason Wang                 ++n->max_queue_pairs;
359222288fe5SJason Wang             }
359322288fe5SJason Wang         }
359422288fe5SJason Wang     }
359522288fe5SJason Wang     n->max_queue_pairs = MAX(n->max_queue_pairs, 1);
359622288fe5SJason Wang 
3597441537f1SJason Wang     if (n->max_queue_pairs * 2 + 1 > VIRTIO_QUEUE_MAX) {
359822288fe5SJason Wang         error_setg(errp, "Invalid number of queue pairs (= %" PRIu32 "), "
3599631b22eaSStefan Weil                    "must be a positive integer less than %d.",
3600441537f1SJason Wang                    n->max_queue_pairs, (VIRTIO_QUEUE_MAX - 1) / 2);
36017e0e736eSJason Wang         virtio_cleanup(vdev);
36027e0e736eSJason Wang         return;
36037e0e736eSJason Wang     }
3604b21e2380SMarkus Armbruster     n->vqs = g_new0(VirtIONetQueue, n->max_queue_pairs);
3605441537f1SJason Wang     n->curr_queue_pairs = 1;
36061773d9eeSKONRAD Frederic     n->tx_timeout = n->net_conf.txtimer;
36076e790746SPaolo Bonzini 
36081773d9eeSKONRAD Frederic     if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
36091773d9eeSKONRAD Frederic                        && strcmp(n->net_conf.tx, "bh")) {
36100765691eSMarkus Armbruster         warn_report("virtio-net: "
36116e790746SPaolo Bonzini                     "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
36121773d9eeSKONRAD Frederic                     n->net_conf.tx);
36130765691eSMarkus Armbruster         error_printf("Defaulting to \"bh\"");
36146e790746SPaolo Bonzini     }
36156e790746SPaolo Bonzini 
36162eef278bSMichael S. Tsirkin     n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n),
36172eef278bSMichael S. Tsirkin                                     n->net_conf.tx_queue_size);
36189b02e161SWei Wang 
3619441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
3620f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i);
3621da51a335SJason Wang     }
3622da51a335SJason Wang 
362317a0ca55SKONRAD Frederic     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
36241773d9eeSKONRAD Frederic     qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
36251773d9eeSKONRAD Frederic     memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
36266e790746SPaolo Bonzini     n->status = VIRTIO_NET_S_LINK_UP;
36279d8c6a25SDr. David Alan Gilbert     qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
36289d8c6a25SDr. David Alan Gilbert                               QEMU_CLOCK_VIRTUAL,
3629f57fcf70SJason Wang                               virtio_net_announce_timer, n);
3630b2c929f0SDr. David Alan Gilbert     n->announce_timer.round = 0;
36316e790746SPaolo Bonzini 
36328a253ec2SKONRAD Frederic     if (n->netclient_type) {
36338a253ec2SKONRAD Frederic         /*
36348a253ec2SKONRAD Frederic          * Happen when virtio_net_set_netclient_name has been called.
36358a253ec2SKONRAD Frederic          */
36368a253ec2SKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
36378a253ec2SKONRAD Frederic                               n->netclient_type, n->netclient_name, n);
36388a253ec2SKONRAD Frederic     } else {
36391773d9eeSKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
3640284a32f0SAndreas Färber                               object_get_typename(OBJECT(dev)), dev->id, n);
36418a253ec2SKONRAD Frederic     }
36428a253ec2SKONRAD Frederic 
3643441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
3644d4c62930SBin Meng         n->nic->ncs[i].do_not_pad = true;
3645d4c62930SBin Meng     }
3646d4c62930SBin Meng 
36476e790746SPaolo Bonzini     peer_test_vnet_hdr(n);
36486e790746SPaolo Bonzini     if (peer_has_vnet_hdr(n)) {
3649441537f1SJason Wang         for (i = 0; i < n->max_queue_pairs; i++) {
3650d6085e3aSStefan Hajnoczi             qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
36516e790746SPaolo Bonzini         }
36526e790746SPaolo Bonzini         n->host_hdr_len = sizeof(struct virtio_net_hdr);
36536e790746SPaolo Bonzini     } else {
36546e790746SPaolo Bonzini         n->host_hdr_len = 0;
36556e790746SPaolo Bonzini     }
36566e790746SPaolo Bonzini 
36571773d9eeSKONRAD Frederic     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
36586e790746SPaolo Bonzini 
36596e790746SPaolo Bonzini     n->vqs[0].tx_waiting = 0;
36601773d9eeSKONRAD Frederic     n->tx_burst = n->net_conf.txburst;
3661e22f0603SYuri Benditovich     virtio_net_set_mrg_rx_bufs(n, 0, 0, 0);
36626e790746SPaolo Bonzini     n->promisc = 1; /* for compatibility */
36636e790746SPaolo Bonzini 
36646e790746SPaolo Bonzini     n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
36656e790746SPaolo Bonzini 
36666e790746SPaolo Bonzini     n->vlans = g_malloc0(MAX_VLAN >> 3);
36676e790746SPaolo Bonzini 
3668b1be4280SAmos Kong     nc = qemu_get_queue(n->nic);
3669b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
3670b1be4280SAmos Kong 
3671e87936eaSCindy Lu    if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
3672e87936eaSCindy Lu         struct virtio_net_config netcfg = {};
3673e87936eaSCindy Lu         memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN);
3674e87936eaSCindy Lu         vhost_net_set_config(get_vhost_net(nc->peer),
3675e87936eaSCindy Lu             (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_MASTER);
3676e87936eaSCindy Lu     }
36772974e916SYuri Benditovich     QTAILQ_INIT(&n->rsc_chains);
3678284a32f0SAndreas Färber     n->qdev = dev;
36794474e37aSYuri Benditovich 
36804474e37aSYuri Benditovich     net_rx_pkt_init(&n->rx_pkt, false);
36810145c393SAndrew Melnychenko 
36820145c393SAndrew Melnychenko     if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) {
36830145c393SAndrew Melnychenko         virtio_net_load_ebpf(n);
36840145c393SAndrew Melnychenko     }
368517ec5a86SKONRAD Frederic }
368617ec5a86SKONRAD Frederic 
3687b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev)
368817ec5a86SKONRAD Frederic {
3689306ec6c3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3690306ec6c3SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3691441537f1SJason Wang     int i, max_queue_pairs;
369217ec5a86SKONRAD Frederic 
36930145c393SAndrew Melnychenko     if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) {
36940145c393SAndrew Melnychenko         virtio_net_unload_ebpf(n);
36950145c393SAndrew Melnychenko     }
36960145c393SAndrew Melnychenko 
369717ec5a86SKONRAD Frederic     /* This will stop vhost backend if appropriate. */
369817ec5a86SKONRAD Frederic     virtio_net_set_status(vdev, 0);
369917ec5a86SKONRAD Frederic 
37008a253ec2SKONRAD Frederic     g_free(n->netclient_name);
37018a253ec2SKONRAD Frederic     n->netclient_name = NULL;
37028a253ec2SKONRAD Frederic     g_free(n->netclient_type);
37038a253ec2SKONRAD Frederic     n->netclient_type = NULL;
37048a253ec2SKONRAD Frederic 
370517ec5a86SKONRAD Frederic     g_free(n->mac_table.macs);
370617ec5a86SKONRAD Frederic     g_free(n->vlans);
370717ec5a86SKONRAD Frederic 
37089711cd0dSJens Freimann     if (n->failover) {
3709f3558b1bSKevin Wolf         qobject_unref(n->primary_opts);
371065018100SJuan Quintela         device_listener_unregister(&n->primary_listener);
37111e157667SLaurent Vivier         remove_migration_state_change_notifier(&n->migration_state);
3712f3558b1bSKevin Wolf     } else {
3713f3558b1bSKevin Wolf         assert(n->primary_opts == NULL);
37149711cd0dSJens Freimann     }
37159711cd0dSJens Freimann 
3716441537f1SJason Wang     max_queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
3717441537f1SJason Wang     for (i = 0; i < max_queue_pairs; i++) {
3718f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i);
371917ec5a86SKONRAD Frederic     }
3720d945d9f1SYuri Benditovich     /* delete also control vq */
3721441537f1SJason Wang     virtio_del_queue(vdev, max_queue_pairs * 2);
3722944458b6SDr. David Alan Gilbert     qemu_announce_timer_del(&n->announce_timer, false);
372317ec5a86SKONRAD Frederic     g_free(n->vqs);
372417ec5a86SKONRAD Frederic     qemu_del_nic(n->nic);
37252974e916SYuri Benditovich     virtio_net_rsc_cleanup(n);
372659079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
37274474e37aSYuri Benditovich     net_rx_pkt_uninit(n->rx_pkt);
37286a1a8cc7SKONRAD Frederic     virtio_cleanup(vdev);
372917ec5a86SKONRAD Frederic }
373017ec5a86SKONRAD Frederic 
373117ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj)
373217ec5a86SKONRAD Frederic {
373317ec5a86SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(obj);
373417ec5a86SKONRAD Frederic 
373517ec5a86SKONRAD Frederic     /*
373617ec5a86SKONRAD Frederic      * The default config_size is sizeof(struct virtio_net_config).
373717ec5a86SKONRAD Frederic      * Can be overriden with virtio_net_set_config_size.
373817ec5a86SKONRAD Frederic      */
373917ec5a86SKONRAD Frederic     n->config_size = sizeof(struct virtio_net_config);
3740aa4197c3SGonglei     device_add_bootindex_property(obj, &n->nic_conf.bootindex,
3741aa4197c3SGonglei                                   "bootindex", "/ethernet-phy@0",
374240c2281cSMarkus Armbruster                                   DEVICE(n));
37430145c393SAndrew Melnychenko 
37440145c393SAndrew Melnychenko     ebpf_rss_init(&n->ebpf_rss);
374517ec5a86SKONRAD Frederic }
374617ec5a86SKONRAD Frederic 
374744b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque)
37484d45dcfbSHalil Pasic {
37494d45dcfbSHalil Pasic     VirtIONet *n = opaque;
37504d45dcfbSHalil Pasic 
37514d45dcfbSHalil Pasic     /* At this point, backend must be stopped, otherwise
37524d45dcfbSHalil Pasic      * it might keep writing to memory. */
37534d45dcfbSHalil Pasic     assert(!n->vhost_started);
375444b1ff31SDr. David Alan Gilbert 
375544b1ff31SDr. David Alan Gilbert     return 0;
37564d45dcfbSHalil Pasic }
37574d45dcfbSHalil Pasic 
37589711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque)
37599711cd0dSJens Freimann {
37609711cd0dSJens Freimann     DeviceState *dev = opaque;
376121e8709bSJuan Quintela     DeviceState *primary;
37629711cd0dSJens Freimann     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
37639711cd0dSJens Freimann     VirtIONet *n = VIRTIO_NET(vdev);
37649711cd0dSJens Freimann 
3765284f42a5SJens Freimann     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) {
3766284f42a5SJens Freimann         return false;
3767284f42a5SJens Freimann     }
376821e8709bSJuan Quintela     primary = failover_find_primary_device(n);
376921e8709bSJuan Quintela     return primary ? primary->pending_deleted_event : false;
37709711cd0dSJens Freimann }
37719711cd0dSJens Freimann 
37729711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque)
37739711cd0dSJens Freimann {
37749711cd0dSJens Freimann     DeviceState *dev = opaque;
37759711cd0dSJens Freimann     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
37769711cd0dSJens Freimann 
37779711cd0dSJens Freimann     return vdc->primary_unplug_pending(dev);
37789711cd0dSJens Freimann }
37799711cd0dSJens Freimann 
3780c255488dSJonah Palmer static struct vhost_dev *virtio_net_get_vhost(VirtIODevice *vdev)
3781c255488dSJonah Palmer {
3782c255488dSJonah Palmer     VirtIONet *n = VIRTIO_NET(vdev);
3783c255488dSJonah Palmer     NetClientState *nc = qemu_get_queue(n->nic);
3784c255488dSJonah Palmer     struct vhost_net *net = get_vhost_net(nc->peer);
3785c255488dSJonah Palmer     return &net->dev;
3786c255488dSJonah Palmer }
3787c255488dSJonah Palmer 
37884d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = {
37894d45dcfbSHalil Pasic     .name = "virtio-net",
37904d45dcfbSHalil Pasic     .minimum_version_id = VIRTIO_NET_VM_VERSION,
37914d45dcfbSHalil Pasic     .version_id = VIRTIO_NET_VM_VERSION,
37924d45dcfbSHalil Pasic     .fields = (VMStateField[]) {
37934d45dcfbSHalil Pasic         VMSTATE_VIRTIO_DEVICE,
37944d45dcfbSHalil Pasic         VMSTATE_END_OF_LIST()
37954d45dcfbSHalil Pasic     },
37964d45dcfbSHalil Pasic     .pre_save = virtio_net_pre_save,
37979711cd0dSJens Freimann     .dev_unplug_pending = dev_unplug_pending,
37984d45dcfbSHalil Pasic };
3799290c2428SDr. David Alan Gilbert 
380017ec5a86SKONRAD Frederic static Property virtio_net_properties[] = {
3801127833eeSJason Baron     DEFINE_PROP_BIT64("csum", VirtIONet, host_features,
3802127833eeSJason Baron                     VIRTIO_NET_F_CSUM, true),
3803127833eeSJason Baron     DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features,
380487108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_CSUM, true),
3805127833eeSJason Baron     DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true),
3806127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features,
380787108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO4, true),
3808127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features,
380987108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO6, true),
3810127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features,
381187108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ECN, true),
3812127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features,
381387108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_UFO, true),
3814127833eeSJason Baron     DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features,
381587108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ANNOUNCE, true),
3816127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features,
381787108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO4, true),
3818127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features,
381987108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO6, true),
3820127833eeSJason Baron     DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features,
382187108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_ECN, true),
3822127833eeSJason Baron     DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features,
382387108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_UFO, true),
3824127833eeSJason Baron     DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features,
382587108bb2SShannon Zhao                     VIRTIO_NET_F_MRG_RXBUF, true),
3826127833eeSJason Baron     DEFINE_PROP_BIT64("status", VirtIONet, host_features,
382787108bb2SShannon Zhao                     VIRTIO_NET_F_STATUS, true),
3828127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features,
382987108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VQ, true),
3830127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features,
383187108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX, true),
3832127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features,
383387108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VLAN, true),
3834127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features,
383587108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX_EXTRA, true),
3836127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features,
383787108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_MAC_ADDR, true),
3838127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features,
383987108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true),
3840127833eeSJason Baron     DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false),
384159079029SYuri Benditovich     DEFINE_PROP_BIT64("rss", VirtIONet, host_features,
384259079029SYuri Benditovich                     VIRTIO_NET_F_RSS, false),
3843e22f0603SYuri Benditovich     DEFINE_PROP_BIT64("hash", VirtIONet, host_features,
3844e22f0603SYuri Benditovich                     VIRTIO_NET_F_HASH_REPORT, false),
38452974e916SYuri Benditovich     DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features,
38462974e916SYuri Benditovich                     VIRTIO_NET_F_RSC_EXT, false),
38472974e916SYuri Benditovich     DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout,
38482974e916SYuri Benditovich                        VIRTIO_NET_RSC_DEFAULT_INTERVAL),
384917ec5a86SKONRAD Frederic     DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
385017ec5a86SKONRAD Frederic     DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
385117ec5a86SKONRAD Frederic                        TX_TIMER_INTERVAL),
385217ec5a86SKONRAD Frederic     DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
385317ec5a86SKONRAD Frederic     DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
38541c0fbfa3SMichael S. Tsirkin     DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size,
38551c0fbfa3SMichael S. Tsirkin                        VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE),
38569b02e161SWei Wang     DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size,
38579b02e161SWei Wang                        VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE),
3858a93e599dSMaxime Coquelin     DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0),
385975ebec11SMaxime Coquelin     DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend,
386075ebec11SMaxime Coquelin                      true),
38619473939eSJason Baron     DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN),
38629473939eSJason Baron     DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str),
38639711cd0dSJens Freimann     DEFINE_PROP_BOOL("failover", VirtIONet, failover, false),
386417ec5a86SKONRAD Frederic     DEFINE_PROP_END_OF_LIST(),
386517ec5a86SKONRAD Frederic };
386617ec5a86SKONRAD Frederic 
386717ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data)
386817ec5a86SKONRAD Frederic {
386917ec5a86SKONRAD Frederic     DeviceClass *dc = DEVICE_CLASS(klass);
387017ec5a86SKONRAD Frederic     VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
3871e6f746b3SAndreas Färber 
38724f67d30bSMarc-André Lureau     device_class_set_props(dc, virtio_net_properties);
3873290c2428SDr. David Alan Gilbert     dc->vmsd = &vmstate_virtio_net;
3874125ee0edSMarcel Apfelbaum     set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
3875e6f746b3SAndreas Färber     vdc->realize = virtio_net_device_realize;
3876306ec6c3SAndreas Färber     vdc->unrealize = virtio_net_device_unrealize;
387717ec5a86SKONRAD Frederic     vdc->get_config = virtio_net_get_config;
387817ec5a86SKONRAD Frederic     vdc->set_config = virtio_net_set_config;
387917ec5a86SKONRAD Frederic     vdc->get_features = virtio_net_get_features;
388017ec5a86SKONRAD Frederic     vdc->set_features = virtio_net_set_features;
388117ec5a86SKONRAD Frederic     vdc->bad_features = virtio_net_bad_features;
388217ec5a86SKONRAD Frederic     vdc->reset = virtio_net_reset;
38837dc6be52SXuan Zhuo     vdc->queue_reset = virtio_net_queue_reset;
38847f863302SKangjie Xu     vdc->queue_enable = virtio_net_queue_enable;
388517ec5a86SKONRAD Frederic     vdc->set_status = virtio_net_set_status;
388617ec5a86SKONRAD Frederic     vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
388717ec5a86SKONRAD Frederic     vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
38882a083ffdSMichael S. Tsirkin     vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO);
38897788c3f2SMikhail Sennikovsky     vdc->post_load = virtio_net_post_load_virtio;
3890982b78c5SDr. David Alan Gilbert     vdc->vmsd = &vmstate_virtio_net_device;
38919711cd0dSJens Freimann     vdc->primary_unplug_pending = primary_unplug_pending;
3892c255488dSJonah Palmer     vdc->get_vhost = virtio_net_get_vhost;
389317ec5a86SKONRAD Frederic }
389417ec5a86SKONRAD Frederic 
389517ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = {
389617ec5a86SKONRAD Frederic     .name = TYPE_VIRTIO_NET,
389717ec5a86SKONRAD Frederic     .parent = TYPE_VIRTIO_DEVICE,
389817ec5a86SKONRAD Frederic     .instance_size = sizeof(VirtIONet),
389917ec5a86SKONRAD Frederic     .instance_init = virtio_net_instance_init,
390017ec5a86SKONRAD Frederic     .class_init = virtio_net_class_init,
390117ec5a86SKONRAD Frederic };
390217ec5a86SKONRAD Frederic 
390317ec5a86SKONRAD Frederic static void virtio_register_types(void)
390417ec5a86SKONRAD Frederic {
390517ec5a86SKONRAD Frederic     type_register_static(&virtio_net_info);
390617ec5a86SKONRAD Frederic }
390717ec5a86SKONRAD Frederic 
390817ec5a86SKONRAD Frederic type_init(virtio_register_types)
3909