xref: /openbmc/qemu/hw/net/virtio-net.c (revision 4fdf69ab691e513280a3b5529de997d95a29f358)
16e790746SPaolo Bonzini /*
26e790746SPaolo Bonzini  * Virtio Network Device
36e790746SPaolo Bonzini  *
46e790746SPaolo Bonzini  * Copyright IBM, Corp. 2007
56e790746SPaolo Bonzini  *
66e790746SPaolo Bonzini  * Authors:
76e790746SPaolo Bonzini  *  Anthony Liguori   <aliguori@us.ibm.com>
86e790746SPaolo Bonzini  *
96e790746SPaolo Bonzini  * This work is licensed under the terms of the GNU GPL, version 2.  See
106e790746SPaolo Bonzini  * the COPYING file in the top-level directory.
116e790746SPaolo Bonzini  *
126e790746SPaolo Bonzini  */
136e790746SPaolo Bonzini 
149b8bfe21SPeter Maydell #include "qemu/osdep.h"
159711cd0dSJens Freimann #include "qemu/atomic.h"
166e790746SPaolo Bonzini #include "qemu/iov.h"
1768b0a639SSi-Wei Liu #include "qemu/log.h"
18db725815SMarkus Armbruster #include "qemu/main-loop.h"
190b8fa32fSMarkus Armbruster #include "qemu/module.h"
206e790746SPaolo Bonzini #include "hw/virtio/virtio.h"
216e790746SPaolo Bonzini #include "net/net.h"
226e790746SPaolo Bonzini #include "net/checksum.h"
236e790746SPaolo Bonzini #include "net/tap.h"
246e790746SPaolo Bonzini #include "qemu/error-report.h"
256e790746SPaolo Bonzini #include "qemu/timer.h"
269711cd0dSJens Freimann #include "qemu/option.h"
279711cd0dSJens Freimann #include "qemu/option_int.h"
289711cd0dSJens Freimann #include "qemu/config-file.h"
299711cd0dSJens Freimann #include "qapi/qmp/qdict.h"
306e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h"
316e790746SPaolo Bonzini #include "net/vhost_net.h"
329d8c6a25SDr. David Alan Gilbert #include "net/announce.h"
3317ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h"
34e688df6bSMarkus Armbruster #include "qapi/error.h"
359af23989SMarkus Armbruster #include "qapi/qapi-events-net.h"
36a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h"
379711cd0dSJens Freimann #include "qapi/qapi-types-migration.h"
389711cd0dSJens Freimann #include "qapi/qapi-events-migration.h"
391399c60dSRusty Russell #include "hw/virtio/virtio-access.h"
40f8d806c9SJuan Quintela #include "migration/misc.h"
419473939eSJason Baron #include "standard-headers/linux/ethtool.h"
422f780b6aSMarkus Armbruster #include "sysemu/sysemu.h"
439d8c6a25SDr. David Alan Gilbert #include "trace.h"
449711cd0dSJens Freimann #include "monitor/qdev.h"
459711cd0dSJens Freimann #include "hw/pci/pci.h"
464474e37aSYuri Benditovich #include "net_rx_pkt.h"
47108a6481SCindy Lu #include "hw/virtio/vhost.h"
481b529d90SLaurent Vivier #include "sysemu/qtest.h"
496e790746SPaolo Bonzini 
#define VIRTIO_NET_VM_VERSION    11

#define MAX_VLAN    (1 << 12)   /* Per 802.1Q definition */

/* previously fixed value */
#define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256
#define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256

/*
 * for now, only allow queue sizes of at least the previously fixed value;
 * with virtio-1, guest can downsize
 */
#define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
#define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE

#define VIRTIO_NET_IP4_ADDR_SIZE   8        /* ipv4 saddr + daddr */

#define VIRTIO_NET_TCP_FLAG         0x3F
#define VIRTIO_NET_TCP_HDR_LENGTH   0xF000

/* IPv4 max payload, 16 bits in the header */
#define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header))
#define VIRTIO_NET_MAX_TCP_PAYLOAD 65535

/* header length value in ip header without option */
#define VIRTIO_NET_IP4_HEADER_LENGTH 5

#define VIRTIO_NET_IP6_ADDR_SIZE   32      /* ipv6 saddr + daddr */
#define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD

/*
 * Purge coalesced packets timer interval. This value affects the
 * performance a lot, and should be tuned carefully: '300000' (300us) is
 * the recommended value to pass the WHQL test, '50000' can gain 2x netperf
 * throughput with tso/gso/gro 'off'.
 */
#define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000

/* Union of every RSS hash type bit this file lists as supported. */
#define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \
                                         VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \
                                         VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \
                                         VIRTIO_NET_RSS_HASH_TYPE_UDP_EX)
9259079029SYuri Benditovich 
93ad6461adSPhilippe Mathieu-Daudé static const VirtIOFeature feature_sizes[] = {
94127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MAC,
955d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mac)},
96127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_STATUS,
975d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, status)},
98127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MQ,
995d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
100127833eeSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_MTU,
1015d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, mtu)},
1029473939eSJason Baron     {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX,
1035d5b33c0SMax Reitz      .end = endof(struct virtio_net_config, duplex)},
104e22f0603SYuri Benditovich     {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT),
10559079029SYuri Benditovich      .end = endof(struct virtio_net_config, supported_hash_types)},
1066e790746SPaolo Bonzini     {}
1076e790746SPaolo Bonzini };
1086e790746SPaolo Bonzini 
109d74c30c8SDaniil Tatianin static const VirtIOConfigSizeParams cfg_size_params = {
110d74c30c8SDaniil Tatianin     .min_size = endof(struct virtio_net_config, mac),
111d74c30c8SDaniil Tatianin     .max_size = sizeof(struct virtio_net_config),
112d74c30c8SDaniil Tatianin     .feature_sizes = feature_sizes
113d74c30c8SDaniil Tatianin };
114d74c30c8SDaniil Tatianin 
1156e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
1166e790746SPaolo Bonzini {
1176e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1186e790746SPaolo Bonzini 
1196e790746SPaolo Bonzini     return &n->vqs[nc->queue_index];
1206e790746SPaolo Bonzini }
1216e790746SPaolo Bonzini 
/*
 * Convert a virtqueue index into a queue (pair) index: two consecutive
 * virtqueue indexes map to the same result.
 */
static int vq2q(int queue_index)
{
    return queue_index / 2;
}
1266e790746SPaolo Bonzini 
127*4fdf69abSKangjie Xu static void flush_or_purge_queued_packets(NetClientState *nc)
128*4fdf69abSKangjie Xu {
129*4fdf69abSKangjie Xu     if (!nc->peer) {
130*4fdf69abSKangjie Xu         return;
131*4fdf69abSKangjie Xu     }
132*4fdf69abSKangjie Xu 
133*4fdf69abSKangjie Xu     qemu_flush_or_purge_queued_packets(nc->peer, true);
134*4fdf69abSKangjie Xu     assert(!virtio_net_get_subqueue(nc)->async_tx.elem);
135*4fdf69abSKangjie Xu }
136*4fdf69abSKangjie Xu 
1376e790746SPaolo Bonzini /* TODO
1386e790746SPaolo Bonzini  * - we could suppress RX interrupt if we were so inclined.
1396e790746SPaolo Bonzini  */
1406e790746SPaolo Bonzini 
1416e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
1426e790746SPaolo Bonzini {
14317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1446e790746SPaolo Bonzini     struct virtio_net_config netcfg;
145c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
146fb592882SCindy Lu     static const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } };
1476e790746SPaolo Bonzini 
148108a6481SCindy Lu     int ret = 0;
149108a6481SCindy Lu     memset(&netcfg, 0 , sizeof(struct virtio_net_config));
1501399c60dSRusty Russell     virtio_stw_p(vdev, &netcfg.status, n->status);
151441537f1SJason Wang     virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queue_pairs);
152a93e599dSMaxime Coquelin     virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu);
1536e790746SPaolo Bonzini     memcpy(netcfg.mac, n->mac, ETH_ALEN);
1549473939eSJason Baron     virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed);
1559473939eSJason Baron     netcfg.duplex = n->net_conf.duplex;
15659079029SYuri Benditovich     netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE;
15759079029SYuri Benditovich     virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length,
158e22f0603SYuri Benditovich                  virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ?
159e22f0603SYuri Benditovich                  VIRTIO_NET_RSS_MAX_TABLE_LEN : 1);
16059079029SYuri Benditovich     virtio_stl_p(vdev, &netcfg.supported_hash_types,
16159079029SYuri Benditovich                  VIRTIO_NET_RSS_SUPPORTED_HASHES);
1626e790746SPaolo Bonzini     memcpy(config, &netcfg, n->config_size);
163108a6481SCindy Lu 
164c546ecf2SJason Wang     /*
165c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
166c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
167c546ecf2SJason Wang      */
168c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
169108a6481SCindy Lu         ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg,
170108a6481SCindy Lu                                    n->config_size);
171108a6481SCindy Lu         if (ret != -1) {
172fb592882SCindy Lu             /*
173fb592882SCindy Lu              * Some NIC/kernel combinations present 0 as the mac address.  As
174fb592882SCindy Lu              * that is not a legal address, try to proceed with the
175fb592882SCindy Lu              * address from the QEMU command line in the hope that the
176fb592882SCindy Lu              * address has been configured correctly elsewhere - just not
177fb592882SCindy Lu              * reported by the device.
178fb592882SCindy Lu              */
179fb592882SCindy Lu             if (memcmp(&netcfg.mac, &zero, sizeof(zero)) == 0) {
180fb592882SCindy Lu                 info_report("Zero hardware mac address detected. Ignoring.");
181fb592882SCindy Lu                 memcpy(netcfg.mac, n->mac, ETH_ALEN);
182fb592882SCindy Lu             }
183108a6481SCindy Lu             memcpy(config, &netcfg, n->config_size);
184108a6481SCindy Lu         }
185108a6481SCindy Lu     }
1866e790746SPaolo Bonzini }
1876e790746SPaolo Bonzini 
1886e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
1896e790746SPaolo Bonzini {
19017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
1916e790746SPaolo Bonzini     struct virtio_net_config netcfg = {};
192c546ecf2SJason Wang     NetClientState *nc = qemu_get_queue(n->nic);
1936e790746SPaolo Bonzini 
1946e790746SPaolo Bonzini     memcpy(&netcfg, config, n->config_size);
1956e790746SPaolo Bonzini 
19695129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) &&
19795129d6fSCornelia Huck         !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) &&
1986e790746SPaolo Bonzini         memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
1996e790746SPaolo Bonzini         memcpy(n->mac, netcfg.mac, ETH_ALEN);
2006e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
2016e790746SPaolo Bonzini     }
202108a6481SCindy Lu 
203c546ecf2SJason Wang     /*
204c546ecf2SJason Wang      * Is this VDPA? No peer means not VDPA: there's no way to
205c546ecf2SJason Wang      * disconnect/reconnect a VDPA peer.
206c546ecf2SJason Wang      */
207c546ecf2SJason Wang     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
208c546ecf2SJason Wang         vhost_net_set_config(get_vhost_net(nc->peer),
209c546ecf2SJason Wang                              (uint8_t *)&netcfg, 0, n->config_size,
210108a6481SCindy Lu                              VHOST_SET_CONFIG_TYPE_MASTER);
211108a6481SCindy Lu       }
2126e790746SPaolo Bonzini }
2136e790746SPaolo Bonzini 
2146e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status)
2156e790746SPaolo Bonzini {
21617a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2176e790746SPaolo Bonzini     return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
21817a0ca55SKONRAD Frederic         (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
2196e790746SPaolo Bonzini }
2206e790746SPaolo Bonzini 
221b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net)
222b2c929f0SDr. David Alan Gilbert {
223b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(net);
224b2c929f0SDr. David Alan Gilbert     trace_virtio_net_announce_notify();
225b2c929f0SDr. David Alan Gilbert 
226b2c929f0SDr. David Alan Gilbert     net->status |= VIRTIO_NET_S_ANNOUNCE;
227b2c929f0SDr. David Alan Gilbert     virtio_notify_config(vdev);
228b2c929f0SDr. David Alan Gilbert }
229b2c929f0SDr. David Alan Gilbert 
230f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque)
231f57fcf70SJason Wang {
232f57fcf70SJason Wang     VirtIONet *n = opaque;
2339d8c6a25SDr. David Alan Gilbert     trace_virtio_net_announce_timer(n->announce_timer.round);
234f57fcf70SJason Wang 
2359d8c6a25SDr. David Alan Gilbert     n->announce_timer.round--;
236b2c929f0SDr. David Alan Gilbert     virtio_net_announce_notify(n);
237b2c929f0SDr. David Alan Gilbert }
238b2c929f0SDr. David Alan Gilbert 
239b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc)
240b2c929f0SDr. David Alan Gilbert {
241b2c929f0SDr. David Alan Gilbert     VirtIONet *n = qemu_get_nic_opaque(nc);
242b2c929f0SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
243b2c929f0SDr. David Alan Gilbert 
244b2c929f0SDr. David Alan Gilbert     /*
245b2c929f0SDr. David Alan Gilbert      * Make sure the virtio migration announcement timer isn't running
246b2c929f0SDr. David Alan Gilbert      * If it is, let it trigger announcement so that we do not cause
247b2c929f0SDr. David Alan Gilbert      * confusion.
248b2c929f0SDr. David Alan Gilbert      */
249b2c929f0SDr. David Alan Gilbert     if (n->announce_timer.round) {
250b2c929f0SDr. David Alan Gilbert         return;
251b2c929f0SDr. David Alan Gilbert     }
252b2c929f0SDr. David Alan Gilbert 
253b2c929f0SDr. David Alan Gilbert     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
254b2c929f0SDr. David Alan Gilbert         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
255b2c929f0SDr. David Alan Gilbert             virtio_net_announce_notify(n);
256b2c929f0SDr. David Alan Gilbert     }
257f57fcf70SJason Wang }
258f57fcf70SJason Wang 
2596e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
2606e790746SPaolo Bonzini {
26117a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2626e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
263441537f1SJason Wang     int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
264aa858194SSi-Wei Liu     int cvq = virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ) ?
265aa858194SSi-Wei Liu               n->max_ncs - n->max_queue_pairs : 0;
2666e790746SPaolo Bonzini 
267ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
2686e790746SPaolo Bonzini         return;
2696e790746SPaolo Bonzini     }
2706e790746SPaolo Bonzini 
2718c1ac475SRadim Krčmář     if ((virtio_net_started(n, status) && !nc->peer->link_down) ==
2728c1ac475SRadim Krčmář         !!n->vhost_started) {
2736e790746SPaolo Bonzini         return;
2746e790746SPaolo Bonzini     }
2756e790746SPaolo Bonzini     if (!n->vhost_started) {
276086abc1cSMichael S. Tsirkin         int r, i;
277086abc1cSMichael S. Tsirkin 
2781bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
2791bfa316cSGreg Kurz             error_report("backend does not support %s vnet headers; "
2801bfa316cSGreg Kurz                          "falling back on userspace virtio",
2811bfa316cSGreg Kurz                          virtio_is_big_endian(vdev) ? "BE" : "LE");
2821bfa316cSGreg Kurz             return;
2831bfa316cSGreg Kurz         }
2841bfa316cSGreg Kurz 
285086abc1cSMichael S. Tsirkin         /* Any packets outstanding? Purge them to avoid touching rings
286086abc1cSMichael S. Tsirkin          * when vhost is running.
287086abc1cSMichael S. Tsirkin          */
288441537f1SJason Wang         for (i = 0;  i < queue_pairs; i++) {
289086abc1cSMichael S. Tsirkin             NetClientState *qnc = qemu_get_subqueue(n->nic, i);
290086abc1cSMichael S. Tsirkin 
291086abc1cSMichael S. Tsirkin             /* Purge both directions: TX and RX. */
292086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->peer->incoming_queue, qnc);
293086abc1cSMichael S. Tsirkin             qemu_net_queue_purge(qnc->incoming_queue, qnc->peer);
294086abc1cSMichael S. Tsirkin         }
295086abc1cSMichael S. Tsirkin 
296a93e599dSMaxime Coquelin         if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) {
297a93e599dSMaxime Coquelin             r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu);
298a93e599dSMaxime Coquelin             if (r < 0) {
299a93e599dSMaxime Coquelin                 error_report("%uBytes MTU not supported by the backend",
300a93e599dSMaxime Coquelin                              n->net_conf.mtu);
301a93e599dSMaxime Coquelin 
302a93e599dSMaxime Coquelin                 return;
303a93e599dSMaxime Coquelin             }
304a93e599dSMaxime Coquelin         }
305a93e599dSMaxime Coquelin 
3066e790746SPaolo Bonzini         n->vhost_started = 1;
30722288fe5SJason Wang         r = vhost_net_start(vdev, n->nic->ncs, queue_pairs, cvq);
3086e790746SPaolo Bonzini         if (r < 0) {
3096e790746SPaolo Bonzini             error_report("unable to start vhost net: %d: "
3106e790746SPaolo Bonzini                          "falling back on userspace virtio", -r);
3116e790746SPaolo Bonzini             n->vhost_started = 0;
3126e790746SPaolo Bonzini         }
3136e790746SPaolo Bonzini     } else {
31422288fe5SJason Wang         vhost_net_stop(vdev, n->nic->ncs, queue_pairs, cvq);
3156e790746SPaolo Bonzini         n->vhost_started = 0;
3166e790746SPaolo Bonzini     }
3176e790746SPaolo Bonzini }
3186e790746SPaolo Bonzini 
3191bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev,
3201bfa316cSGreg Kurz                                           NetClientState *peer,
3211bfa316cSGreg Kurz                                           bool enable)
3221bfa316cSGreg Kurz {
3231bfa316cSGreg Kurz     if (virtio_is_big_endian(vdev)) {
3241bfa316cSGreg Kurz         return qemu_set_vnet_be(peer, enable);
3251bfa316cSGreg Kurz     } else {
3261bfa316cSGreg Kurz         return qemu_set_vnet_le(peer, enable);
3271bfa316cSGreg Kurz     }
3281bfa316cSGreg Kurz }
3291bfa316cSGreg Kurz 
3301bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs,
331441537f1SJason Wang                                        int queue_pairs, bool enable)
3321bfa316cSGreg Kurz {
3331bfa316cSGreg Kurz     int i;
3341bfa316cSGreg Kurz 
335441537f1SJason Wang     for (i = 0; i < queue_pairs; i++) {
3361bfa316cSGreg Kurz         if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 &&
3371bfa316cSGreg Kurz             enable) {
3381bfa316cSGreg Kurz             while (--i >= 0) {
3391bfa316cSGreg Kurz                 virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false);
3401bfa316cSGreg Kurz             }
3411bfa316cSGreg Kurz 
3421bfa316cSGreg Kurz             return true;
3431bfa316cSGreg Kurz         }
3441bfa316cSGreg Kurz     }
3451bfa316cSGreg Kurz 
3461bfa316cSGreg Kurz     return false;
3471bfa316cSGreg Kurz }
3481bfa316cSGreg Kurz 
3491bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status)
3501bfa316cSGreg Kurz {
3511bfa316cSGreg Kurz     VirtIODevice *vdev = VIRTIO_DEVICE(n);
352441537f1SJason Wang     int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
3531bfa316cSGreg Kurz 
3541bfa316cSGreg Kurz     if (virtio_net_started(n, status)) {
3551bfa316cSGreg Kurz         /* Before using the device, we tell the network backend about the
3561bfa316cSGreg Kurz          * endianness to use when parsing vnet headers. If the backend
3571bfa316cSGreg Kurz          * can't do it, we fallback onto fixing the headers in the core
3581bfa316cSGreg Kurz          * virtio-net code.
3591bfa316cSGreg Kurz          */
3601bfa316cSGreg Kurz         n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs,
361441537f1SJason Wang                                                             queue_pairs, true);
3621bfa316cSGreg Kurz     } else if (virtio_net_started(n, vdev->status)) {
3631bfa316cSGreg Kurz         /* After using the device, we need to reset the network backend to
3641bfa316cSGreg Kurz          * the default (guest native endianness), otherwise the guest may
3651bfa316cSGreg Kurz          * lose network connectivity if it is rebooted into a different
3661bfa316cSGreg Kurz          * endianness.
3671bfa316cSGreg Kurz          */
368441537f1SJason Wang         virtio_net_set_vnet_endian(vdev, n->nic->ncs, queue_pairs, false);
3691bfa316cSGreg Kurz     }
3701bfa316cSGreg Kurz }
3711bfa316cSGreg Kurz 
372283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq)
373283e2c2aSYuri Benditovich {
374283e2c2aSYuri Benditovich     unsigned int dropped = virtqueue_drop_all(vq);
375283e2c2aSYuri Benditovich     if (dropped) {
376283e2c2aSYuri Benditovich         virtio_notify(vdev, vq);
377283e2c2aSYuri Benditovich     }
378283e2c2aSYuri Benditovich }
379283e2c2aSYuri Benditovich 
3806e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
3816e790746SPaolo Bonzini {
38217a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
3836e790746SPaolo Bonzini     VirtIONetQueue *q;
3846e790746SPaolo Bonzini     int i;
3856e790746SPaolo Bonzini     uint8_t queue_status;
3866e790746SPaolo Bonzini 
3871bfa316cSGreg Kurz     virtio_net_vnet_endian_status(n, status);
3886e790746SPaolo Bonzini     virtio_net_vhost_status(n, status);
3896e790746SPaolo Bonzini 
390441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
39138705bb5SFam Zheng         NetClientState *ncs = qemu_get_subqueue(n->nic, i);
39238705bb5SFam Zheng         bool queue_started;
3936e790746SPaolo Bonzini         q = &n->vqs[i];
3946e790746SPaolo Bonzini 
395441537f1SJason Wang         if ((!n->multiqueue && i != 0) || i >= n->curr_queue_pairs) {
3966e790746SPaolo Bonzini             queue_status = 0;
3976e790746SPaolo Bonzini         } else {
3986e790746SPaolo Bonzini             queue_status = status;
3996e790746SPaolo Bonzini         }
40038705bb5SFam Zheng         queue_started =
40138705bb5SFam Zheng             virtio_net_started(n, queue_status) && !n->vhost_started;
40238705bb5SFam Zheng 
40338705bb5SFam Zheng         if (queue_started) {
40438705bb5SFam Zheng             qemu_flush_queued_packets(ncs);
40538705bb5SFam Zheng         }
4066e790746SPaolo Bonzini 
4076e790746SPaolo Bonzini         if (!q->tx_waiting) {
4086e790746SPaolo Bonzini             continue;
4096e790746SPaolo Bonzini         }
4106e790746SPaolo Bonzini 
41138705bb5SFam Zheng         if (queue_started) {
4126e790746SPaolo Bonzini             if (q->tx_timer) {
413bc72ad67SAlex Bligh                 timer_mod(q->tx_timer,
414bc72ad67SAlex Bligh                                qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
4156e790746SPaolo Bonzini             } else {
4166e790746SPaolo Bonzini                 qemu_bh_schedule(q->tx_bh);
4176e790746SPaolo Bonzini             }
4186e790746SPaolo Bonzini         } else {
4196e790746SPaolo Bonzini             if (q->tx_timer) {
420bc72ad67SAlex Bligh                 timer_del(q->tx_timer);
4216e790746SPaolo Bonzini             } else {
4226e790746SPaolo Bonzini                 qemu_bh_cancel(q->tx_bh);
4236e790746SPaolo Bonzini             }
424283e2c2aSYuri Benditovich             if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 &&
42570e53e6eSJason Wang                 (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) &&
42670e53e6eSJason Wang                 vdev->vm_running) {
427283e2c2aSYuri Benditovich                 /* if tx is waiting we are likely have some packets in tx queue
428283e2c2aSYuri Benditovich                  * and disabled notification */
429283e2c2aSYuri Benditovich                 q->tx_waiting = 0;
430283e2c2aSYuri Benditovich                 virtio_queue_set_notification(q->tx_vq, 1);
431283e2c2aSYuri Benditovich                 virtio_net_drop_tx_queue_data(vdev, q->tx_vq);
432283e2c2aSYuri Benditovich             }
4336e790746SPaolo Bonzini         }
4346e790746SPaolo Bonzini     }
4356e790746SPaolo Bonzini }
4366e790746SPaolo Bonzini 
4376e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc)
4386e790746SPaolo Bonzini {
4396e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
44017a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
4416e790746SPaolo Bonzini     uint16_t old_status = n->status;
4426e790746SPaolo Bonzini 
4436e790746SPaolo Bonzini     if (nc->link_down)
4446e790746SPaolo Bonzini         n->status &= ~VIRTIO_NET_S_LINK_UP;
4456e790746SPaolo Bonzini     else
4466e790746SPaolo Bonzini         n->status |= VIRTIO_NET_S_LINK_UP;
4476e790746SPaolo Bonzini 
4486e790746SPaolo Bonzini     if (n->status != old_status)
44917a0ca55SKONRAD Frederic         virtio_notify_config(vdev);
4506e790746SPaolo Bonzini 
45117a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
4526e790746SPaolo Bonzini }
4536e790746SPaolo Bonzini 
454b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc)
455b1be4280SAmos Kong {
456b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
457b1be4280SAmos Kong 
458b1be4280SAmos Kong     if (nc->rxfilter_notify_enabled) {
459ddfb0baaSMarkus Armbruster         char *path = object_get_canonical_path(OBJECT(n->qdev));
46006150279SWenchao Xia         qapi_event_send_nic_rx_filter_changed(!!n->netclient_name,
4613ab72385SPeter Xu                                               n->netclient_name, path);
46296e35046SAmos Kong         g_free(path);
463b1be4280SAmos Kong 
464b1be4280SAmos Kong         /* disable event notification to avoid events flooding */
465b1be4280SAmos Kong         nc->rxfilter_notify_enabled = 0;
466b1be4280SAmos Kong     }
467b1be4280SAmos Kong }
468b1be4280SAmos Kong 
469f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n)
470f7bc8ef8SAmos Kong {
47154aa3de7SEric Blake     intList *list;
472f7bc8ef8SAmos Kong     int i, j;
473f7bc8ef8SAmos Kong 
474f7bc8ef8SAmos Kong     list = NULL;
475f7bc8ef8SAmos Kong     for (i = 0; i < MAX_VLAN >> 5; i++) {
476f7bc8ef8SAmos Kong         for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
477f7bc8ef8SAmos Kong             if (n->vlans[i] & (1U << j)) {
47854aa3de7SEric Blake                 QAPI_LIST_PREPEND(list, (i << 5) + j);
479f7bc8ef8SAmos Kong             }
480f7bc8ef8SAmos Kong         }
481f7bc8ef8SAmos Kong     }
482f7bc8ef8SAmos Kong 
483f7bc8ef8SAmos Kong     return list;
484f7bc8ef8SAmos Kong }
485f7bc8ef8SAmos Kong 
486b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
487b1be4280SAmos Kong {
488b1be4280SAmos Kong     VirtIONet *n = qemu_get_nic_opaque(nc);
489f7bc8ef8SAmos Kong     VirtIODevice *vdev = VIRTIO_DEVICE(n);
490b1be4280SAmos Kong     RxFilterInfo *info;
49154aa3de7SEric Blake     strList *str_list;
492f7bc8ef8SAmos Kong     int i;
493b1be4280SAmos Kong 
494b1be4280SAmos Kong     info = g_malloc0(sizeof(*info));
495b1be4280SAmos Kong     info->name = g_strdup(nc->name);
496b1be4280SAmos Kong     info->promiscuous = n->promisc;
497b1be4280SAmos Kong 
498b1be4280SAmos Kong     if (n->nouni) {
499b1be4280SAmos Kong         info->unicast = RX_STATE_NONE;
500b1be4280SAmos Kong     } else if (n->alluni) {
501b1be4280SAmos Kong         info->unicast = RX_STATE_ALL;
502b1be4280SAmos Kong     } else {
503b1be4280SAmos Kong         info->unicast = RX_STATE_NORMAL;
504b1be4280SAmos Kong     }
505b1be4280SAmos Kong 
506b1be4280SAmos Kong     if (n->nomulti) {
507b1be4280SAmos Kong         info->multicast = RX_STATE_NONE;
508b1be4280SAmos Kong     } else if (n->allmulti) {
509b1be4280SAmos Kong         info->multicast = RX_STATE_ALL;
510b1be4280SAmos Kong     } else {
511b1be4280SAmos Kong         info->multicast = RX_STATE_NORMAL;
512b1be4280SAmos Kong     }
513b1be4280SAmos Kong 
514b1be4280SAmos Kong     info->broadcast_allowed = n->nobcast;
515b1be4280SAmos Kong     info->multicast_overflow = n->mac_table.multi_overflow;
516b1be4280SAmos Kong     info->unicast_overflow = n->mac_table.uni_overflow;
517b1be4280SAmos Kong 
518b0575ba4SScott Feldman     info->main_mac = qemu_mac_strdup_printf(n->mac);
519b1be4280SAmos Kong 
520b1be4280SAmos Kong     str_list = NULL;
521b1be4280SAmos Kong     for (i = 0; i < n->mac_table.first_multi; i++) {
52254aa3de7SEric Blake         QAPI_LIST_PREPEND(str_list,
52354aa3de7SEric Blake                       qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN));
524b1be4280SAmos Kong     }
525b1be4280SAmos Kong     info->unicast_table = str_list;
526b1be4280SAmos Kong 
527b1be4280SAmos Kong     str_list = NULL;
528b1be4280SAmos Kong     for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
52954aa3de7SEric Blake         QAPI_LIST_PREPEND(str_list,
53054aa3de7SEric Blake                       qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN));
531b1be4280SAmos Kong     }
532b1be4280SAmos Kong     info->multicast_table = str_list;
533f7bc8ef8SAmos Kong     info->vlan_table = get_vlan_table(n);
534b1be4280SAmos Kong 
53595129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) {
536f7bc8ef8SAmos Kong         info->vlan = RX_STATE_ALL;
537f7bc8ef8SAmos Kong     } else if (!info->vlan_table) {
538f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NONE;
539f7bc8ef8SAmos Kong     } else {
540f7bc8ef8SAmos Kong         info->vlan = RX_STATE_NORMAL;
541b1be4280SAmos Kong     }
542b1be4280SAmos Kong 
543b1be4280SAmos Kong     /* enable event notification after query */
544b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
545b1be4280SAmos Kong 
546b1be4280SAmos Kong     return info;
547b1be4280SAmos Kong }
548b1be4280SAmos Kong 
5496e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev)
5506e790746SPaolo Bonzini {
55117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
55294b52958SGreg Kurz     int i;
5536e790746SPaolo Bonzini 
5546e790746SPaolo Bonzini     /* Reset back to compatibility mode */
5556e790746SPaolo Bonzini     n->promisc = 1;
5566e790746SPaolo Bonzini     n->allmulti = 0;
5576e790746SPaolo Bonzini     n->alluni = 0;
5586e790746SPaolo Bonzini     n->nomulti = 0;
5596e790746SPaolo Bonzini     n->nouni = 0;
5606e790746SPaolo Bonzini     n->nobcast = 0;
5616e790746SPaolo Bonzini     /* multiqueue is disabled by default */
562441537f1SJason Wang     n->curr_queue_pairs = 1;
5639d8c6a25SDr. David Alan Gilbert     timer_del(n->announce_timer.tm);
5649d8c6a25SDr. David Alan Gilbert     n->announce_timer.round = 0;
565f57fcf70SJason Wang     n->status &= ~VIRTIO_NET_S_ANNOUNCE;
5666e790746SPaolo Bonzini 
5676e790746SPaolo Bonzini     /* Flush any MAC and VLAN filter table state */
5686e790746SPaolo Bonzini     n->mac_table.in_use = 0;
5696e790746SPaolo Bonzini     n->mac_table.first_multi = 0;
5706e790746SPaolo Bonzini     n->mac_table.multi_overflow = 0;
5716e790746SPaolo Bonzini     n->mac_table.uni_overflow = 0;
5726e790746SPaolo Bonzini     memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
5736e790746SPaolo Bonzini     memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
574702d66a8SMichael S. Tsirkin     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
5756e790746SPaolo Bonzini     memset(n->vlans, 0, MAX_VLAN >> 3);
57694b52958SGreg Kurz 
57794b52958SGreg Kurz     /* Flush any async TX */
578441537f1SJason Wang     for (i = 0;  i < n->max_queue_pairs; i++) {
579*4fdf69abSKangjie Xu         flush_or_purge_queued_packets(qemu_get_subqueue(n->nic, i));
58094b52958SGreg Kurz     }
5816e790746SPaolo Bonzini }
5826e790746SPaolo Bonzini 
5836e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n)
5846e790746SPaolo Bonzini {
5856e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
5866e790746SPaolo Bonzini     if (!nc->peer) {
5876e790746SPaolo Bonzini         return;
5886e790746SPaolo Bonzini     }
5896e790746SPaolo Bonzini 
590d6085e3aSStefan Hajnoczi     n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
5916e790746SPaolo Bonzini }
5926e790746SPaolo Bonzini 
5936e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n)
5946e790746SPaolo Bonzini {
5956e790746SPaolo Bonzini     return n->has_vnet_hdr;
5966e790746SPaolo Bonzini }
5976e790746SPaolo Bonzini 
5986e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n)
5996e790746SPaolo Bonzini {
6006e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n))
6016e790746SPaolo Bonzini         return 0;
6026e790746SPaolo Bonzini 
603d6085e3aSStefan Hajnoczi     n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
6046e790746SPaolo Bonzini 
6056e790746SPaolo Bonzini     return n->has_ufo;
6066e790746SPaolo Bonzini }
6076e790746SPaolo Bonzini 
608bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs,
609e22f0603SYuri Benditovich                                        int version_1, int hash_report)
6106e790746SPaolo Bonzini {
6116e790746SPaolo Bonzini     int i;
6126e790746SPaolo Bonzini     NetClientState *nc;
6136e790746SPaolo Bonzini 
6146e790746SPaolo Bonzini     n->mergeable_rx_bufs = mergeable_rx_bufs;
6156e790746SPaolo Bonzini 
616bb9d17f8SCornelia Huck     if (version_1) {
617e22f0603SYuri Benditovich         n->guest_hdr_len = hash_report ?
618e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_v1_hash) :
619e22f0603SYuri Benditovich             sizeof(struct virtio_net_hdr_mrg_rxbuf);
620e22f0603SYuri Benditovich         n->rss_data.populate_hash = !!hash_report;
621bb9d17f8SCornelia Huck     } else {
6226e790746SPaolo Bonzini         n->guest_hdr_len = n->mergeable_rx_bufs ?
623bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr_mrg_rxbuf) :
624bb9d17f8SCornelia Huck             sizeof(struct virtio_net_hdr);
625bb9d17f8SCornelia Huck     }
6266e790746SPaolo Bonzini 
627441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
6286e790746SPaolo Bonzini         nc = qemu_get_subqueue(n->nic, i);
6296e790746SPaolo Bonzini 
6306e790746SPaolo Bonzini         if (peer_has_vnet_hdr(n) &&
631d6085e3aSStefan Hajnoczi             qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
632d6085e3aSStefan Hajnoczi             qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
6336e790746SPaolo Bonzini             n->host_hdr_len = n->guest_hdr_len;
6346e790746SPaolo Bonzini         }
6356e790746SPaolo Bonzini     }
6366e790746SPaolo Bonzini }
6376e790746SPaolo Bonzini 
6382eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n)
6392eef278bSMichael S. Tsirkin {
6402eef278bSMichael S. Tsirkin     NetClientState *peer = n->nic_conf.peers.ncs[0];
6412eef278bSMichael S. Tsirkin 
6422eef278bSMichael S. Tsirkin     /*
6430ea5778fSEugenio Pérez      * Backends other than vhost-user or vhost-vdpa don't support max queue
6440ea5778fSEugenio Pérez      * size.
6452eef278bSMichael S. Tsirkin      */
6462eef278bSMichael S. Tsirkin     if (!peer) {
6472eef278bSMichael S. Tsirkin         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6482eef278bSMichael S. Tsirkin     }
6492eef278bSMichael S. Tsirkin 
6500ea5778fSEugenio Pérez     switch(peer->info->type) {
6510ea5778fSEugenio Pérez     case NET_CLIENT_DRIVER_VHOST_USER:
6520ea5778fSEugenio Pérez     case NET_CLIENT_DRIVER_VHOST_VDPA:
6532eef278bSMichael S. Tsirkin         return VIRTQUEUE_MAX_SIZE;
6540ea5778fSEugenio Pérez     default:
6550ea5778fSEugenio Pérez         return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE;
6560ea5778fSEugenio Pérez     };
6572eef278bSMichael S. Tsirkin }
6582eef278bSMichael S. Tsirkin 
6596e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index)
6606e790746SPaolo Bonzini {
6616e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6626e790746SPaolo Bonzini 
6636e790746SPaolo Bonzini     if (!nc->peer) {
6646e790746SPaolo Bonzini         return 0;
6656e790746SPaolo Bonzini     }
6666e790746SPaolo Bonzini 
667f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6687263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 1);
6697263a0adSChangchun Ouyang     }
6707263a0adSChangchun Ouyang 
671f394b2e2SEric Blake     if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
6726e790746SPaolo Bonzini         return 0;
6736e790746SPaolo Bonzini     }
6746e790746SPaolo Bonzini 
675441537f1SJason Wang     if (n->max_queue_pairs == 1) {
6761074b879SJason Wang         return 0;
6771074b879SJason Wang     }
6781074b879SJason Wang 
6796e790746SPaolo Bonzini     return tap_enable(nc->peer);
6806e790746SPaolo Bonzini }
6816e790746SPaolo Bonzini 
6826e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index)
6836e790746SPaolo Bonzini {
6846e790746SPaolo Bonzini     NetClientState *nc = qemu_get_subqueue(n->nic, index);
6856e790746SPaolo Bonzini 
6866e790746SPaolo Bonzini     if (!nc->peer) {
6876e790746SPaolo Bonzini         return 0;
6886e790746SPaolo Bonzini     }
6896e790746SPaolo Bonzini 
690f394b2e2SEric Blake     if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
6917263a0adSChangchun Ouyang         vhost_set_vring_enable(nc->peer, 0);
6927263a0adSChangchun Ouyang     }
6937263a0adSChangchun Ouyang 
694f394b2e2SEric Blake     if (nc->peer->info->type !=  NET_CLIENT_DRIVER_TAP) {
6956e790746SPaolo Bonzini         return 0;
6966e790746SPaolo Bonzini     }
6976e790746SPaolo Bonzini 
6986e790746SPaolo Bonzini     return tap_disable(nc->peer);
6996e790746SPaolo Bonzini }
7006e790746SPaolo Bonzini 
701441537f1SJason Wang static void virtio_net_set_queue_pairs(VirtIONet *n)
7026e790746SPaolo Bonzini {
7036e790746SPaolo Bonzini     int i;
704ddfa83eaSJoel Stanley     int r;
7056e790746SPaolo Bonzini 
70668b5f314SYuri Benditovich     if (n->nic->peer_deleted) {
70768b5f314SYuri Benditovich         return;
70868b5f314SYuri Benditovich     }
70968b5f314SYuri Benditovich 
710441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
711441537f1SJason Wang         if (i < n->curr_queue_pairs) {
712ddfa83eaSJoel Stanley             r = peer_attach(n, i);
713ddfa83eaSJoel Stanley             assert(!r);
7146e790746SPaolo Bonzini         } else {
715ddfa83eaSJoel Stanley             r = peer_detach(n, i);
716ddfa83eaSJoel Stanley             assert(!r);
7176e790746SPaolo Bonzini         }
7186e790746SPaolo Bonzini     }
7196e790746SPaolo Bonzini }
7206e790746SPaolo Bonzini 
721ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
7226e790746SPaolo Bonzini 
7239d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features,
7249d5b731dSJason Wang                                         Error **errp)
7256e790746SPaolo Bonzini {
72617a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
7276e790746SPaolo Bonzini     NetClientState *nc = qemu_get_queue(n->nic);
7286e790746SPaolo Bonzini 
729da3e8a23SShannon Zhao     /* Firstly sync all virtio-net possible supported features */
730da3e8a23SShannon Zhao     features |= n->host_features;
731da3e8a23SShannon Zhao 
7320cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7336e790746SPaolo Bonzini 
7346e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n)) {
7350cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_CSUM);
7360cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7370cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7380cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN);
7396e790746SPaolo Bonzini 
7400cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM);
7410cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4);
7420cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6);
7430cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN);
744e22f0603SYuri Benditovich 
745e22f0603SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT);
7466e790746SPaolo Bonzini     }
7476e790746SPaolo Bonzini 
7486e790746SPaolo Bonzini     if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
7490cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO);
7500cd09c3aSCornelia Huck         virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO);
7516e790746SPaolo Bonzini     }
7526e790746SPaolo Bonzini 
753ed8b4afeSNikolay Nikolaev     if (!get_vhost_net(nc->peer)) {
7546e790746SPaolo Bonzini         return features;
7556e790746SPaolo Bonzini     }
7562974e916SYuri Benditovich 
7570145c393SAndrew Melnychenko     if (!ebpf_rss_is_loaded(&n->ebpf_rss)) {
75859079029SYuri Benditovich         virtio_clear_feature(&features, VIRTIO_NET_F_RSS);
7590145c393SAndrew Melnychenko     }
76075ebec11SMaxime Coquelin     features = vhost_net_get_features(get_vhost_net(nc->peer), features);
76175ebec11SMaxime Coquelin     vdev->backend_features = features;
76275ebec11SMaxime Coquelin 
76375ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
76475ebec11SMaxime Coquelin             (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) {
76575ebec11SMaxime Coquelin         features |= (1ULL << VIRTIO_NET_F_MTU);
76675ebec11SMaxime Coquelin     }
76775ebec11SMaxime Coquelin 
76875ebec11SMaxime Coquelin     return features;
7696e790746SPaolo Bonzini }
7706e790746SPaolo Bonzini 
771019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev)
7726e790746SPaolo Bonzini {
773019a3edbSGerd Hoffmann     uint64_t features = 0;
7746e790746SPaolo Bonzini 
7756e790746SPaolo Bonzini     /* Linux kernel 2.6.25.  It understood MAC (as everyone must),
7766e790746SPaolo Bonzini      * but also these: */
7770cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_MAC);
7780cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_CSUM);
7790cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4);
7800cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6);
7810cd09c3aSCornelia Huck     virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN);
7826e790746SPaolo Bonzini 
7836e790746SPaolo Bonzini     return features;
7846e790746SPaolo Bonzini }
7856e790746SPaolo Bonzini 
786644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n)
787644c9858SDmitry Fleytman {
788ad37bb3bSStefan Hajnoczi     qemu_set_offload(qemu_get_queue(n->nic)->peer,
789644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
790644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
791644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
792644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
793644c9858SDmitry Fleytman             !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
794644c9858SDmitry Fleytman }
795644c9858SDmitry Fleytman 
796644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
797644c9858SDmitry Fleytman {
798644c9858SDmitry Fleytman     static const uint64_t guest_offloads_mask =
799644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
800644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
801644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
802644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_ECN)  |
803644c9858SDmitry Fleytman         (1ULL << VIRTIO_NET_F_GUEST_UFO);
804644c9858SDmitry Fleytman 
805644c9858SDmitry Fleytman     return guest_offloads_mask & features;
806644c9858SDmitry Fleytman }
807644c9858SDmitry Fleytman 
808644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
809644c9858SDmitry Fleytman {
810644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
811644c9858SDmitry Fleytman     return virtio_net_guest_offloads_by_features(vdev->guest_features);
812644c9858SDmitry Fleytman }
813644c9858SDmitry Fleytman 
814f5e1847bSJuan Quintela typedef struct {
815f5e1847bSJuan Quintela     VirtIONet *n;
81612b2fad7SKevin Wolf     DeviceState *dev;
81712b2fad7SKevin Wolf } FailoverDevice;
818f5e1847bSJuan Quintela 
819f5e1847bSJuan Quintela /**
82012b2fad7SKevin Wolf  * Set the failover primary device
821f5e1847bSJuan Quintela  *
822f5e1847bSJuan Quintela  * @opaque: FailoverId to setup
823f5e1847bSJuan Quintela  * @opts: opts for device we are handling
824f5e1847bSJuan Quintela  * @errp: returns an error if this function fails
825f5e1847bSJuan Quintela  */
82612b2fad7SKevin Wolf static int failover_set_primary(DeviceState *dev, void *opaque)
827f5e1847bSJuan Quintela {
82812b2fad7SKevin Wolf     FailoverDevice *fdev = opaque;
82912b2fad7SKevin Wolf     PCIDevice *pci_dev = (PCIDevice *)
83012b2fad7SKevin Wolf         object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE);
831f5e1847bSJuan Quintela 
83212b2fad7SKevin Wolf     if (!pci_dev) {
83312b2fad7SKevin Wolf         return 0;
83412b2fad7SKevin Wolf     }
83512b2fad7SKevin Wolf 
83612b2fad7SKevin Wolf     if (!g_strcmp0(pci_dev->failover_pair_id, fdev->n->netclient_name)) {
83712b2fad7SKevin Wolf         fdev->dev = dev;
838f5e1847bSJuan Quintela         return 1;
839f5e1847bSJuan Quintela     }
840f5e1847bSJuan Quintela 
841f5e1847bSJuan Quintela     return 0;
842f5e1847bSJuan Quintela }
843f5e1847bSJuan Quintela 
844f5e1847bSJuan Quintela /**
84585d3b931SJuan Quintela  * Find the primary device for this failover virtio-net
84685d3b931SJuan Quintela  *
84785d3b931SJuan Quintela  * @n: VirtIONet device
84885d3b931SJuan Quintela  * @errp: returns an error if this function fails
84985d3b931SJuan Quintela  */
8500a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n)
8519711cd0dSJens Freimann {
85212b2fad7SKevin Wolf     FailoverDevice fdev = {
85312b2fad7SKevin Wolf         .n = n,
85412b2fad7SKevin Wolf     };
8559711cd0dSJens Freimann 
85612b2fad7SKevin Wolf     qbus_walk_children(sysbus_get_default(), failover_set_primary, NULL,
85712b2fad7SKevin Wolf                        NULL, NULL, &fdev);
85812b2fad7SKevin Wolf     return fdev.dev;
8599711cd0dSJens Freimann }
8609711cd0dSJens Freimann 
86121e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp)
86221e8709bSJuan Quintela {
86321e8709bSJuan Quintela     Error *err = NULL;
86421e8709bSJuan Quintela     DeviceState *dev = failover_find_primary_device(n);
86521e8709bSJuan Quintela 
86621e8709bSJuan Quintela     if (dev) {
86721e8709bSJuan Quintela         return;
86821e8709bSJuan Quintela     }
86921e8709bSJuan Quintela 
870259a10dbSKevin Wolf     if (!n->primary_opts) {
87197ca9c59SLaurent Vivier         error_setg(errp, "Primary device not found");
87297ca9c59SLaurent Vivier         error_append_hint(errp, "Virtio-net failover will not work. Make "
87397ca9c59SLaurent Vivier                           "sure primary device has parameter"
87497ca9c59SLaurent Vivier                           " failover_pair_id=%s\n", n->netclient_name);
87521e8709bSJuan Quintela         return;
87621e8709bSJuan Quintela     }
877259a10dbSKevin Wolf 
878f3558b1bSKevin Wolf     dev = qdev_device_add_from_qdict(n->primary_opts,
879f3558b1bSKevin Wolf                                      n->primary_opts_from_json,
880f3558b1bSKevin Wolf                                      &err);
88121e8709bSJuan Quintela     if (err) {
882f3558b1bSKevin Wolf         qobject_unref(n->primary_opts);
883259a10dbSKevin Wolf         n->primary_opts = NULL;
88400e7b129SLaurent Vivier     } else {
88500e7b129SLaurent Vivier         object_unref(OBJECT(dev));
88621e8709bSJuan Quintela     }
88721e8709bSJuan Quintela     error_propagate(errp, err);
88821e8709bSJuan Quintela }
88921e8709bSJuan Quintela 
890d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features)
8916e790746SPaolo Bonzini {
89217a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
8939711cd0dSJens Freimann     Error *err = NULL;
8946e790746SPaolo Bonzini     int i;
8956e790746SPaolo Bonzini 
89675ebec11SMaxime Coquelin     if (n->mtu_bypass_backend &&
89775ebec11SMaxime Coquelin             !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) {
89875ebec11SMaxime Coquelin         features &= ~(1ULL << VIRTIO_NET_F_MTU);
89975ebec11SMaxime Coquelin     }
90075ebec11SMaxime Coquelin 
901ef546f12SCornelia Huck     virtio_net_set_multiqueue(n,
90259079029SYuri Benditovich                               virtio_has_feature(features, VIRTIO_NET_F_RSS) ||
90395129d6fSCornelia Huck                               virtio_has_feature(features, VIRTIO_NET_F_MQ));
9046e790746SPaolo Bonzini 
905ef546f12SCornelia Huck     virtio_net_set_mrg_rx_bufs(n,
90695129d6fSCornelia Huck                                virtio_has_feature(features,
907bb9d17f8SCornelia Huck                                                   VIRTIO_NET_F_MRG_RXBUF),
90895129d6fSCornelia Huck                                virtio_has_feature(features,
909e22f0603SYuri Benditovich                                                   VIRTIO_F_VERSION_1),
910e22f0603SYuri Benditovich                                virtio_has_feature(features,
911e22f0603SYuri Benditovich                                                   VIRTIO_NET_F_HASH_REPORT));
9126e790746SPaolo Bonzini 
9132974e916SYuri Benditovich     n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9142974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4);
9152974e916SYuri Benditovich     n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) &&
9162974e916SYuri Benditovich         virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6);
917e22f0603SYuri Benditovich     n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS);
9182974e916SYuri Benditovich 
9196e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
920644c9858SDmitry Fleytman         n->curr_guest_offloads =
921644c9858SDmitry Fleytman             virtio_net_guest_offloads_by_features(features);
922644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
9236e790746SPaolo Bonzini     }
9246e790746SPaolo Bonzini 
925441537f1SJason Wang     for (i = 0;  i < n->max_queue_pairs; i++) {
9266e790746SPaolo Bonzini         NetClientState *nc = qemu_get_subqueue(n->nic, i);
9276e790746SPaolo Bonzini 
928ed8b4afeSNikolay Nikolaev         if (!get_vhost_net(nc->peer)) {
9296e790746SPaolo Bonzini             continue;
9306e790746SPaolo Bonzini         }
931ed8b4afeSNikolay Nikolaev         vhost_net_ack_features(get_vhost_net(nc->peer), features);
9326e790746SPaolo Bonzini     }
9330b1eaa88SStefan Fritsch 
93495129d6fSCornelia Huck     if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) {
9350b1eaa88SStefan Fritsch         memset(n->vlans, 0, MAX_VLAN >> 3);
9360b1eaa88SStefan Fritsch     } else {
9370b1eaa88SStefan Fritsch         memset(n->vlans, 0xff, MAX_VLAN >> 3);
9380b1eaa88SStefan Fritsch     }
9399711cd0dSJens Freimann 
9409711cd0dSJens Freimann     if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) {
9419711cd0dSJens Freimann         qapi_event_send_failover_negotiated(n->netclient_name);
942e2bde83eSJuan Quintela         qatomic_set(&n->failover_primary_hidden, false);
9439711cd0dSJens Freimann         failover_add_primary(n, &err);
9449711cd0dSJens Freimann         if (err) {
9451b529d90SLaurent Vivier             if (!qtest_enabled()) {
9469711cd0dSJens Freimann                 warn_report_err(err);
9471b529d90SLaurent Vivier             } else {
9481b529d90SLaurent Vivier                 error_free(err);
9491b529d90SLaurent Vivier             }
9509711cd0dSJens Freimann         }
9516e790746SPaolo Bonzini     }
95221e8709bSJuan Quintela }
9536e790746SPaolo Bonzini 
9546e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
9556e790746SPaolo Bonzini                                      struct iovec *iov, unsigned int iov_cnt)
9566e790746SPaolo Bonzini {
9576e790746SPaolo Bonzini     uint8_t on;
9586e790746SPaolo Bonzini     size_t s;
959b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
9606e790746SPaolo Bonzini 
9616e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
9626e790746SPaolo Bonzini     if (s != sizeof(on)) {
9636e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9646e790746SPaolo Bonzini     }
9656e790746SPaolo Bonzini 
9666e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
9676e790746SPaolo Bonzini         n->promisc = on;
9686e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
9696e790746SPaolo Bonzini         n->allmulti = on;
9706e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
9716e790746SPaolo Bonzini         n->alluni = on;
9726e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
9736e790746SPaolo Bonzini         n->nomulti = on;
9746e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
9756e790746SPaolo Bonzini         n->nouni = on;
9766e790746SPaolo Bonzini     } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
9776e790746SPaolo Bonzini         n->nobcast = on;
9786e790746SPaolo Bonzini     } else {
9796e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
9806e790746SPaolo Bonzini     }
9816e790746SPaolo Bonzini 
982b1be4280SAmos Kong     rxfilter_notify(nc);
983b1be4280SAmos Kong 
9846e790746SPaolo Bonzini     return VIRTIO_NET_OK;
9856e790746SPaolo Bonzini }
9866e790746SPaolo Bonzini 
987644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
988644c9858SDmitry Fleytman                                      struct iovec *iov, unsigned int iov_cnt)
989644c9858SDmitry Fleytman {
990644c9858SDmitry Fleytman     VirtIODevice *vdev = VIRTIO_DEVICE(n);
991644c9858SDmitry Fleytman     uint64_t offloads;
992644c9858SDmitry Fleytman     size_t s;
993644c9858SDmitry Fleytman 
99495129d6fSCornelia Huck     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
995644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
996644c9858SDmitry Fleytman     }
997644c9858SDmitry Fleytman 
998644c9858SDmitry Fleytman     s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
999644c9858SDmitry Fleytman     if (s != sizeof(offloads)) {
1000644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1001644c9858SDmitry Fleytman     }
1002644c9858SDmitry Fleytman 
1003644c9858SDmitry Fleytman     if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
1004644c9858SDmitry Fleytman         uint64_t supported_offloads;
1005644c9858SDmitry Fleytman 
1006189ae6bbSJason Wang         offloads = virtio_ldq_p(vdev, &offloads);
1007189ae6bbSJason Wang 
1008644c9858SDmitry Fleytman         if (!n->has_vnet_hdr) {
1009644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1010644c9858SDmitry Fleytman         }
1011644c9858SDmitry Fleytman 
10122974e916SYuri Benditovich         n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10132974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4);
10142974e916SYuri Benditovich         n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) &&
10152974e916SYuri Benditovich             virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6);
10162974e916SYuri Benditovich         virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT);
10172974e916SYuri Benditovich 
1018644c9858SDmitry Fleytman         supported_offloads = virtio_net_supported_guest_offloads(n);
1019644c9858SDmitry Fleytman         if (offloads & ~supported_offloads) {
1020644c9858SDmitry Fleytman             return VIRTIO_NET_ERR;
1021644c9858SDmitry Fleytman         }
1022644c9858SDmitry Fleytman 
1023644c9858SDmitry Fleytman         n->curr_guest_offloads = offloads;
1024644c9858SDmitry Fleytman         virtio_net_apply_guest_offloads(n);
1025644c9858SDmitry Fleytman 
1026644c9858SDmitry Fleytman         return VIRTIO_NET_OK;
1027644c9858SDmitry Fleytman     } else {
1028644c9858SDmitry Fleytman         return VIRTIO_NET_ERR;
1029644c9858SDmitry Fleytman     }
1030644c9858SDmitry Fleytman }
1031644c9858SDmitry Fleytman 
10326e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
10336e790746SPaolo Bonzini                                  struct iovec *iov, unsigned int iov_cnt)
10346e790746SPaolo Bonzini {
10351399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
10366e790746SPaolo Bonzini     struct virtio_net_ctrl_mac mac_data;
10376e790746SPaolo Bonzini     size_t s;
1038b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
10396e790746SPaolo Bonzini 
10406e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
10416e790746SPaolo Bonzini         if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
10426e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
10436e790746SPaolo Bonzini         }
10446e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
10456e790746SPaolo Bonzini         assert(s == sizeof(n->mac));
10466e790746SPaolo Bonzini         qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
1047b1be4280SAmos Kong         rxfilter_notify(nc);
1048b1be4280SAmos Kong 
10496e790746SPaolo Bonzini         return VIRTIO_NET_OK;
10506e790746SPaolo Bonzini     }
10516e790746SPaolo Bonzini 
10526e790746SPaolo Bonzini     if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
10536e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
10546e790746SPaolo Bonzini     }
10556e790746SPaolo Bonzini 
1056cae2e556SAmos Kong     int in_use = 0;
1057cae2e556SAmos Kong     int first_multi = 0;
1058cae2e556SAmos Kong     uint8_t uni_overflow = 0;
1059cae2e556SAmos Kong     uint8_t multi_overflow = 0;
1060cae2e556SAmos Kong     uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
10616e790746SPaolo Bonzini 
10626e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10636e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10641399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10656e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1066b1be4280SAmos Kong         goto error;
10676e790746SPaolo Bonzini     }
10686e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10696e790746SPaolo Bonzini 
10706e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
1071b1be4280SAmos Kong         goto error;
10726e790746SPaolo Bonzini     }
10736e790746SPaolo Bonzini 
10746e790746SPaolo Bonzini     if (mac_data.entries <= MAC_TABLE_ENTRIES) {
1075cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, macs,
10766e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
10776e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1078b1be4280SAmos Kong             goto error;
10796e790746SPaolo Bonzini         }
1080cae2e556SAmos Kong         in_use += mac_data.entries;
10816e790746SPaolo Bonzini     } else {
1082cae2e556SAmos Kong         uni_overflow = 1;
10836e790746SPaolo Bonzini     }
10846e790746SPaolo Bonzini 
10856e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
10866e790746SPaolo Bonzini 
1087cae2e556SAmos Kong     first_multi = in_use;
10886e790746SPaolo Bonzini 
10896e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
10906e790746SPaolo Bonzini                    sizeof(mac_data.entries));
10911399c60dSRusty Russell     mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
10926e790746SPaolo Bonzini     if (s != sizeof(mac_data.entries)) {
1093b1be4280SAmos Kong         goto error;
10946e790746SPaolo Bonzini     }
10956e790746SPaolo Bonzini 
10966e790746SPaolo Bonzini     iov_discard_front(&iov, &iov_cnt, s);
10976e790746SPaolo Bonzini 
10986e790746SPaolo Bonzini     if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
1099b1be4280SAmos Kong         goto error;
11006e790746SPaolo Bonzini     }
11016e790746SPaolo Bonzini 
1102edc24385SMichael S. Tsirkin     if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
1103cae2e556SAmos Kong         s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
11046e790746SPaolo Bonzini                        mac_data.entries * ETH_ALEN);
11056e790746SPaolo Bonzini         if (s != mac_data.entries * ETH_ALEN) {
1106b1be4280SAmos Kong             goto error;
11076e790746SPaolo Bonzini         }
1108cae2e556SAmos Kong         in_use += mac_data.entries;
11096e790746SPaolo Bonzini     } else {
1110cae2e556SAmos Kong         multi_overflow = 1;
11116e790746SPaolo Bonzini     }
11126e790746SPaolo Bonzini 
1113cae2e556SAmos Kong     n->mac_table.in_use = in_use;
1114cae2e556SAmos Kong     n->mac_table.first_multi = first_multi;
1115cae2e556SAmos Kong     n->mac_table.uni_overflow = uni_overflow;
1116cae2e556SAmos Kong     n->mac_table.multi_overflow = multi_overflow;
1117cae2e556SAmos Kong     memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
1118cae2e556SAmos Kong     g_free(macs);
1119b1be4280SAmos Kong     rxfilter_notify(nc);
1120b1be4280SAmos Kong 
11216e790746SPaolo Bonzini     return VIRTIO_NET_OK;
1122b1be4280SAmos Kong 
1123b1be4280SAmos Kong error:
1124cae2e556SAmos Kong     g_free(macs);
1125b1be4280SAmos Kong     return VIRTIO_NET_ERR;
11266e790746SPaolo Bonzini }
11276e790746SPaolo Bonzini 
11286e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
11296e790746SPaolo Bonzini                                         struct iovec *iov, unsigned int iov_cnt)
11306e790746SPaolo Bonzini {
11311399c60dSRusty Russell     VirtIODevice *vdev = VIRTIO_DEVICE(n);
11326e790746SPaolo Bonzini     uint16_t vid;
11336e790746SPaolo Bonzini     size_t s;
1134b1be4280SAmos Kong     NetClientState *nc = qemu_get_queue(n->nic);
11356e790746SPaolo Bonzini 
11366e790746SPaolo Bonzini     s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
11371399c60dSRusty Russell     vid = virtio_lduw_p(vdev, &vid);
11386e790746SPaolo Bonzini     if (s != sizeof(vid)) {
11396e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11406e790746SPaolo Bonzini     }
11416e790746SPaolo Bonzini 
11426e790746SPaolo Bonzini     if (vid >= MAX_VLAN)
11436e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11446e790746SPaolo Bonzini 
11456e790746SPaolo Bonzini     if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
11466e790746SPaolo Bonzini         n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
11476e790746SPaolo Bonzini     else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
11486e790746SPaolo Bonzini         n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
11496e790746SPaolo Bonzini     else
11506e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
11516e790746SPaolo Bonzini 
1152b1be4280SAmos Kong     rxfilter_notify(nc);
1153b1be4280SAmos Kong 
11546e790746SPaolo Bonzini     return VIRTIO_NET_OK;
11556e790746SPaolo Bonzini }
11566e790746SPaolo Bonzini 
1157f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd,
1158f57fcf70SJason Wang                                       struct iovec *iov, unsigned int iov_cnt)
1159f57fcf70SJason Wang {
11609d8c6a25SDr. David Alan Gilbert     trace_virtio_net_handle_announce(n->announce_timer.round);
1161f57fcf70SJason Wang     if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK &&
1162f57fcf70SJason Wang         n->status & VIRTIO_NET_S_ANNOUNCE) {
1163f57fcf70SJason Wang         n->status &= ~VIRTIO_NET_S_ANNOUNCE;
11649d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
11659d8c6a25SDr. David Alan Gilbert             qemu_announce_timer_step(&n->announce_timer);
1166f57fcf70SJason Wang         }
1167f57fcf70SJason Wang         return VIRTIO_NET_OK;
1168f57fcf70SJason Wang     } else {
1169f57fcf70SJason Wang         return VIRTIO_NET_ERR;
1170f57fcf70SJason Wang     }
1171f57fcf70SJason Wang }
1172f57fcf70SJason Wang 
11730145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n);
11740145c393SAndrew Melnychenko 
117559079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n)
117659079029SYuri Benditovich {
117759079029SYuri Benditovich     if (n->rss_data.enabled) {
117859079029SYuri Benditovich         trace_virtio_net_rss_disable();
117959079029SYuri Benditovich     }
118059079029SYuri Benditovich     n->rss_data.enabled = false;
11810145c393SAndrew Melnychenko 
11820145c393SAndrew Melnychenko     virtio_net_detach_epbf_rss(n);
11830145c393SAndrew Melnychenko }
11840145c393SAndrew Melnychenko 
11850145c393SAndrew Melnychenko static bool virtio_net_attach_ebpf_to_backend(NICState *nic, int prog_fd)
11860145c393SAndrew Melnychenko {
11870145c393SAndrew Melnychenko     NetClientState *nc = qemu_get_peer(qemu_get_queue(nic), 0);
11880145c393SAndrew Melnychenko     if (nc == NULL || nc->info->set_steering_ebpf == NULL) {
11890145c393SAndrew Melnychenko         return false;
11900145c393SAndrew Melnychenko     }
11910145c393SAndrew Melnychenko 
11920145c393SAndrew Melnychenko     return nc->info->set_steering_ebpf(nc, prog_fd);
11930145c393SAndrew Melnychenko }
11940145c393SAndrew Melnychenko 
11950145c393SAndrew Melnychenko static void rss_data_to_rss_config(struct VirtioNetRssData *data,
11960145c393SAndrew Melnychenko                                    struct EBPFRSSConfig *config)
11970145c393SAndrew Melnychenko {
11980145c393SAndrew Melnychenko     config->redirect = data->redirect;
11990145c393SAndrew Melnychenko     config->populate_hash = data->populate_hash;
12000145c393SAndrew Melnychenko     config->hash_types = data->hash_types;
12010145c393SAndrew Melnychenko     config->indirections_len = data->indirections_len;
12020145c393SAndrew Melnychenko     config->default_queue = data->default_queue;
12030145c393SAndrew Melnychenko }
12040145c393SAndrew Melnychenko 
12050145c393SAndrew Melnychenko static bool virtio_net_attach_epbf_rss(VirtIONet *n)
12060145c393SAndrew Melnychenko {
12070145c393SAndrew Melnychenko     struct EBPFRSSConfig config = {};
12080145c393SAndrew Melnychenko 
12090145c393SAndrew Melnychenko     if (!ebpf_rss_is_loaded(&n->ebpf_rss)) {
12100145c393SAndrew Melnychenko         return false;
12110145c393SAndrew Melnychenko     }
12120145c393SAndrew Melnychenko 
12130145c393SAndrew Melnychenko     rss_data_to_rss_config(&n->rss_data, &config);
12140145c393SAndrew Melnychenko 
12150145c393SAndrew Melnychenko     if (!ebpf_rss_set_all(&n->ebpf_rss, &config,
12160145c393SAndrew Melnychenko                           n->rss_data.indirections_table, n->rss_data.key)) {
12170145c393SAndrew Melnychenko         return false;
12180145c393SAndrew Melnychenko     }
12190145c393SAndrew Melnychenko 
12200145c393SAndrew Melnychenko     if (!virtio_net_attach_ebpf_to_backend(n->nic, n->ebpf_rss.program_fd)) {
12210145c393SAndrew Melnychenko         return false;
12220145c393SAndrew Melnychenko     }
12230145c393SAndrew Melnychenko 
12240145c393SAndrew Melnychenko     return true;
12250145c393SAndrew Melnychenko }
12260145c393SAndrew Melnychenko 
12270145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n)
12280145c393SAndrew Melnychenko {
12290145c393SAndrew Melnychenko     virtio_net_attach_ebpf_to_backend(n->nic, -1);
12300145c393SAndrew Melnychenko }
12310145c393SAndrew Melnychenko 
12320145c393SAndrew Melnychenko static bool virtio_net_load_ebpf(VirtIONet *n)
12330145c393SAndrew Melnychenko {
12340145c393SAndrew Melnychenko     if (!virtio_net_attach_ebpf_to_backend(n->nic, -1)) {
12350145c393SAndrew Melnychenko         /* backend does't support steering ebpf */
12360145c393SAndrew Melnychenko         return false;
12370145c393SAndrew Melnychenko     }
12380145c393SAndrew Melnychenko 
12390145c393SAndrew Melnychenko     return ebpf_rss_load(&n->ebpf_rss);
12400145c393SAndrew Melnychenko }
12410145c393SAndrew Melnychenko 
12420145c393SAndrew Melnychenko static void virtio_net_unload_ebpf(VirtIONet *n)
12430145c393SAndrew Melnychenko {
12440145c393SAndrew Melnychenko     virtio_net_attach_ebpf_to_backend(n->nic, -1);
12450145c393SAndrew Melnychenko     ebpf_rss_unload(&n->ebpf_rss);
124659079029SYuri Benditovich }
124759079029SYuri Benditovich 
124859079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n,
1249e22f0603SYuri Benditovich                                       struct iovec *iov,
1250e22f0603SYuri Benditovich                                       unsigned int iov_cnt,
1251e22f0603SYuri Benditovich                                       bool do_rss)
125259079029SYuri Benditovich {
125359079029SYuri Benditovich     VirtIODevice *vdev = VIRTIO_DEVICE(n);
125459079029SYuri Benditovich     struct virtio_net_rss_config cfg;
125559079029SYuri Benditovich     size_t s, offset = 0, size_get;
1256441537f1SJason Wang     uint16_t queue_pairs, i;
125759079029SYuri Benditovich     struct {
125859079029SYuri Benditovich         uint16_t us;
125959079029SYuri Benditovich         uint8_t b;
126059079029SYuri Benditovich     } QEMU_PACKED temp;
126159079029SYuri Benditovich     const char *err_msg = "";
126259079029SYuri Benditovich     uint32_t err_value = 0;
126359079029SYuri Benditovich 
1264e22f0603SYuri Benditovich     if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) {
126559079029SYuri Benditovich         err_msg = "RSS is not negotiated";
126659079029SYuri Benditovich         goto error;
126759079029SYuri Benditovich     }
1268e22f0603SYuri Benditovich     if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) {
1269e22f0603SYuri Benditovich         err_msg = "Hash report is not negotiated";
1270e22f0603SYuri Benditovich         goto error;
1271e22f0603SYuri Benditovich     }
127259079029SYuri Benditovich     size_get = offsetof(struct virtio_net_rss_config, indirection_table);
127359079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get);
127459079029SYuri Benditovich     if (s != size_get) {
127559079029SYuri Benditovich         err_msg = "Short command buffer";
127659079029SYuri Benditovich         err_value = (uint32_t)s;
127759079029SYuri Benditovich         goto error;
127859079029SYuri Benditovich     }
127959079029SYuri Benditovich     n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types);
128059079029SYuri Benditovich     n->rss_data.indirections_len =
128159079029SYuri Benditovich         virtio_lduw_p(vdev, &cfg.indirection_table_mask);
128259079029SYuri Benditovich     n->rss_data.indirections_len++;
1283e22f0603SYuri Benditovich     if (!do_rss) {
1284e22f0603SYuri Benditovich         n->rss_data.indirections_len = 1;
1285e22f0603SYuri Benditovich     }
128659079029SYuri Benditovich     if (!is_power_of_2(n->rss_data.indirections_len)) {
128759079029SYuri Benditovich         err_msg = "Invalid size of indirection table";
128859079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
128959079029SYuri Benditovich         goto error;
129059079029SYuri Benditovich     }
129159079029SYuri Benditovich     if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) {
129259079029SYuri Benditovich         err_msg = "Too large indirection table";
129359079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
129459079029SYuri Benditovich         goto error;
129559079029SYuri Benditovich     }
1296e22f0603SYuri Benditovich     n->rss_data.default_queue = do_rss ?
1297e22f0603SYuri Benditovich         virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0;
1298441537f1SJason Wang     if (n->rss_data.default_queue >= n->max_queue_pairs) {
129959079029SYuri Benditovich         err_msg = "Invalid default queue";
130059079029SYuri Benditovich         err_value = n->rss_data.default_queue;
130159079029SYuri Benditovich         goto error;
130259079029SYuri Benditovich     }
130359079029SYuri Benditovich     offset += size_get;
130459079029SYuri Benditovich     size_get = sizeof(uint16_t) * n->rss_data.indirections_len;
130559079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
130659079029SYuri Benditovich     n->rss_data.indirections_table = g_malloc(size_get);
130759079029SYuri Benditovich     if (!n->rss_data.indirections_table) {
130859079029SYuri Benditovich         err_msg = "Can't allocate indirections table";
130959079029SYuri Benditovich         err_value = n->rss_data.indirections_len;
131059079029SYuri Benditovich         goto error;
131159079029SYuri Benditovich     }
131259079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset,
131359079029SYuri Benditovich                    n->rss_data.indirections_table, size_get);
131459079029SYuri Benditovich     if (s != size_get) {
131559079029SYuri Benditovich         err_msg = "Short indirection table buffer";
131659079029SYuri Benditovich         err_value = (uint32_t)s;
131759079029SYuri Benditovich         goto error;
131859079029SYuri Benditovich     }
131959079029SYuri Benditovich     for (i = 0; i < n->rss_data.indirections_len; ++i) {
132059079029SYuri Benditovich         uint16_t val = n->rss_data.indirections_table[i];
132159079029SYuri Benditovich         n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val);
132259079029SYuri Benditovich     }
132359079029SYuri Benditovich     offset += size_get;
132459079029SYuri Benditovich     size_get = sizeof(temp);
132559079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get);
132659079029SYuri Benditovich     if (s != size_get) {
1327441537f1SJason Wang         err_msg = "Can't get queue_pairs";
132859079029SYuri Benditovich         err_value = (uint32_t)s;
132959079029SYuri Benditovich         goto error;
133059079029SYuri Benditovich     }
1331441537f1SJason Wang     queue_pairs = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queue_pairs;
1332441537f1SJason Wang     if (queue_pairs == 0 || queue_pairs > n->max_queue_pairs) {
1333441537f1SJason Wang         err_msg = "Invalid number of queue_pairs";
1334441537f1SJason Wang         err_value = queue_pairs;
133559079029SYuri Benditovich         goto error;
133659079029SYuri Benditovich     }
133759079029SYuri Benditovich     if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) {
133859079029SYuri Benditovich         err_msg = "Invalid key size";
133959079029SYuri Benditovich         err_value = temp.b;
134059079029SYuri Benditovich         goto error;
134159079029SYuri Benditovich     }
134259079029SYuri Benditovich     if (!temp.b && n->rss_data.hash_types) {
134359079029SYuri Benditovich         err_msg = "No key provided";
134459079029SYuri Benditovich         err_value = 0;
134559079029SYuri Benditovich         goto error;
134659079029SYuri Benditovich     }
134759079029SYuri Benditovich     if (!temp.b && !n->rss_data.hash_types) {
134859079029SYuri Benditovich         virtio_net_disable_rss(n);
1349441537f1SJason Wang         return queue_pairs;
135059079029SYuri Benditovich     }
135159079029SYuri Benditovich     offset += size_get;
135259079029SYuri Benditovich     size_get = temp.b;
135359079029SYuri Benditovich     s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get);
135459079029SYuri Benditovich     if (s != size_get) {
135559079029SYuri Benditovich         err_msg = "Can get key buffer";
135659079029SYuri Benditovich         err_value = (uint32_t)s;
135759079029SYuri Benditovich         goto error;
135859079029SYuri Benditovich     }
135959079029SYuri Benditovich     n->rss_data.enabled = true;
13600145c393SAndrew Melnychenko 
13610145c393SAndrew Melnychenko     if (!n->rss_data.populate_hash) {
13620145c393SAndrew Melnychenko         if (!virtio_net_attach_epbf_rss(n)) {
13630145c393SAndrew Melnychenko             /* EBPF must be loaded for vhost */
13640145c393SAndrew Melnychenko             if (get_vhost_net(qemu_get_queue(n->nic)->peer)) {
13650145c393SAndrew Melnychenko                 warn_report("Can't load eBPF RSS for vhost");
13660145c393SAndrew Melnychenko                 goto error;
13670145c393SAndrew Melnychenko             }
13680145c393SAndrew Melnychenko             /* fallback to software RSS */
13690145c393SAndrew Melnychenko             warn_report("Can't load eBPF RSS - fallback to software RSS");
13700145c393SAndrew Melnychenko             n->rss_data.enabled_software_rss = true;
13710145c393SAndrew Melnychenko         }
13720145c393SAndrew Melnychenko     } else {
13730145c393SAndrew Melnychenko         /* use software RSS for hash populating */
13740145c393SAndrew Melnychenko         /* and detach eBPF if was loaded before */
13750145c393SAndrew Melnychenko         virtio_net_detach_epbf_rss(n);
13760145c393SAndrew Melnychenko         n->rss_data.enabled_software_rss = true;
13770145c393SAndrew Melnychenko     }
13780145c393SAndrew Melnychenko 
137959079029SYuri Benditovich     trace_virtio_net_rss_enable(n->rss_data.hash_types,
138059079029SYuri Benditovich                                 n->rss_data.indirections_len,
138159079029SYuri Benditovich                                 temp.b);
1382441537f1SJason Wang     return queue_pairs;
138359079029SYuri Benditovich error:
138459079029SYuri Benditovich     trace_virtio_net_rss_error(err_msg, err_value);
138559079029SYuri Benditovich     virtio_net_disable_rss(n);
138659079029SYuri Benditovich     return 0;
138759079029SYuri Benditovich }
138859079029SYuri Benditovich 
13896e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
13906e790746SPaolo Bonzini                                 struct iovec *iov, unsigned int iov_cnt)
13916e790746SPaolo Bonzini {
139217a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1393441537f1SJason Wang     uint16_t queue_pairs;
13942a7888ccSSi-Wei Liu     NetClientState *nc = qemu_get_queue(n->nic);
13956e790746SPaolo Bonzini 
139659079029SYuri Benditovich     virtio_net_disable_rss(n);
1397e22f0603SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) {
1398441537f1SJason Wang         queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, false);
1399441537f1SJason Wang         return queue_pairs ? VIRTIO_NET_OK : VIRTIO_NET_ERR;
1400e22f0603SYuri Benditovich     }
140159079029SYuri Benditovich     if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) {
1402441537f1SJason Wang         queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, true);
140359079029SYuri Benditovich     } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
140459079029SYuri Benditovich         struct virtio_net_ctrl_mq mq;
140559079029SYuri Benditovich         size_t s;
140659079029SYuri Benditovich         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) {
140759079029SYuri Benditovich             return VIRTIO_NET_ERR;
140859079029SYuri Benditovich         }
14096e790746SPaolo Bonzini         s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
14106e790746SPaolo Bonzini         if (s != sizeof(mq)) {
14116e790746SPaolo Bonzini             return VIRTIO_NET_ERR;
14126e790746SPaolo Bonzini         }
1413441537f1SJason Wang         queue_pairs = virtio_lduw_p(vdev, &mq.virtqueue_pairs);
14146e790746SPaolo Bonzini 
141559079029SYuri Benditovich     } else {
14166e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
14176e790746SPaolo Bonzini     }
14186e790746SPaolo Bonzini 
1419441537f1SJason Wang     if (queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
1420441537f1SJason Wang         queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
1421441537f1SJason Wang         queue_pairs > n->max_queue_pairs ||
14226e790746SPaolo Bonzini         !n->multiqueue) {
14236e790746SPaolo Bonzini         return VIRTIO_NET_ERR;
14246e790746SPaolo Bonzini     }
14256e790746SPaolo Bonzini 
1426441537f1SJason Wang     n->curr_queue_pairs = queue_pairs;
1427ca8717f9SEugenio Pérez     if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
1428ca8717f9SEugenio Pérez         /*
1429ca8717f9SEugenio Pérez          * Avoid updating the backend for a vdpa device: We're only interested
1430ca8717f9SEugenio Pérez          * in updating the device model queues.
1431ca8717f9SEugenio Pérez          */
1432ca8717f9SEugenio Pérez         return VIRTIO_NET_OK;
1433ca8717f9SEugenio Pérez     }
1434441537f1SJason Wang     /* stop the backend before changing the number of queue_pairs to avoid handling a
14356e790746SPaolo Bonzini      * disabled queue */
143617a0ca55SKONRAD Frederic     virtio_net_set_status(vdev, vdev->status);
1437441537f1SJason Wang     virtio_net_set_queue_pairs(n);
14386e790746SPaolo Bonzini 
14396e790746SPaolo Bonzini     return VIRTIO_NET_OK;
14406e790746SPaolo Bonzini }
1441ba7eadb5SGreg Kurz 
1442640b8a1cSEugenio Pérez size_t virtio_net_handle_ctrl_iov(VirtIODevice *vdev,
1443640b8a1cSEugenio Pérez                                   const struct iovec *in_sg, unsigned in_num,
1444640b8a1cSEugenio Pérez                                   const struct iovec *out_sg,
1445640b8a1cSEugenio Pérez                                   unsigned out_num)
14466e790746SPaolo Bonzini {
144717a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
14486e790746SPaolo Bonzini     struct virtio_net_ctrl_hdr ctrl;
14496e790746SPaolo Bonzini     virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
14506e790746SPaolo Bonzini     size_t s;
1451771b6ed3SJason Wang     struct iovec *iov, *iov2;
1452640b8a1cSEugenio Pérez 
1453640b8a1cSEugenio Pérez     if (iov_size(in_sg, in_num) < sizeof(status) ||
1454640b8a1cSEugenio Pérez         iov_size(out_sg, out_num) < sizeof(ctrl)) {
1455640b8a1cSEugenio Pérez         virtio_error(vdev, "virtio-net ctrl missing headers");
1456640b8a1cSEugenio Pérez         return 0;
1457640b8a1cSEugenio Pérez     }
1458640b8a1cSEugenio Pérez 
1459640b8a1cSEugenio Pérez     iov2 = iov = g_memdup2(out_sg, sizeof(struct iovec) * out_num);
1460640b8a1cSEugenio Pérez     s = iov_to_buf(iov, out_num, 0, &ctrl, sizeof(ctrl));
1461640b8a1cSEugenio Pérez     iov_discard_front(&iov, &out_num, sizeof(ctrl));
1462640b8a1cSEugenio Pérez     if (s != sizeof(ctrl)) {
1463640b8a1cSEugenio Pérez         status = VIRTIO_NET_ERR;
1464640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
1465640b8a1cSEugenio Pérez         status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, out_num);
1466640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
1467640b8a1cSEugenio Pérez         status = virtio_net_handle_mac(n, ctrl.cmd, iov, out_num);
1468640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
1469640b8a1cSEugenio Pérez         status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, out_num);
1470640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) {
1471640b8a1cSEugenio Pérez         status = virtio_net_handle_announce(n, ctrl.cmd, iov, out_num);
1472640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
1473640b8a1cSEugenio Pérez         status = virtio_net_handle_mq(n, ctrl.cmd, iov, out_num);
1474640b8a1cSEugenio Pérez     } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
1475640b8a1cSEugenio Pérez         status = virtio_net_handle_offloads(n, ctrl.cmd, iov, out_num);
1476640b8a1cSEugenio Pérez     }
1477640b8a1cSEugenio Pérez 
1478640b8a1cSEugenio Pérez     s = iov_from_buf(in_sg, in_num, 0, &status, sizeof(status));
1479640b8a1cSEugenio Pérez     assert(s == sizeof(status));
1480640b8a1cSEugenio Pérez 
1481640b8a1cSEugenio Pérez     g_free(iov2);
1482640b8a1cSEugenio Pérez     return sizeof(status);
1483640b8a1cSEugenio Pérez }
1484640b8a1cSEugenio Pérez 
1485640b8a1cSEugenio Pérez static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
1486640b8a1cSEugenio Pérez {
1487640b8a1cSEugenio Pérez     VirtQueueElement *elem;
14886e790746SPaolo Bonzini 
148951b19ebeSPaolo Bonzini     for (;;) {
1490640b8a1cSEugenio Pérez         size_t written;
149151b19ebeSPaolo Bonzini         elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
149251b19ebeSPaolo Bonzini         if (!elem) {
149351b19ebeSPaolo Bonzini             break;
149451b19ebeSPaolo Bonzini         }
1495640b8a1cSEugenio Pérez 
1496640b8a1cSEugenio Pérez         written = virtio_net_handle_ctrl_iov(vdev, elem->in_sg, elem->in_num,
1497640b8a1cSEugenio Pérez                                              elem->out_sg, elem->out_num);
1498640b8a1cSEugenio Pérez         if (written > 0) {
1499640b8a1cSEugenio Pérez             virtqueue_push(vq, elem, written);
1500640b8a1cSEugenio Pérez             virtio_notify(vdev, vq);
1501640b8a1cSEugenio Pérez             g_free(elem);
1502640b8a1cSEugenio Pérez         } else {
1503ba7eadb5SGreg Kurz             virtqueue_detach_element(vq, elem, 0);
1504ba7eadb5SGreg Kurz             g_free(elem);
1505ba7eadb5SGreg Kurz             break;
15066e790746SPaolo Bonzini         }
15076e790746SPaolo Bonzini     }
15086e790746SPaolo Bonzini }
15096e790746SPaolo Bonzini 
15106e790746SPaolo Bonzini /* RX */
15116e790746SPaolo Bonzini 
15126e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
15136e790746SPaolo Bonzini {
151417a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
15156e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(vq));
15166e790746SPaolo Bonzini 
15176e790746SPaolo Bonzini     qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
15186e790746SPaolo Bonzini }
15196e790746SPaolo Bonzini 
1520b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc)
15216e790746SPaolo Bonzini {
15226e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
152317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
15246e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
15256e790746SPaolo Bonzini 
152617a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
1527b8c4b67eSPhilippe Mathieu-Daudé         return false;
15286e790746SPaolo Bonzini     }
15296e790746SPaolo Bonzini 
1530441537f1SJason Wang     if (nc->queue_index >= n->curr_queue_pairs) {
1531b8c4b67eSPhilippe Mathieu-Daudé         return false;
15326e790746SPaolo Bonzini     }
15336e790746SPaolo Bonzini 
15346e790746SPaolo Bonzini     if (!virtio_queue_ready(q->rx_vq) ||
153517a0ca55SKONRAD Frederic         !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
1536b8c4b67eSPhilippe Mathieu-Daudé         return false;
15376e790746SPaolo Bonzini     }
15386e790746SPaolo Bonzini 
1539b8c4b67eSPhilippe Mathieu-Daudé     return true;
15406e790746SPaolo Bonzini }
15416e790746SPaolo Bonzini 
15426e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
15436e790746SPaolo Bonzini {
15446e790746SPaolo Bonzini     VirtIONet *n = q->n;
15456e790746SPaolo Bonzini     if (virtio_queue_empty(q->rx_vq) ||
15466e790746SPaolo Bonzini         (n->mergeable_rx_bufs &&
15476e790746SPaolo Bonzini          !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
15486e790746SPaolo Bonzini         virtio_queue_set_notification(q->rx_vq, 1);
15496e790746SPaolo Bonzini 
15506e790746SPaolo Bonzini         /* To avoid a race condition where the guest has made some buffers
15516e790746SPaolo Bonzini          * available after the above check but before notification was
15526e790746SPaolo Bonzini          * enabled, check for available buffers again.
15536e790746SPaolo Bonzini          */
15546e790746SPaolo Bonzini         if (virtio_queue_empty(q->rx_vq) ||
15556e790746SPaolo Bonzini             (n->mergeable_rx_bufs &&
15566e790746SPaolo Bonzini              !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
15576e790746SPaolo Bonzini             return 0;
15586e790746SPaolo Bonzini         }
15596e790746SPaolo Bonzini     }
15606e790746SPaolo Bonzini 
15616e790746SPaolo Bonzini     virtio_queue_set_notification(q->rx_vq, 0);
15626e790746SPaolo Bonzini     return 1;
15636e790746SPaolo Bonzini }
15646e790746SPaolo Bonzini 
15651399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr)
1566032a74a1SCédric Le Goater {
15671399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->hdr_len);
15681399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->gso_size);
15691399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_start);
15701399c60dSRusty Russell     virtio_tswap16s(vdev, &hdr->csum_offset);
1571032a74a1SCédric Le Goater }
1572032a74a1SCédric Le Goater 
15736e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
15746e790746SPaolo Bonzini  * it never finds out that the packets don't have valid checksums.  This
15756e790746SPaolo Bonzini  * causes dhclient to get upset.  Fedora's carried a patch for ages to
15766e790746SPaolo Bonzini  * fix this with Xen but it hasn't appeared in an upstream release of
15776e790746SPaolo Bonzini  * dhclient yet.
15786e790746SPaolo Bonzini  *
15796e790746SPaolo Bonzini  * To avoid breaking existing guests, we catch udp packets and add
15806e790746SPaolo Bonzini  * checksums.  This is terrible but it's better than hacking the guest
15816e790746SPaolo Bonzini  * kernels.
15826e790746SPaolo Bonzini  *
15836e790746SPaolo Bonzini  * N.B. if we introduce a zero-copy API, this operation is no longer free so
15846e790746SPaolo Bonzini  * we should provide a mechanism to disable it to avoid polluting the host
15856e790746SPaolo Bonzini  * cache.
15866e790746SPaolo Bonzini  */
15876e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
15886e790746SPaolo Bonzini                                         uint8_t *buf, size_t size)
15896e790746SPaolo Bonzini {
15906e790746SPaolo Bonzini     if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
15916e790746SPaolo Bonzini         (size > 27 && size < 1500) && /* normal sized MTU */
15926e790746SPaolo Bonzini         (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
15936e790746SPaolo Bonzini         (buf[23] == 17) && /* ip.protocol == UDP */
15946e790746SPaolo Bonzini         (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
1595f5746335SBin Meng         net_checksum_calculate(buf, size, CSUM_UDP);
15966e790746SPaolo Bonzini         hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
15976e790746SPaolo Bonzini     }
15986e790746SPaolo Bonzini }
15996e790746SPaolo Bonzini 
16006e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
16016e790746SPaolo Bonzini                            const void *buf, size_t size)
16026e790746SPaolo Bonzini {
16036e790746SPaolo Bonzini     if (n->has_vnet_hdr) {
16046e790746SPaolo Bonzini         /* FIXME this cast is evil */
16056e790746SPaolo Bonzini         void *wbuf = (void *)buf;
16066e790746SPaolo Bonzini         work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
16076e790746SPaolo Bonzini                                     size - n->host_hdr_len);
16081bfa316cSGreg Kurz 
16091bfa316cSGreg Kurz         if (n->needs_vnet_hdr_swap) {
16101399c60dSRusty Russell             virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf);
16111bfa316cSGreg Kurz         }
16126e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
16136e790746SPaolo Bonzini     } else {
16146e790746SPaolo Bonzini         struct virtio_net_hdr hdr = {
16156e790746SPaolo Bonzini             .flags = 0,
16166e790746SPaolo Bonzini             .gso_type = VIRTIO_NET_HDR_GSO_NONE
16176e790746SPaolo Bonzini         };
16186e790746SPaolo Bonzini         iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
16196e790746SPaolo Bonzini     }
16206e790746SPaolo Bonzini }
16216e790746SPaolo Bonzini 
16226e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
16236e790746SPaolo Bonzini {
16246e790746SPaolo Bonzini     static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
16256e790746SPaolo Bonzini     static const uint8_t vlan[] = {0x81, 0x00};
16266e790746SPaolo Bonzini     uint8_t *ptr = (uint8_t *)buf;
16276e790746SPaolo Bonzini     int i;
16286e790746SPaolo Bonzini 
16296e790746SPaolo Bonzini     if (n->promisc)
16306e790746SPaolo Bonzini         return 1;
16316e790746SPaolo Bonzini 
16326e790746SPaolo Bonzini     ptr += n->host_hdr_len;
16336e790746SPaolo Bonzini 
16346e790746SPaolo Bonzini     if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
16357542d3e7SPeter Maydell         int vid = lduw_be_p(ptr + 14) & 0xfff;
16366e790746SPaolo Bonzini         if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
16376e790746SPaolo Bonzini             return 0;
16386e790746SPaolo Bonzini     }
16396e790746SPaolo Bonzini 
16406e790746SPaolo Bonzini     if (ptr[0] & 1) { // multicast
16416e790746SPaolo Bonzini         if (!memcmp(ptr, bcast, sizeof(bcast))) {
16426e790746SPaolo Bonzini             return !n->nobcast;
16436e790746SPaolo Bonzini         } else if (n->nomulti) {
16446e790746SPaolo Bonzini             return 0;
16456e790746SPaolo Bonzini         } else if (n->allmulti || n->mac_table.multi_overflow) {
16466e790746SPaolo Bonzini             return 1;
16476e790746SPaolo Bonzini         }
16486e790746SPaolo Bonzini 
16496e790746SPaolo Bonzini         for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
16506e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
16516e790746SPaolo Bonzini                 return 1;
16526e790746SPaolo Bonzini             }
16536e790746SPaolo Bonzini         }
16546e790746SPaolo Bonzini     } else { // unicast
16556e790746SPaolo Bonzini         if (n->nouni) {
16566e790746SPaolo Bonzini             return 0;
16576e790746SPaolo Bonzini         } else if (n->alluni || n->mac_table.uni_overflow) {
16586e790746SPaolo Bonzini             return 1;
16596e790746SPaolo Bonzini         } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
16606e790746SPaolo Bonzini             return 1;
16616e790746SPaolo Bonzini         }
16626e790746SPaolo Bonzini 
16636e790746SPaolo Bonzini         for (i = 0; i < n->mac_table.first_multi; i++) {
16646e790746SPaolo Bonzini             if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
16656e790746SPaolo Bonzini                 return 1;
16666e790746SPaolo Bonzini             }
16676e790746SPaolo Bonzini         }
16686e790746SPaolo Bonzini     }
16696e790746SPaolo Bonzini 
16706e790746SPaolo Bonzini     return 0;
16716e790746SPaolo Bonzini }
16726e790746SPaolo Bonzini 
16734474e37aSYuri Benditovich static uint8_t virtio_net_get_hash_type(bool isip4,
16744474e37aSYuri Benditovich                                         bool isip6,
16754474e37aSYuri Benditovich                                         bool isudp,
16764474e37aSYuri Benditovich                                         bool istcp,
16774474e37aSYuri Benditovich                                         uint32_t types)
16784474e37aSYuri Benditovich {
16794474e37aSYuri Benditovich     if (isip4) {
16804474e37aSYuri Benditovich         if (istcp && (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4)) {
16814474e37aSYuri Benditovich             return NetPktRssIpV4Tcp;
16824474e37aSYuri Benditovich         }
16834474e37aSYuri Benditovich         if (isudp && (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4)) {
16844474e37aSYuri Benditovich             return NetPktRssIpV4Udp;
16854474e37aSYuri Benditovich         }
16864474e37aSYuri Benditovich         if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) {
16874474e37aSYuri Benditovich             return NetPktRssIpV4;
16884474e37aSYuri Benditovich         }
16894474e37aSYuri Benditovich     } else if (isip6) {
16904474e37aSYuri Benditovich         uint32_t mask = VIRTIO_NET_RSS_HASH_TYPE_TCP_EX |
16914474e37aSYuri Benditovich                         VIRTIO_NET_RSS_HASH_TYPE_TCPv6;
16924474e37aSYuri Benditovich 
16934474e37aSYuri Benditovich         if (istcp && (types & mask)) {
16944474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) ?
16954474e37aSYuri Benditovich                 NetPktRssIpV6TcpEx : NetPktRssIpV6Tcp;
16964474e37aSYuri Benditovich         }
16974474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_UDP_EX | VIRTIO_NET_RSS_HASH_TYPE_UDPv6;
16984474e37aSYuri Benditovich         if (isudp && (types & mask)) {
16994474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) ?
17004474e37aSYuri Benditovich                 NetPktRssIpV6UdpEx : NetPktRssIpV6Udp;
17014474e37aSYuri Benditovich         }
17024474e37aSYuri Benditovich         mask = VIRTIO_NET_RSS_HASH_TYPE_IP_EX | VIRTIO_NET_RSS_HASH_TYPE_IPv6;
17034474e37aSYuri Benditovich         if (types & mask) {
17044474e37aSYuri Benditovich             return (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) ?
17054474e37aSYuri Benditovich                 NetPktRssIpV6Ex : NetPktRssIpV6;
17064474e37aSYuri Benditovich         }
17074474e37aSYuri Benditovich     }
17084474e37aSYuri Benditovich     return 0xff;
17094474e37aSYuri Benditovich }
17104474e37aSYuri Benditovich 
1711e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report,
1712e22f0603SYuri Benditovich                                    uint32_t hash)
1713e22f0603SYuri Benditovich {
1714e22f0603SYuri Benditovich     struct virtio_net_hdr_v1_hash *hdr = (void *)buf;
1715e22f0603SYuri Benditovich     hdr->hash_value = hash;
1716e22f0603SYuri Benditovich     hdr->hash_report = report;
1717e22f0603SYuri Benditovich }
1718e22f0603SYuri Benditovich 
17194474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf,
172097cd965cSPaolo Bonzini                                   size_t size)
17216e790746SPaolo Bonzini {
17226e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
1723e22f0603SYuri Benditovich     unsigned int index = nc->queue_index, new_index = index;
17244474e37aSYuri Benditovich     struct NetRxPkt *pkt = n->rx_pkt;
17254474e37aSYuri Benditovich     uint8_t net_hash_type;
17264474e37aSYuri Benditovich     uint32_t hash;
17274474e37aSYuri Benditovich     bool isip4, isip6, isudp, istcp;
1728e22f0603SYuri Benditovich     static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = {
1729e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv4,
1730e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv4,
1731e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6,
1732e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6,
1733e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_IPv6_EX,
1734e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_TCPv6_EX,
1735e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv4,
1736e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6,
1737e22f0603SYuri Benditovich         VIRTIO_NET_HASH_REPORT_UDPv6_EX
1738e22f0603SYuri Benditovich     };
17394474e37aSYuri Benditovich 
17404474e37aSYuri Benditovich     net_rx_pkt_set_protocols(pkt, buf + n->host_hdr_len,
17414474e37aSYuri Benditovich                              size - n->host_hdr_len);
17424474e37aSYuri Benditovich     net_rx_pkt_get_protocols(pkt, &isip4, &isip6, &isudp, &istcp);
17434474e37aSYuri Benditovich     if (isip4 && (net_rx_pkt_get_ip4_info(pkt)->fragment)) {
17444474e37aSYuri Benditovich         istcp = isudp = false;
17454474e37aSYuri Benditovich     }
17464474e37aSYuri Benditovich     if (isip6 && (net_rx_pkt_get_ip6_info(pkt)->fragment)) {
17474474e37aSYuri Benditovich         istcp = isudp = false;
17484474e37aSYuri Benditovich     }
17494474e37aSYuri Benditovich     net_hash_type = virtio_net_get_hash_type(isip4, isip6, isudp, istcp,
17504474e37aSYuri Benditovich                                              n->rss_data.hash_types);
17514474e37aSYuri Benditovich     if (net_hash_type > NetPktRssIpV6UdpEx) {
1752e22f0603SYuri Benditovich         if (n->rss_data.populate_hash) {
1753e22f0603SYuri Benditovich             virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0);
1754e22f0603SYuri Benditovich         }
1755e22f0603SYuri Benditovich         return n->rss_data.redirect ? n->rss_data.default_queue : -1;
17564474e37aSYuri Benditovich     }
17574474e37aSYuri Benditovich 
17584474e37aSYuri Benditovich     hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key);
1759e22f0603SYuri Benditovich 
1760e22f0603SYuri Benditovich     if (n->rss_data.populate_hash) {
1761e22f0603SYuri Benditovich         virtio_set_packet_hash(buf, reports[net_hash_type], hash);
1762e22f0603SYuri Benditovich     }
1763e22f0603SYuri Benditovich 
1764e22f0603SYuri Benditovich     if (n->rss_data.redirect) {
17654474e37aSYuri Benditovich         new_index = hash & (n->rss_data.indirections_len - 1);
17664474e37aSYuri Benditovich         new_index = n->rss_data.indirections_table[new_index];
17674474e37aSYuri Benditovich     }
1768e22f0603SYuri Benditovich 
1769e22f0603SYuri Benditovich     return (index == new_index) ? -1 : new_index;
17704474e37aSYuri Benditovich }
17714474e37aSYuri Benditovich 
17724474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf,
17734474e37aSYuri Benditovich                                       size_t size, bool no_rss)
17744474e37aSYuri Benditovich {
17754474e37aSYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
17766e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
177717a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
1778bedd7e93SJason Wang     VirtQueueElement *elems[VIRTQUEUE_MAX_SIZE];
1779bedd7e93SJason Wang     size_t lens[VIRTQUEUE_MAX_SIZE];
17806e790746SPaolo Bonzini     struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
17816e790746SPaolo Bonzini     struct virtio_net_hdr_mrg_rxbuf mhdr;
17826e790746SPaolo Bonzini     unsigned mhdr_cnt = 0;
1783bedd7e93SJason Wang     size_t offset, i, guest_offset, j;
1784bedd7e93SJason Wang     ssize_t err;
17856e790746SPaolo Bonzini 
17866e790746SPaolo Bonzini     if (!virtio_net_can_receive(nc)) {
17876e790746SPaolo Bonzini         return -1;
17886e790746SPaolo Bonzini     }
17896e790746SPaolo Bonzini 
17900145c393SAndrew Melnychenko     if (!no_rss && n->rss_data.enabled && n->rss_data.enabled_software_rss) {
17914474e37aSYuri Benditovich         int index = virtio_net_process_rss(nc, buf, size);
17924474e37aSYuri Benditovich         if (index >= 0) {
17934474e37aSYuri Benditovich             NetClientState *nc2 = qemu_get_subqueue(n->nic, index);
17944474e37aSYuri Benditovich             return virtio_net_receive_rcu(nc2, buf, size, true);
17954474e37aSYuri Benditovich         }
17964474e37aSYuri Benditovich     }
17974474e37aSYuri Benditovich 
17986e790746SPaolo Bonzini     /* hdr_len refers to the header we supply to the guest */
17996e790746SPaolo Bonzini     if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
18006e790746SPaolo Bonzini         return 0;
18016e790746SPaolo Bonzini     }
18026e790746SPaolo Bonzini 
18036e790746SPaolo Bonzini     if (!receive_filter(n, buf, size))
18046e790746SPaolo Bonzini         return size;
18056e790746SPaolo Bonzini 
18066e790746SPaolo Bonzini     offset = i = 0;
18076e790746SPaolo Bonzini 
18086e790746SPaolo Bonzini     while (offset < size) {
180951b19ebeSPaolo Bonzini         VirtQueueElement *elem;
18106e790746SPaolo Bonzini         int len, total;
181151b19ebeSPaolo Bonzini         const struct iovec *sg;
18126e790746SPaolo Bonzini 
18136e790746SPaolo Bonzini         total = 0;
18146e790746SPaolo Bonzini 
1815bedd7e93SJason Wang         if (i == VIRTQUEUE_MAX_SIZE) {
1816bedd7e93SJason Wang             virtio_error(vdev, "virtio-net unexpected long buffer chain");
1817bedd7e93SJason Wang             err = size;
1818bedd7e93SJason Wang             goto err;
1819bedd7e93SJason Wang         }
1820bedd7e93SJason Wang 
182151b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement));
182251b19ebeSPaolo Bonzini         if (!elem) {
1823ba10b9c0SGreg Kurz             if (i) {
1824ba10b9c0SGreg Kurz                 virtio_error(vdev, "virtio-net unexpected empty queue: "
18256e790746SPaolo Bonzini                              "i %zd mergeable %d offset %zd, size %zd, "
1826019a3edbSGerd Hoffmann                              "guest hdr len %zd, host hdr len %zd "
1827019a3edbSGerd Hoffmann                              "guest features 0x%" PRIx64,
18286e790746SPaolo Bonzini                              i, n->mergeable_rx_bufs, offset, size,
1829019a3edbSGerd Hoffmann                              n->guest_hdr_len, n->host_hdr_len,
1830019a3edbSGerd Hoffmann                              vdev->guest_features);
1831ba10b9c0SGreg Kurz             }
1832bedd7e93SJason Wang             err = -1;
1833bedd7e93SJason Wang             goto err;
18346e790746SPaolo Bonzini         }
18356e790746SPaolo Bonzini 
183651b19ebeSPaolo Bonzini         if (elem->in_num < 1) {
1837ba10b9c0SGreg Kurz             virtio_error(vdev,
1838ba10b9c0SGreg Kurz                          "virtio-net receive queue contains no in buffers");
1839ba10b9c0SGreg Kurz             virtqueue_detach_element(q->rx_vq, elem, 0);
1840ba10b9c0SGreg Kurz             g_free(elem);
1841bedd7e93SJason Wang             err = -1;
1842bedd7e93SJason Wang             goto err;
18436e790746SPaolo Bonzini         }
18446e790746SPaolo Bonzini 
184551b19ebeSPaolo Bonzini         sg = elem->in_sg;
18466e790746SPaolo Bonzini         if (i == 0) {
18476e790746SPaolo Bonzini             assert(offset == 0);
18486e790746SPaolo Bonzini             if (n->mergeable_rx_bufs) {
18496e790746SPaolo Bonzini                 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
185051b19ebeSPaolo Bonzini                                     sg, elem->in_num,
18516e790746SPaolo Bonzini                                     offsetof(typeof(mhdr), num_buffers),
18526e790746SPaolo Bonzini                                     sizeof(mhdr.num_buffers));
18536e790746SPaolo Bonzini             }
18546e790746SPaolo Bonzini 
185551b19ebeSPaolo Bonzini             receive_header(n, sg, elem->in_num, buf, size);
1856e22f0603SYuri Benditovich             if (n->rss_data.populate_hash) {
1857e22f0603SYuri Benditovich                 offset = sizeof(mhdr);
1858e22f0603SYuri Benditovich                 iov_from_buf(sg, elem->in_num, offset,
1859e22f0603SYuri Benditovich                              buf + offset, n->host_hdr_len - sizeof(mhdr));
1860e22f0603SYuri Benditovich             }
18616e790746SPaolo Bonzini             offset = n->host_hdr_len;
18626e790746SPaolo Bonzini             total += n->guest_hdr_len;
18636e790746SPaolo Bonzini             guest_offset = n->guest_hdr_len;
18646e790746SPaolo Bonzini         } else {
18656e790746SPaolo Bonzini             guest_offset = 0;
18666e790746SPaolo Bonzini         }
18676e790746SPaolo Bonzini 
18686e790746SPaolo Bonzini         /* copy in packet.  ugh */
186951b19ebeSPaolo Bonzini         len = iov_from_buf(sg, elem->in_num, guest_offset,
18706e790746SPaolo Bonzini                            buf + offset, size - offset);
18716e790746SPaolo Bonzini         total += len;
18726e790746SPaolo Bonzini         offset += len;
18736e790746SPaolo Bonzini         /* If buffers can't be merged, at this point we
18746e790746SPaolo Bonzini          * must have consumed the complete packet.
18756e790746SPaolo Bonzini          * Otherwise, drop it. */
18766e790746SPaolo Bonzini         if (!n->mergeable_rx_bufs && offset < size) {
187727e57efeSLadi Prosek             virtqueue_unpop(q->rx_vq, elem, total);
187851b19ebeSPaolo Bonzini             g_free(elem);
1879bedd7e93SJason Wang             err = size;
1880bedd7e93SJason Wang             goto err;
18816e790746SPaolo Bonzini         }
18826e790746SPaolo Bonzini 
1883bedd7e93SJason Wang         elems[i] = elem;
1884bedd7e93SJason Wang         lens[i] = total;
1885bedd7e93SJason Wang         i++;
18866e790746SPaolo Bonzini     }
18876e790746SPaolo Bonzini 
18886e790746SPaolo Bonzini     if (mhdr_cnt) {
18891399c60dSRusty Russell         virtio_stw_p(vdev, &mhdr.num_buffers, i);
18906e790746SPaolo Bonzini         iov_from_buf(mhdr_sg, mhdr_cnt,
18916e790746SPaolo Bonzini                      0,
18926e790746SPaolo Bonzini                      &mhdr.num_buffers, sizeof mhdr.num_buffers);
18936e790746SPaolo Bonzini     }
18946e790746SPaolo Bonzini 
1895bedd7e93SJason Wang     for (j = 0; j < i; j++) {
1896bedd7e93SJason Wang         /* signal other side */
1897bedd7e93SJason Wang         virtqueue_fill(q->rx_vq, elems[j], lens[j], j);
1898bedd7e93SJason Wang         g_free(elems[j]);
1899bedd7e93SJason Wang     }
1900bedd7e93SJason Wang 
19016e790746SPaolo Bonzini     virtqueue_flush(q->rx_vq, i);
190217a0ca55SKONRAD Frederic     virtio_notify(vdev, q->rx_vq);
19036e790746SPaolo Bonzini 
19046e790746SPaolo Bonzini     return size;
1905bedd7e93SJason Wang 
1906bedd7e93SJason Wang err:
1907bedd7e93SJason Wang     for (j = 0; j < i; j++) {
1908abe300d9SJason Wang         virtqueue_detach_element(q->rx_vq, elems[j], lens[j]);
1909bedd7e93SJason Wang         g_free(elems[j]);
1910bedd7e93SJason Wang     }
1911bedd7e93SJason Wang 
1912bedd7e93SJason Wang     return err;
19136e790746SPaolo Bonzini }
19146e790746SPaolo Bonzini 
19152974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf,
191697cd965cSPaolo Bonzini                                   size_t size)
191797cd965cSPaolo Bonzini {
1918068ddfa9SDr. David Alan Gilbert     RCU_READ_LOCK_GUARD();
191997cd965cSPaolo Bonzini 
19204474e37aSYuri Benditovich     return virtio_net_receive_rcu(nc, buf, size, false);
192197cd965cSPaolo Bonzini }
192297cd965cSPaolo Bonzini 
19232974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain,
19242974e916SYuri Benditovich                                          const uint8_t *buf,
19252974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
19262974e916SYuri Benditovich {
19272974e916SYuri Benditovich     uint16_t ip_hdrlen;
19282974e916SYuri Benditovich     struct ip_header *ip;
19292974e916SYuri Benditovich 
19302974e916SYuri Benditovich     ip = (struct ip_header *)(buf + chain->n->guest_hdr_len
19312974e916SYuri Benditovich                               + sizeof(struct eth_header));
19322974e916SYuri Benditovich     unit->ip = (void *)ip;
19332974e916SYuri Benditovich     ip_hdrlen = (ip->ip_ver_len & 0xF) << 2;
19342974e916SYuri Benditovich     unit->ip_plen = &ip->ip_len;
19352974e916SYuri Benditovich     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen);
19362974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
19372974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen;
19382974e916SYuri Benditovich }
19392974e916SYuri Benditovich 
19402974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain,
19412974e916SYuri Benditovich                                          const uint8_t *buf,
19422974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
19432974e916SYuri Benditovich {
19442974e916SYuri Benditovich     struct ip6_header *ip6;
19452974e916SYuri Benditovich 
19462974e916SYuri Benditovich     ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len
19472974e916SYuri Benditovich                                  + sizeof(struct eth_header));
19482974e916SYuri Benditovich     unit->ip = ip6;
19492974e916SYuri Benditovich     unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
195078ee6bd0SPhilippe Mathieu-Daudé     unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip)
19512974e916SYuri Benditovich                                         + sizeof(struct ip6_header));
19522974e916SYuri Benditovich     unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10;
19532974e916SYuri Benditovich 
19542974e916SYuri Benditovich     /* There is a difference between payload lenght in ipv4 and v6,
19552974e916SYuri Benditovich        ip header is excluded in ipv6 */
19562974e916SYuri Benditovich     unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen;
19572974e916SYuri Benditovich }
19582974e916SYuri Benditovich 
19592974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain,
19602974e916SYuri Benditovich                                        VirtioNetRscSeg *seg)
19612974e916SYuri Benditovich {
19622974e916SYuri Benditovich     int ret;
1963dd3d85e8SYuri Benditovich     struct virtio_net_hdr_v1 *h;
19642974e916SYuri Benditovich 
1965dd3d85e8SYuri Benditovich     h = (struct virtio_net_hdr_v1 *)seg->buf;
19662974e916SYuri Benditovich     h->flags = 0;
19672974e916SYuri Benditovich     h->gso_type = VIRTIO_NET_HDR_GSO_NONE;
19682974e916SYuri Benditovich 
19692974e916SYuri Benditovich     if (seg->is_coalesced) {
1970dd3d85e8SYuri Benditovich         h->rsc.segments = seg->packets;
1971dd3d85e8SYuri Benditovich         h->rsc.dup_acks = seg->dup_ack;
19722974e916SYuri Benditovich         h->flags = VIRTIO_NET_HDR_F_RSC_INFO;
19732974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
19742974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
19752974e916SYuri Benditovich         } else {
19762974e916SYuri Benditovich             h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
19772974e916SYuri Benditovich         }
19782974e916SYuri Benditovich     }
19792974e916SYuri Benditovich 
19802974e916SYuri Benditovich     ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size);
19812974e916SYuri Benditovich     QTAILQ_REMOVE(&chain->buffers, seg, next);
19822974e916SYuri Benditovich     g_free(seg->buf);
19832974e916SYuri Benditovich     g_free(seg);
19842974e916SYuri Benditovich 
19852974e916SYuri Benditovich     return ret;
19862974e916SYuri Benditovich }
19872974e916SYuri Benditovich 
19882974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq)
19892974e916SYuri Benditovich {
19902974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn;
19912974e916SYuri Benditovich     VirtioNetRscChain *chain = (VirtioNetRscChain *)opq;
19922974e916SYuri Benditovich 
19932974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) {
19942974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
19952974e916SYuri Benditovich             chain->stat.purge_failed++;
19962974e916SYuri Benditovich             continue;
19972974e916SYuri Benditovich         }
19982974e916SYuri Benditovich     }
19992974e916SYuri Benditovich 
20002974e916SYuri Benditovich     chain->stat.timer++;
20012974e916SYuri Benditovich     if (!QTAILQ_EMPTY(&chain->buffers)) {
20022974e916SYuri Benditovich         timer_mod(chain->drain_timer,
20032974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
20042974e916SYuri Benditovich     }
20052974e916SYuri Benditovich }
20062974e916SYuri Benditovich 
20072974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n)
20082974e916SYuri Benditovich {
20092974e916SYuri Benditovich     VirtioNetRscChain *chain, *rn_chain;
20102974e916SYuri Benditovich     VirtioNetRscSeg *seg, *rn_seg;
20112974e916SYuri Benditovich 
20122974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) {
20132974e916SYuri Benditovich         QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) {
20142974e916SYuri Benditovich             QTAILQ_REMOVE(&chain->buffers, seg, next);
20152974e916SYuri Benditovich             g_free(seg->buf);
20162974e916SYuri Benditovich             g_free(seg);
20172974e916SYuri Benditovich         }
20182974e916SYuri Benditovich 
20192974e916SYuri Benditovich         timer_free(chain->drain_timer);
20202974e916SYuri Benditovich         QTAILQ_REMOVE(&n->rsc_chains, chain, next);
20212974e916SYuri Benditovich         g_free(chain);
20222974e916SYuri Benditovich     }
20232974e916SYuri Benditovich }
20242974e916SYuri Benditovich 
20252974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain,
20262974e916SYuri Benditovich                                      NetClientState *nc,
20272974e916SYuri Benditovich                                      const uint8_t *buf, size_t size)
20282974e916SYuri Benditovich {
20292974e916SYuri Benditovich     uint16_t hdr_len;
20302974e916SYuri Benditovich     VirtioNetRscSeg *seg;
20312974e916SYuri Benditovich 
20322974e916SYuri Benditovich     hdr_len = chain->n->guest_hdr_len;
2033b21e2380SMarkus Armbruster     seg = g_new(VirtioNetRscSeg, 1);
20342974e916SYuri Benditovich     seg->buf = g_malloc(hdr_len + sizeof(struct eth_header)
20352974e916SYuri Benditovich         + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD);
20362974e916SYuri Benditovich     memcpy(seg->buf, buf, size);
20372974e916SYuri Benditovich     seg->size = size;
20382974e916SYuri Benditovich     seg->packets = 1;
20392974e916SYuri Benditovich     seg->dup_ack = 0;
20402974e916SYuri Benditovich     seg->is_coalesced = 0;
20412974e916SYuri Benditovich     seg->nc = nc;
20422974e916SYuri Benditovich 
20432974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&chain->buffers, seg, next);
20442974e916SYuri Benditovich     chain->stat.cache++;
20452974e916SYuri Benditovich 
20462974e916SYuri Benditovich     switch (chain->proto) {
20472974e916SYuri Benditovich     case ETH_P_IP:
20482974e916SYuri Benditovich         virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit);
20492974e916SYuri Benditovich         break;
20502974e916SYuri Benditovich     case ETH_P_IPV6:
20512974e916SYuri Benditovich         virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit);
20522974e916SYuri Benditovich         break;
20532974e916SYuri Benditovich     default:
20542974e916SYuri Benditovich         g_assert_not_reached();
20552974e916SYuri Benditovich     }
20562974e916SYuri Benditovich }
20572974e916SYuri Benditovich 
20582974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain,
20592974e916SYuri Benditovich                                          VirtioNetRscSeg *seg,
20602974e916SYuri Benditovich                                          const uint8_t *buf,
20612974e916SYuri Benditovich                                          struct tcp_header *n_tcp,
20622974e916SYuri Benditovich                                          struct tcp_header *o_tcp)
20632974e916SYuri Benditovich {
20642974e916SYuri Benditovich     uint32_t nack, oack;
20652974e916SYuri Benditovich     uint16_t nwin, owin;
20662974e916SYuri Benditovich 
20672974e916SYuri Benditovich     nack = htonl(n_tcp->th_ack);
20682974e916SYuri Benditovich     nwin = htons(n_tcp->th_win);
20692974e916SYuri Benditovich     oack = htonl(o_tcp->th_ack);
20702974e916SYuri Benditovich     owin = htons(o_tcp->th_win);
20712974e916SYuri Benditovich 
20722974e916SYuri Benditovich     if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) {
20732974e916SYuri Benditovich         chain->stat.ack_out_of_win++;
20742974e916SYuri Benditovich         return RSC_FINAL;
20752974e916SYuri Benditovich     } else if (nack == oack) {
20762974e916SYuri Benditovich         /* duplicated ack or window probe */
20772974e916SYuri Benditovich         if (nwin == owin) {
20782974e916SYuri Benditovich             /* duplicated ack, add dup ack count due to whql test up to 1 */
20792974e916SYuri Benditovich             chain->stat.dup_ack++;
20802974e916SYuri Benditovich             return RSC_FINAL;
20812974e916SYuri Benditovich         } else {
20822974e916SYuri Benditovich             /* Coalesce window update */
20832974e916SYuri Benditovich             o_tcp->th_win = n_tcp->th_win;
20842974e916SYuri Benditovich             chain->stat.win_update++;
20852974e916SYuri Benditovich             return RSC_COALESCE;
20862974e916SYuri Benditovich         }
20872974e916SYuri Benditovich     } else {
20882974e916SYuri Benditovich         /* pure ack, go to 'C', finalize*/
20892974e916SYuri Benditovich         chain->stat.pure_ack++;
20902974e916SYuri Benditovich         return RSC_FINAL;
20912974e916SYuri Benditovich     }
20922974e916SYuri Benditovich }
20932974e916SYuri Benditovich 
20942974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain,
20952974e916SYuri Benditovich                                             VirtioNetRscSeg *seg,
20962974e916SYuri Benditovich                                             const uint8_t *buf,
20972974e916SYuri Benditovich                                             VirtioNetRscUnit *n_unit)
20982974e916SYuri Benditovich {
20992974e916SYuri Benditovich     void *data;
21002974e916SYuri Benditovich     uint16_t o_ip_len;
21012974e916SYuri Benditovich     uint32_t nseq, oseq;
21022974e916SYuri Benditovich     VirtioNetRscUnit *o_unit;
21032974e916SYuri Benditovich 
21042974e916SYuri Benditovich     o_unit = &seg->unit;
21052974e916SYuri Benditovich     o_ip_len = htons(*o_unit->ip_plen);
21062974e916SYuri Benditovich     nseq = htonl(n_unit->tcp->th_seq);
21072974e916SYuri Benditovich     oseq = htonl(o_unit->tcp->th_seq);
21082974e916SYuri Benditovich 
21092974e916SYuri Benditovich     /* out of order or retransmitted. */
21102974e916SYuri Benditovich     if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) {
21112974e916SYuri Benditovich         chain->stat.data_out_of_win++;
21122974e916SYuri Benditovich         return RSC_FINAL;
21132974e916SYuri Benditovich     }
21142974e916SYuri Benditovich 
21152974e916SYuri Benditovich     data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen;
21162974e916SYuri Benditovich     if (nseq == oseq) {
21172974e916SYuri Benditovich         if ((o_unit->payload == 0) && n_unit->payload) {
21182974e916SYuri Benditovich             /* From no payload to payload, normal case, not a dup ack or etc */
21192974e916SYuri Benditovich             chain->stat.data_after_pure_ack++;
21202974e916SYuri Benditovich             goto coalesce;
21212974e916SYuri Benditovich         } else {
21222974e916SYuri Benditovich             return virtio_net_rsc_handle_ack(chain, seg, buf,
21232974e916SYuri Benditovich                                              n_unit->tcp, o_unit->tcp);
21242974e916SYuri Benditovich         }
21252974e916SYuri Benditovich     } else if ((nseq - oseq) != o_unit->payload) {
21262974e916SYuri Benditovich         /* Not a consistent packet, out of order */
21272974e916SYuri Benditovich         chain->stat.data_out_of_order++;
21282974e916SYuri Benditovich         return RSC_FINAL;
21292974e916SYuri Benditovich     } else {
21302974e916SYuri Benditovich coalesce:
21312974e916SYuri Benditovich         if ((o_ip_len + n_unit->payload) > chain->max_payload) {
21322974e916SYuri Benditovich             chain->stat.over_size++;
21332974e916SYuri Benditovich             return RSC_FINAL;
21342974e916SYuri Benditovich         }
21352974e916SYuri Benditovich 
21362974e916SYuri Benditovich         /* Here comes the right data, the payload length in v4/v6 is different,
21372974e916SYuri Benditovich            so use the field value to update and record the new data len */
21382974e916SYuri Benditovich         o_unit->payload += n_unit->payload; /* update new data len */
21392974e916SYuri Benditovich 
21402974e916SYuri Benditovich         /* update field in ip header */
21412974e916SYuri Benditovich         *o_unit->ip_plen = htons(o_ip_len + n_unit->payload);
21422974e916SYuri Benditovich 
21432974e916SYuri Benditovich         /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced
21442974e916SYuri Benditovich            for windows guest, while this may change the behavior for linux
21452974e916SYuri Benditovich            guest (only if it uses RSC feature). */
21462974e916SYuri Benditovich         o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags;
21472974e916SYuri Benditovich 
21482974e916SYuri Benditovich         o_unit->tcp->th_ack = n_unit->tcp->th_ack;
21492974e916SYuri Benditovich         o_unit->tcp->th_win = n_unit->tcp->th_win;
21502974e916SYuri Benditovich 
21512974e916SYuri Benditovich         memmove(seg->buf + seg->size, data, n_unit->payload);
21522974e916SYuri Benditovich         seg->size += n_unit->payload;
21532974e916SYuri Benditovich         seg->packets++;
21542974e916SYuri Benditovich         chain->stat.coalesced++;
21552974e916SYuri Benditovich         return RSC_COALESCE;
21562974e916SYuri Benditovich     }
21572974e916SYuri Benditovich }
21582974e916SYuri Benditovich 
21592974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain,
21602974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
21612974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
21622974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
21632974e916SYuri Benditovich {
21642974e916SYuri Benditovich     struct ip_header *ip1, *ip2;
21652974e916SYuri Benditovich 
21662974e916SYuri Benditovich     ip1 = (struct ip_header *)(unit->ip);
21672974e916SYuri Benditovich     ip2 = (struct ip_header *)(seg->unit.ip);
21682974e916SYuri Benditovich     if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst)
21692974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
21702974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
21712974e916SYuri Benditovich         chain->stat.no_match++;
21722974e916SYuri Benditovich         return RSC_NO_MATCH;
21732974e916SYuri Benditovich     }
21742974e916SYuri Benditovich 
21752974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
21762974e916SYuri Benditovich }
21772974e916SYuri Benditovich 
21782974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain,
21792974e916SYuri Benditovich                                         VirtioNetRscSeg *seg,
21802974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
21812974e916SYuri Benditovich                                         VirtioNetRscUnit *unit)
21822974e916SYuri Benditovich {
21832974e916SYuri Benditovich     struct ip6_header *ip1, *ip2;
21842974e916SYuri Benditovich 
21852974e916SYuri Benditovich     ip1 = (struct ip6_header *)(unit->ip);
21862974e916SYuri Benditovich     ip2 = (struct ip6_header *)(seg->unit.ip);
21872974e916SYuri Benditovich     if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address))
21882974e916SYuri Benditovich         || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address))
21892974e916SYuri Benditovich         || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport)
21902974e916SYuri Benditovich         || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) {
21912974e916SYuri Benditovich             chain->stat.no_match++;
21922974e916SYuri Benditovich             return RSC_NO_MATCH;
21932974e916SYuri Benditovich     }
21942974e916SYuri Benditovich 
21952974e916SYuri Benditovich     return virtio_net_rsc_coalesce_data(chain, seg, buf, unit);
21962974e916SYuri Benditovich }
21972974e916SYuri Benditovich 
21982974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain
21992974e916SYuri Benditovich  * to prevent out of order */
22002974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain,
22012974e916SYuri Benditovich                                          struct tcp_header *tcp)
22022974e916SYuri Benditovich {
22032974e916SYuri Benditovich     uint16_t tcp_hdr;
22042974e916SYuri Benditovich     uint16_t tcp_flag;
22052974e916SYuri Benditovich 
22062974e916SYuri Benditovich     tcp_flag = htons(tcp->th_offset_flags);
22072974e916SYuri Benditovich     tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10;
22082974e916SYuri Benditovich     tcp_flag &= VIRTIO_NET_TCP_FLAG;
22092974e916SYuri Benditovich     if (tcp_flag & TH_SYN) {
22102974e916SYuri Benditovich         chain->stat.tcp_syn++;
22112974e916SYuri Benditovich         return RSC_BYPASS;
22122974e916SYuri Benditovich     }
22132974e916SYuri Benditovich 
22142974e916SYuri Benditovich     if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) {
22152974e916SYuri Benditovich         chain->stat.tcp_ctrl_drain++;
22162974e916SYuri Benditovich         return RSC_FINAL;
22172974e916SYuri Benditovich     }
22182974e916SYuri Benditovich 
22192974e916SYuri Benditovich     if (tcp_hdr > sizeof(struct tcp_header)) {
22202974e916SYuri Benditovich         chain->stat.tcp_all_opt++;
22212974e916SYuri Benditovich         return RSC_FINAL;
22222974e916SYuri Benditovich     }
22232974e916SYuri Benditovich 
22242974e916SYuri Benditovich     return RSC_CANDIDATE;
22252974e916SYuri Benditovich }
22262974e916SYuri Benditovich 
22272974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain,
22282974e916SYuri Benditovich                                          NetClientState *nc,
22292974e916SYuri Benditovich                                          const uint8_t *buf, size_t size,
22302974e916SYuri Benditovich                                          VirtioNetRscUnit *unit)
22312974e916SYuri Benditovich {
22322974e916SYuri Benditovich     int ret;
22332974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
22342974e916SYuri Benditovich 
22352974e916SYuri Benditovich     if (QTAILQ_EMPTY(&chain->buffers)) {
22362974e916SYuri Benditovich         chain->stat.empty_cache++;
22372974e916SYuri Benditovich         virtio_net_rsc_cache_buf(chain, nc, buf, size);
22382974e916SYuri Benditovich         timer_mod(chain->drain_timer,
22392974e916SYuri Benditovich               qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout);
22402974e916SYuri Benditovich         return size;
22412974e916SYuri Benditovich     }
22422974e916SYuri Benditovich 
22432974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
22442974e916SYuri Benditovich         if (chain->proto == ETH_P_IP) {
22452974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit);
22462974e916SYuri Benditovich         } else {
22472974e916SYuri Benditovich             ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit);
22482974e916SYuri Benditovich         }
22492974e916SYuri Benditovich 
22502974e916SYuri Benditovich         if (ret == RSC_FINAL) {
22512974e916SYuri Benditovich             if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
22522974e916SYuri Benditovich                 /* Send failed */
22532974e916SYuri Benditovich                 chain->stat.final_failed++;
22542974e916SYuri Benditovich                 return 0;
22552974e916SYuri Benditovich             }
22562974e916SYuri Benditovich 
22572974e916SYuri Benditovich             /* Send current packet */
22582974e916SYuri Benditovich             return virtio_net_do_receive(nc, buf, size);
22592974e916SYuri Benditovich         } else if (ret == RSC_NO_MATCH) {
22602974e916SYuri Benditovich             continue;
22612974e916SYuri Benditovich         } else {
22622974e916SYuri Benditovich             /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */
22632974e916SYuri Benditovich             seg->is_coalesced = 1;
22642974e916SYuri Benditovich             return size;
22652974e916SYuri Benditovich         }
22662974e916SYuri Benditovich     }
22672974e916SYuri Benditovich 
22682974e916SYuri Benditovich     chain->stat.no_match_cache++;
22692974e916SYuri Benditovich     virtio_net_rsc_cache_buf(chain, nc, buf, size);
22702974e916SYuri Benditovich     return size;
22712974e916SYuri Benditovich }
22722974e916SYuri Benditovich 
22732974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */
22742974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain,
22752974e916SYuri Benditovich                                         NetClientState *nc,
22762974e916SYuri Benditovich                                         const uint8_t *buf, size_t size,
22772974e916SYuri Benditovich                                         uint16_t ip_start, uint16_t ip_size,
22782974e916SYuri Benditovich                                         uint16_t tcp_port)
22792974e916SYuri Benditovich {
22802974e916SYuri Benditovich     VirtioNetRscSeg *seg, *nseg;
22812974e916SYuri Benditovich     uint32_t ppair1, ppair2;
22822974e916SYuri Benditovich 
22832974e916SYuri Benditovich     ppair1 = *(uint32_t *)(buf + tcp_port);
22842974e916SYuri Benditovich     QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) {
22852974e916SYuri Benditovich         ppair2 = *(uint32_t *)(seg->buf + tcp_port);
22862974e916SYuri Benditovich         if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size)
22872974e916SYuri Benditovich             || (ppair1 != ppair2)) {
22882974e916SYuri Benditovich             continue;
22892974e916SYuri Benditovich         }
22902974e916SYuri Benditovich         if (virtio_net_rsc_drain_seg(chain, seg) == 0) {
22912974e916SYuri Benditovich             chain->stat.drain_failed++;
22922974e916SYuri Benditovich         }
22932974e916SYuri Benditovich 
22942974e916SYuri Benditovich         break;
22952974e916SYuri Benditovich     }
22962974e916SYuri Benditovich 
22972974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
22982974e916SYuri Benditovich }
22992974e916SYuri Benditovich 
23002974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain,
23012974e916SYuri Benditovich                                             struct ip_header *ip,
23022974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
23032974e916SYuri Benditovich {
23042974e916SYuri Benditovich     uint16_t ip_len;
23052974e916SYuri Benditovich 
23062974e916SYuri Benditovich     /* Not an ipv4 packet */
23072974e916SYuri Benditovich     if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) {
23082974e916SYuri Benditovich         chain->stat.ip_option++;
23092974e916SYuri Benditovich         return RSC_BYPASS;
23102974e916SYuri Benditovich     }
23112974e916SYuri Benditovich 
23122974e916SYuri Benditovich     /* Don't handle packets with ip option */
23132974e916SYuri Benditovich     if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) {
23142974e916SYuri Benditovich         chain->stat.ip_option++;
23152974e916SYuri Benditovich         return RSC_BYPASS;
23162974e916SYuri Benditovich     }
23172974e916SYuri Benditovich 
23182974e916SYuri Benditovich     if (ip->ip_p != IPPROTO_TCP) {
23192974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
23202974e916SYuri Benditovich         return RSC_BYPASS;
23212974e916SYuri Benditovich     }
23222974e916SYuri Benditovich 
23232974e916SYuri Benditovich     /* Don't handle packets with ip fragment */
23242974e916SYuri Benditovich     if (!(htons(ip->ip_off) & IP_DF)) {
23252974e916SYuri Benditovich         chain->stat.ip_frag++;
23262974e916SYuri Benditovich         return RSC_BYPASS;
23272974e916SYuri Benditovich     }
23282974e916SYuri Benditovich 
23292974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
23302974e916SYuri Benditovich     if (IPTOS_ECN(ip->ip_tos)) {
23312974e916SYuri Benditovich         chain->stat.ip_ecn++;
23322974e916SYuri Benditovich         return RSC_BYPASS;
23332974e916SYuri Benditovich     }
23342974e916SYuri Benditovich 
23352974e916SYuri Benditovich     ip_len = htons(ip->ip_len);
23362974e916SYuri Benditovich     if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header))
23372974e916SYuri Benditovich         || ip_len > (size - chain->n->guest_hdr_len -
23382974e916SYuri Benditovich                      sizeof(struct eth_header))) {
23392974e916SYuri Benditovich         chain->stat.ip_hacked++;
23402974e916SYuri Benditovich         return RSC_BYPASS;
23412974e916SYuri Benditovich     }
23422974e916SYuri Benditovich 
23432974e916SYuri Benditovich     return RSC_CANDIDATE;
23442974e916SYuri Benditovich }
23452974e916SYuri Benditovich 
23462974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain,
23472974e916SYuri Benditovich                                       NetClientState *nc,
23482974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
23492974e916SYuri Benditovich {
23502974e916SYuri Benditovich     int32_t ret;
23512974e916SYuri Benditovich     uint16_t hdr_len;
23522974e916SYuri Benditovich     VirtioNetRscUnit unit;
23532974e916SYuri Benditovich 
23542974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
23552974e916SYuri Benditovich 
23562974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)
23572974e916SYuri Benditovich         + sizeof(struct tcp_header))) {
23582974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
23592974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23602974e916SYuri Benditovich     }
23612974e916SYuri Benditovich 
23622974e916SYuri Benditovich     virtio_net_rsc_extract_unit4(chain, buf, &unit);
23632974e916SYuri Benditovich     if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size)
23642974e916SYuri Benditovich         != RSC_CANDIDATE) {
23652974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23662974e916SYuri Benditovich     }
23672974e916SYuri Benditovich 
23682974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
23692974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
23702974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
23712974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
23722974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
23732974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 12),
23742974e916SYuri Benditovich                 VIRTIO_NET_IP4_ADDR_SIZE,
23752974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header));
23762974e916SYuri Benditovich     }
23772974e916SYuri Benditovich 
23782974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
23792974e916SYuri Benditovich }
23802974e916SYuri Benditovich 
23812974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain,
23822974e916SYuri Benditovich                                             struct ip6_header *ip6,
23832974e916SYuri Benditovich                                             const uint8_t *buf, size_t size)
23842974e916SYuri Benditovich {
23852974e916SYuri Benditovich     uint16_t ip_len;
23862974e916SYuri Benditovich 
23872974e916SYuri Benditovich     if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4)
23882974e916SYuri Benditovich         != IP_HEADER_VERSION_6) {
23892974e916SYuri Benditovich         return RSC_BYPASS;
23902974e916SYuri Benditovich     }
23912974e916SYuri Benditovich 
23922974e916SYuri Benditovich     /* Both option and protocol is checked in this */
23932974e916SYuri Benditovich     if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) {
23942974e916SYuri Benditovich         chain->stat.bypass_not_tcp++;
23952974e916SYuri Benditovich         return RSC_BYPASS;
23962974e916SYuri Benditovich     }
23972974e916SYuri Benditovich 
23982974e916SYuri Benditovich     ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen);
23992974e916SYuri Benditovich     if (ip_len < sizeof(struct tcp_header) ||
24002974e916SYuri Benditovich         ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header)
24012974e916SYuri Benditovich                   - sizeof(struct ip6_header))) {
24022974e916SYuri Benditovich         chain->stat.ip_hacked++;
24032974e916SYuri Benditovich         return RSC_BYPASS;
24042974e916SYuri Benditovich     }
24052974e916SYuri Benditovich 
24062974e916SYuri Benditovich     /* Don't handle packets with ecn flag */
24072974e916SYuri Benditovich     if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) {
24082974e916SYuri Benditovich         chain->stat.ip_ecn++;
24092974e916SYuri Benditovich         return RSC_BYPASS;
24102974e916SYuri Benditovich     }
24112974e916SYuri Benditovich 
24122974e916SYuri Benditovich     return RSC_CANDIDATE;
24132974e916SYuri Benditovich }
24142974e916SYuri Benditovich 
24152974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc,
24162974e916SYuri Benditovich                                       const uint8_t *buf, size_t size)
24172974e916SYuri Benditovich {
24182974e916SYuri Benditovich     int32_t ret;
24192974e916SYuri Benditovich     uint16_t hdr_len;
24202974e916SYuri Benditovich     VirtioNetRscChain *chain;
24212974e916SYuri Benditovich     VirtioNetRscUnit unit;
24222974e916SYuri Benditovich 
24232974e916SYuri Benditovich     chain = (VirtioNetRscChain *)opq;
24242974e916SYuri Benditovich     hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len;
24252974e916SYuri Benditovich 
24262974e916SYuri Benditovich     if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header)
24272974e916SYuri Benditovich         + sizeof(tcp_header))) {
24282974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24292974e916SYuri Benditovich     }
24302974e916SYuri Benditovich 
24312974e916SYuri Benditovich     virtio_net_rsc_extract_unit6(chain, buf, &unit);
24322974e916SYuri Benditovich     if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain,
24332974e916SYuri Benditovich                                                  unit.ip, buf, size)) {
24342974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24352974e916SYuri Benditovich     }
24362974e916SYuri Benditovich 
24372974e916SYuri Benditovich     ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp);
24382974e916SYuri Benditovich     if (ret == RSC_BYPASS) {
24392974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24402974e916SYuri Benditovich     } else if (ret == RSC_FINAL) {
24412974e916SYuri Benditovich         return virtio_net_rsc_drain_flow(chain, nc, buf, size,
24422974e916SYuri Benditovich                 ((hdr_len + sizeof(struct eth_header)) + 8),
24432974e916SYuri Benditovich                 VIRTIO_NET_IP6_ADDR_SIZE,
24442974e916SYuri Benditovich                 hdr_len + sizeof(struct eth_header)
24452974e916SYuri Benditovich                 + sizeof(struct ip6_header));
24462974e916SYuri Benditovich     }
24472974e916SYuri Benditovich 
24482974e916SYuri Benditovich     return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit);
24492974e916SYuri Benditovich }
24502974e916SYuri Benditovich 
24512974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n,
24522974e916SYuri Benditovich                                                       NetClientState *nc,
24532974e916SYuri Benditovich                                                       uint16_t proto)
24542974e916SYuri Benditovich {
24552974e916SYuri Benditovich     VirtioNetRscChain *chain;
24562974e916SYuri Benditovich 
24572974e916SYuri Benditovich     if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) {
24582974e916SYuri Benditovich         return NULL;
24592974e916SYuri Benditovich     }
24602974e916SYuri Benditovich 
24612974e916SYuri Benditovich     QTAILQ_FOREACH(chain, &n->rsc_chains, next) {
24622974e916SYuri Benditovich         if (chain->proto == proto) {
24632974e916SYuri Benditovich             return chain;
24642974e916SYuri Benditovich         }
24652974e916SYuri Benditovich     }
24662974e916SYuri Benditovich 
24672974e916SYuri Benditovich     chain = g_malloc(sizeof(*chain));
24682974e916SYuri Benditovich     chain->n = n;
24692974e916SYuri Benditovich     chain->proto = proto;
24702974e916SYuri Benditovich     if (proto == (uint16_t)ETH_P_IP) {
24712974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD;
24722974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
24732974e916SYuri Benditovich     } else {
24742974e916SYuri Benditovich         chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD;
24752974e916SYuri Benditovich         chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
24762974e916SYuri Benditovich     }
24772974e916SYuri Benditovich     chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST,
24782974e916SYuri Benditovich                                       virtio_net_rsc_purge, chain);
24792974e916SYuri Benditovich     memset(&chain->stat, 0, sizeof(chain->stat));
24802974e916SYuri Benditovich 
24812974e916SYuri Benditovich     QTAILQ_INIT(&chain->buffers);
24822974e916SYuri Benditovich     QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next);
24832974e916SYuri Benditovich 
24842974e916SYuri Benditovich     return chain;
24852974e916SYuri Benditovich }
24862974e916SYuri Benditovich 
24872974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc,
24882974e916SYuri Benditovich                                       const uint8_t *buf,
24892974e916SYuri Benditovich                                       size_t size)
24902974e916SYuri Benditovich {
24912974e916SYuri Benditovich     uint16_t proto;
24922974e916SYuri Benditovich     VirtioNetRscChain *chain;
24932974e916SYuri Benditovich     struct eth_header *eth;
24942974e916SYuri Benditovich     VirtIONet *n;
24952974e916SYuri Benditovich 
24962974e916SYuri Benditovich     n = qemu_get_nic_opaque(nc);
24972974e916SYuri Benditovich     if (size < (n->host_hdr_len + sizeof(struct eth_header))) {
24982974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
24992974e916SYuri Benditovich     }
25002974e916SYuri Benditovich 
25012974e916SYuri Benditovich     eth = (struct eth_header *)(buf + n->guest_hdr_len);
25022974e916SYuri Benditovich     proto = htons(eth->h_proto);
25032974e916SYuri Benditovich 
25042974e916SYuri Benditovich     chain = virtio_net_rsc_lookup_chain(n, nc, proto);
25052974e916SYuri Benditovich     if (chain) {
25062974e916SYuri Benditovich         chain->stat.received++;
25072974e916SYuri Benditovich         if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) {
25082974e916SYuri Benditovich             return virtio_net_rsc_receive4(chain, nc, buf, size);
25092974e916SYuri Benditovich         } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) {
25102974e916SYuri Benditovich             return virtio_net_rsc_receive6(chain, nc, buf, size);
25112974e916SYuri Benditovich         }
25122974e916SYuri Benditovich     }
25132974e916SYuri Benditovich     return virtio_net_do_receive(nc, buf, size);
25142974e916SYuri Benditovich }
25152974e916SYuri Benditovich 
25162974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf,
25172974e916SYuri Benditovich                                   size_t size)
25182974e916SYuri Benditovich {
25192974e916SYuri Benditovich     VirtIONet *n = qemu_get_nic_opaque(nc);
25202974e916SYuri Benditovich     if ((n->rsc4_enabled || n->rsc6_enabled)) {
25212974e916SYuri Benditovich         return virtio_net_rsc_receive(nc, buf, size);
25222974e916SYuri Benditovich     } else {
25232974e916SYuri Benditovich         return virtio_net_do_receive(nc, buf, size);
25242974e916SYuri Benditovich     }
25252974e916SYuri Benditovich }
25262974e916SYuri Benditovich 
25276e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
25286e790746SPaolo Bonzini 
25296e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
25306e790746SPaolo Bonzini {
25316e790746SPaolo Bonzini     VirtIONet *n = qemu_get_nic_opaque(nc);
25326e790746SPaolo Bonzini     VirtIONetQueue *q = virtio_net_get_subqueue(nc);
253317a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2534df8d0708SLaurent Vivier     int ret;
25356e790746SPaolo Bonzini 
253651b19ebeSPaolo Bonzini     virtqueue_push(q->tx_vq, q->async_tx.elem, 0);
253717a0ca55SKONRAD Frederic     virtio_notify(vdev, q->tx_vq);
25386e790746SPaolo Bonzini 
253951b19ebeSPaolo Bonzini     g_free(q->async_tx.elem);
254051b19ebeSPaolo Bonzini     q->async_tx.elem = NULL;
25416e790746SPaolo Bonzini 
25426e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2543df8d0708SLaurent Vivier     ret = virtio_net_flush_tx(q);
25447550a822SLaurent Vivier     if (ret >= n->tx_burst) {
2545df8d0708SLaurent Vivier         /*
2546df8d0708SLaurent Vivier          * the flush has been stopped by tx_burst
2547df8d0708SLaurent Vivier          * we will not receive notification for the
2548df8d0708SLaurent Vivier          * remainining part, so re-schedule
2549df8d0708SLaurent Vivier          */
2550df8d0708SLaurent Vivier         virtio_queue_set_notification(q->tx_vq, 0);
25517550a822SLaurent Vivier         if (q->tx_bh) {
2552df8d0708SLaurent Vivier             qemu_bh_schedule(q->tx_bh);
25537550a822SLaurent Vivier         } else {
25547550a822SLaurent Vivier             timer_mod(q->tx_timer,
25557550a822SLaurent Vivier                       qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
25567550a822SLaurent Vivier         }
2557df8d0708SLaurent Vivier         q->tx_waiting = 1;
2558df8d0708SLaurent Vivier     }
25596e790746SPaolo Bonzini }
25606e790746SPaolo Bonzini 
25616e790746SPaolo Bonzini /* TX */
25626e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
25636e790746SPaolo Bonzini {
25646e790746SPaolo Bonzini     VirtIONet *n = q->n;
256517a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
256651b19ebeSPaolo Bonzini     VirtQueueElement *elem;
25676e790746SPaolo Bonzini     int32_t num_packets = 0;
25686e790746SPaolo Bonzini     int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
256917a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
25706e790746SPaolo Bonzini         return num_packets;
25716e790746SPaolo Bonzini     }
25726e790746SPaolo Bonzini 
257351b19ebeSPaolo Bonzini     if (q->async_tx.elem) {
25746e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
25756e790746SPaolo Bonzini         return num_packets;
25766e790746SPaolo Bonzini     }
25776e790746SPaolo Bonzini 
257851b19ebeSPaolo Bonzini     for (;;) {
2579bd89dd98SJason Wang         ssize_t ret;
258051b19ebeSPaolo Bonzini         unsigned int out_num;
258151b19ebeSPaolo Bonzini         struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg;
2582feb93f36SJason Wang         struct virtio_net_hdr_mrg_rxbuf mhdr;
25836e790746SPaolo Bonzini 
258451b19ebeSPaolo Bonzini         elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement));
258551b19ebeSPaolo Bonzini         if (!elem) {
258651b19ebeSPaolo Bonzini             break;
258751b19ebeSPaolo Bonzini         }
258851b19ebeSPaolo Bonzini 
258951b19ebeSPaolo Bonzini         out_num = elem->out_num;
259051b19ebeSPaolo Bonzini         out_sg = elem->out_sg;
25916e790746SPaolo Bonzini         if (out_num < 1) {
2592fa5e56c2SGreg Kurz             virtio_error(vdev, "virtio-net header not in first element");
2593fa5e56c2SGreg Kurz             virtqueue_detach_element(q->tx_vq, elem, 0);
2594fa5e56c2SGreg Kurz             g_free(elem);
2595fa5e56c2SGreg Kurz             return -EINVAL;
25966e790746SPaolo Bonzini         }
25976e790746SPaolo Bonzini 
2598032a74a1SCédric Le Goater         if (n->has_vnet_hdr) {
2599feb93f36SJason Wang             if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) <
2600feb93f36SJason Wang                 n->guest_hdr_len) {
2601fa5e56c2SGreg Kurz                 virtio_error(vdev, "virtio-net header incorrect");
2602fa5e56c2SGreg Kurz                 virtqueue_detach_element(q->tx_vq, elem, 0);
2603fa5e56c2SGreg Kurz                 g_free(elem);
2604fa5e56c2SGreg Kurz                 return -EINVAL;
2605032a74a1SCédric Le Goater             }
26061bfa316cSGreg Kurz             if (n->needs_vnet_hdr_swap) {
2607feb93f36SJason Wang                 virtio_net_hdr_swap(vdev, (void *) &mhdr);
2608feb93f36SJason Wang                 sg2[0].iov_base = &mhdr;
2609feb93f36SJason Wang                 sg2[0].iov_len = n->guest_hdr_len;
2610feb93f36SJason Wang                 out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1,
2611feb93f36SJason Wang                                    out_sg, out_num,
2612feb93f36SJason Wang                                    n->guest_hdr_len, -1);
2613feb93f36SJason Wang                 if (out_num == VIRTQUEUE_MAX_SIZE) {
2614feb93f36SJason Wang                     goto drop;
2615032a74a1SCédric Le Goater                 }
2616feb93f36SJason Wang                 out_num += 1;
2617feb93f36SJason Wang                 out_sg = sg2;
2618feb93f36SJason Wang             }
2619feb93f36SJason Wang         }
26206e790746SPaolo Bonzini         /*
26216e790746SPaolo Bonzini          * If host wants to see the guest header as is, we can
26226e790746SPaolo Bonzini          * pass it on unchanged. Otherwise, copy just the parts
26236e790746SPaolo Bonzini          * that host is interested in.
26246e790746SPaolo Bonzini          */
26256e790746SPaolo Bonzini         assert(n->host_hdr_len <= n->guest_hdr_len);
26266e790746SPaolo Bonzini         if (n->host_hdr_len != n->guest_hdr_len) {
26276e790746SPaolo Bonzini             unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
26286e790746SPaolo Bonzini                                        out_sg, out_num,
26296e790746SPaolo Bonzini                                        0, n->host_hdr_len);
26306e790746SPaolo Bonzini             sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
26316e790746SPaolo Bonzini                              out_sg, out_num,
26326e790746SPaolo Bonzini                              n->guest_hdr_len, -1);
26336e790746SPaolo Bonzini             out_num = sg_num;
26346e790746SPaolo Bonzini             out_sg = sg;
26356e790746SPaolo Bonzini         }
26366e790746SPaolo Bonzini 
26376e790746SPaolo Bonzini         ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
26386e790746SPaolo Bonzini                                       out_sg, out_num, virtio_net_tx_complete);
26396e790746SPaolo Bonzini         if (ret == 0) {
26406e790746SPaolo Bonzini             virtio_queue_set_notification(q->tx_vq, 0);
26416e790746SPaolo Bonzini             q->async_tx.elem = elem;
26426e790746SPaolo Bonzini             return -EBUSY;
26436e790746SPaolo Bonzini         }
26446e790746SPaolo Bonzini 
2645feb93f36SJason Wang drop:
264651b19ebeSPaolo Bonzini         virtqueue_push(q->tx_vq, elem, 0);
264717a0ca55SKONRAD Frederic         virtio_notify(vdev, q->tx_vq);
264851b19ebeSPaolo Bonzini         g_free(elem);
26496e790746SPaolo Bonzini 
26506e790746SPaolo Bonzini         if (++num_packets >= n->tx_burst) {
26516e790746SPaolo Bonzini             break;
26526e790746SPaolo Bonzini         }
26536e790746SPaolo Bonzini     }
26546e790746SPaolo Bonzini     return num_packets;
26556e790746SPaolo Bonzini }
26566e790746SPaolo Bonzini 
26577550a822SLaurent Vivier static void virtio_net_tx_timer(void *opaque);
26587550a822SLaurent Vivier 
26596e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
26606e790746SPaolo Bonzini {
266117a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
26626e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
26636e790746SPaolo Bonzini 
2664283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2665283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2666283e2c2aSYuri Benditovich         return;
2667283e2c2aSYuri Benditovich     }
2668283e2c2aSYuri Benditovich 
26696e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
267017a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
26716e790746SPaolo Bonzini         q->tx_waiting = 1;
26726e790746SPaolo Bonzini         return;
26736e790746SPaolo Bonzini     }
26746e790746SPaolo Bonzini 
26756e790746SPaolo Bonzini     if (q->tx_waiting) {
26767550a822SLaurent Vivier         /* We already have queued packets, immediately flush */
2677bc72ad67SAlex Bligh         timer_del(q->tx_timer);
26787550a822SLaurent Vivier         virtio_net_tx_timer(q);
26796e790746SPaolo Bonzini     } else {
26807550a822SLaurent Vivier         /* re-arm timer to flush it (and more) on next tick */
2681bc72ad67SAlex Bligh         timer_mod(q->tx_timer,
2682bc72ad67SAlex Bligh                   qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
26836e790746SPaolo Bonzini         q->tx_waiting = 1;
26846e790746SPaolo Bonzini         virtio_queue_set_notification(vq, 0);
26856e790746SPaolo Bonzini     }
26866e790746SPaolo Bonzini }
26876e790746SPaolo Bonzini 
26886e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
26896e790746SPaolo Bonzini {
269017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
26916e790746SPaolo Bonzini     VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
26926e790746SPaolo Bonzini 
2693283e2c2aSYuri Benditovich     if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) {
2694283e2c2aSYuri Benditovich         virtio_net_drop_tx_queue_data(vdev, vq);
2695283e2c2aSYuri Benditovich         return;
2696283e2c2aSYuri Benditovich     }
2697283e2c2aSYuri Benditovich 
26986e790746SPaolo Bonzini     if (unlikely(q->tx_waiting)) {
26996e790746SPaolo Bonzini         return;
27006e790746SPaolo Bonzini     }
27016e790746SPaolo Bonzini     q->tx_waiting = 1;
27026e790746SPaolo Bonzini     /* This happens when device was stopped but VCPU wasn't. */
270317a0ca55SKONRAD Frederic     if (!vdev->vm_running) {
27046e790746SPaolo Bonzini         return;
27056e790746SPaolo Bonzini     }
27066e790746SPaolo Bonzini     virtio_queue_set_notification(vq, 0);
27076e790746SPaolo Bonzini     qemu_bh_schedule(q->tx_bh);
27086e790746SPaolo Bonzini }
27096e790746SPaolo Bonzini 
27106e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque)
27116e790746SPaolo Bonzini {
27126e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
27136e790746SPaolo Bonzini     VirtIONet *n = q->n;
271417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
27157550a822SLaurent Vivier     int ret;
27167550a822SLaurent Vivier 
2717e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2718e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2719e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2720e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2721e8bcf842SMichael S. Tsirkin         return;
2722e8bcf842SMichael S. Tsirkin     }
27236e790746SPaolo Bonzini 
27246e790746SPaolo Bonzini     q->tx_waiting = 0;
27256e790746SPaolo Bonzini 
27266e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
272717a0ca55SKONRAD Frederic     if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
27286e790746SPaolo Bonzini         return;
272917a0ca55SKONRAD Frederic     }
27306e790746SPaolo Bonzini 
27317550a822SLaurent Vivier     ret = virtio_net_flush_tx(q);
27327550a822SLaurent Vivier     if (ret == -EBUSY || ret == -EINVAL) {
27337550a822SLaurent Vivier         return;
27347550a822SLaurent Vivier     }
27357550a822SLaurent Vivier     /*
27367550a822SLaurent Vivier      * If we flush a full burst of packets, assume there are
27377550a822SLaurent Vivier      * more coming and immediately rearm
27387550a822SLaurent Vivier      */
27397550a822SLaurent Vivier     if (ret >= n->tx_burst) {
27407550a822SLaurent Vivier         q->tx_waiting = 1;
27417550a822SLaurent Vivier         timer_mod(q->tx_timer,
27427550a822SLaurent Vivier                   qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
27437550a822SLaurent Vivier         return;
27447550a822SLaurent Vivier     }
27457550a822SLaurent Vivier     /*
27467550a822SLaurent Vivier      * If less than a full burst, re-enable notification and flush
27477550a822SLaurent Vivier      * anything that may have come in while we weren't looking.  If
27487550a822SLaurent Vivier      * we find something, assume the guest is still active and rearm
27497550a822SLaurent Vivier      */
27506e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
27517550a822SLaurent Vivier     ret = virtio_net_flush_tx(q);
27527550a822SLaurent Vivier     if (ret > 0) {
27537550a822SLaurent Vivier         virtio_queue_set_notification(q->tx_vq, 0);
27547550a822SLaurent Vivier         q->tx_waiting = 1;
27557550a822SLaurent Vivier         timer_mod(q->tx_timer,
27567550a822SLaurent Vivier                   qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
27577550a822SLaurent Vivier     }
27586e790746SPaolo Bonzini }
27596e790746SPaolo Bonzini 
27606e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque)
27616e790746SPaolo Bonzini {
27626e790746SPaolo Bonzini     VirtIONetQueue *q = opaque;
27636e790746SPaolo Bonzini     VirtIONet *n = q->n;
276417a0ca55SKONRAD Frederic     VirtIODevice *vdev = VIRTIO_DEVICE(n);
27656e790746SPaolo Bonzini     int32_t ret;
27666e790746SPaolo Bonzini 
2767e8bcf842SMichael S. Tsirkin     /* This happens when device was stopped but BH wasn't. */
2768e8bcf842SMichael S. Tsirkin     if (!vdev->vm_running) {
2769e8bcf842SMichael S. Tsirkin         /* Make sure tx waiting is set, so we'll run when restarted. */
2770e8bcf842SMichael S. Tsirkin         assert(q->tx_waiting);
2771e8bcf842SMichael S. Tsirkin         return;
2772e8bcf842SMichael S. Tsirkin     }
27736e790746SPaolo Bonzini 
27746e790746SPaolo Bonzini     q->tx_waiting = 0;
27756e790746SPaolo Bonzini 
27766e790746SPaolo Bonzini     /* Just in case the driver is not ready on more */
277717a0ca55SKONRAD Frederic     if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
27786e790746SPaolo Bonzini         return;
277917a0ca55SKONRAD Frederic     }
27806e790746SPaolo Bonzini 
27816e790746SPaolo Bonzini     ret = virtio_net_flush_tx(q);
2782fa5e56c2SGreg Kurz     if (ret == -EBUSY || ret == -EINVAL) {
2783fa5e56c2SGreg Kurz         return; /* Notification re-enable handled by tx_complete or device
2784fa5e56c2SGreg Kurz                  * broken */
27856e790746SPaolo Bonzini     }
27866e790746SPaolo Bonzini 
27876e790746SPaolo Bonzini     /* If we flush a full burst of packets, assume there are
27886e790746SPaolo Bonzini      * more coming and immediately reschedule */
27896e790746SPaolo Bonzini     if (ret >= n->tx_burst) {
27906e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
27916e790746SPaolo Bonzini         q->tx_waiting = 1;
27926e790746SPaolo Bonzini         return;
27936e790746SPaolo Bonzini     }
27946e790746SPaolo Bonzini 
27956e790746SPaolo Bonzini     /* If less than a full burst, re-enable notification and flush
27966e790746SPaolo Bonzini      * anything that may have come in while we weren't looking.  If
27976e790746SPaolo Bonzini      * we find something, assume the guest is still active and reschedule */
27986e790746SPaolo Bonzini     virtio_queue_set_notification(q->tx_vq, 1);
2799fa5e56c2SGreg Kurz     ret = virtio_net_flush_tx(q);
2800fa5e56c2SGreg Kurz     if (ret == -EINVAL) {
2801fa5e56c2SGreg Kurz         return;
2802fa5e56c2SGreg Kurz     } else if (ret > 0) {
28036e790746SPaolo Bonzini         virtio_queue_set_notification(q->tx_vq, 0);
28046e790746SPaolo Bonzini         qemu_bh_schedule(q->tx_bh);
28056e790746SPaolo Bonzini         q->tx_waiting = 1;
28066e790746SPaolo Bonzini     }
28076e790746SPaolo Bonzini }
28086e790746SPaolo Bonzini 
2809f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index)
2810f9d6dbf0SWen Congyang {
2811f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2812f9d6dbf0SWen Congyang 
28131c0fbfa3SMichael S. Tsirkin     n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size,
28141c0fbfa3SMichael S. Tsirkin                                            virtio_net_handle_rx);
28159b02e161SWei Wang 
2816f9d6dbf0SWen Congyang     if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
2817f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
28189b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
28199b02e161SWei Wang                              virtio_net_handle_tx_timer);
2820f9d6dbf0SWen Congyang         n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
2821f9d6dbf0SWen Congyang                                               virtio_net_tx_timer,
2822f9d6dbf0SWen Congyang                                               &n->vqs[index]);
2823f9d6dbf0SWen Congyang     } else {
2824f9d6dbf0SWen Congyang         n->vqs[index].tx_vq =
28259b02e161SWei Wang             virtio_add_queue(vdev, n->net_conf.tx_queue_size,
28269b02e161SWei Wang                              virtio_net_handle_tx_bh);
2827f9d6dbf0SWen Congyang         n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]);
2828f9d6dbf0SWen Congyang     }
2829f9d6dbf0SWen Congyang 
2830f9d6dbf0SWen Congyang     n->vqs[index].tx_waiting = 0;
2831f9d6dbf0SWen Congyang     n->vqs[index].n = n;
2832f9d6dbf0SWen Congyang }
2833f9d6dbf0SWen Congyang 
2834f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index)
2835f9d6dbf0SWen Congyang {
2836f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2837f9d6dbf0SWen Congyang     VirtIONetQueue *q = &n->vqs[index];
2838f9d6dbf0SWen Congyang     NetClientState *nc = qemu_get_subqueue(n->nic, index);
2839f9d6dbf0SWen Congyang 
2840f9d6dbf0SWen Congyang     qemu_purge_queued_packets(nc);
2841f9d6dbf0SWen Congyang 
2842f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2);
2843f9d6dbf0SWen Congyang     if (q->tx_timer) {
2844f9d6dbf0SWen Congyang         timer_free(q->tx_timer);
2845f989c30cSYunjian Wang         q->tx_timer = NULL;
2846f9d6dbf0SWen Congyang     } else {
2847f9d6dbf0SWen Congyang         qemu_bh_delete(q->tx_bh);
2848f989c30cSYunjian Wang         q->tx_bh = NULL;
2849f9d6dbf0SWen Congyang     }
2850f989c30cSYunjian Wang     q->tx_waiting = 0;
2851f9d6dbf0SWen Congyang     virtio_del_queue(vdev, index * 2 + 1);
2852f9d6dbf0SWen Congyang }
2853f9d6dbf0SWen Congyang 
2854441537f1SJason Wang static void virtio_net_change_num_queue_pairs(VirtIONet *n, int new_max_queue_pairs)
2855f9d6dbf0SWen Congyang {
2856f9d6dbf0SWen Congyang     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2857f9d6dbf0SWen Congyang     int old_num_queues = virtio_get_num_queues(vdev);
2858441537f1SJason Wang     int new_num_queues = new_max_queue_pairs * 2 + 1;
2859f9d6dbf0SWen Congyang     int i;
2860f9d6dbf0SWen Congyang 
2861f9d6dbf0SWen Congyang     assert(old_num_queues >= 3);
2862f9d6dbf0SWen Congyang     assert(old_num_queues % 2 == 1);
2863f9d6dbf0SWen Congyang 
2864f9d6dbf0SWen Congyang     if (old_num_queues == new_num_queues) {
2865f9d6dbf0SWen Congyang         return;
2866f9d6dbf0SWen Congyang     }
2867f9d6dbf0SWen Congyang 
2868f9d6dbf0SWen Congyang     /*
2869f9d6dbf0SWen Congyang      * We always need to remove and add ctrl vq if
2870f9d6dbf0SWen Congyang      * old_num_queues != new_num_queues. Remove ctrl_vq first,
287120f86a75SYuval Shaia      * and then we only enter one of the following two loops.
2872f9d6dbf0SWen Congyang      */
2873f9d6dbf0SWen Congyang     virtio_del_queue(vdev, old_num_queues - 1);
2874f9d6dbf0SWen Congyang 
2875f9d6dbf0SWen Congyang     for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) {
2876f9d6dbf0SWen Congyang         /* new_num_queues < old_num_queues */
2877f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i / 2);
2878f9d6dbf0SWen Congyang     }
2879f9d6dbf0SWen Congyang 
2880f9d6dbf0SWen Congyang     for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) {
2881f9d6dbf0SWen Congyang         /* new_num_queues > old_num_queues */
2882f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i / 2);
2883f9d6dbf0SWen Congyang     }
2884f9d6dbf0SWen Congyang 
2885f9d6dbf0SWen Congyang     /* add ctrl_vq last */
2886f9d6dbf0SWen Congyang     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
2887f9d6dbf0SWen Congyang }
2888f9d6dbf0SWen Congyang 
2889ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
28906e790746SPaolo Bonzini {
2891441537f1SJason Wang     int max = multiqueue ? n->max_queue_pairs : 1;
2892f9d6dbf0SWen Congyang 
28936e790746SPaolo Bonzini     n->multiqueue = multiqueue;
2894441537f1SJason Wang     virtio_net_change_num_queue_pairs(n, max);
28956e790746SPaolo Bonzini 
2896441537f1SJason Wang     virtio_net_set_queue_pairs(n);
28976e790746SPaolo Bonzini }
28986e790746SPaolo Bonzini 
2899982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id)
2900037dab2fSGreg Kurz {
2901982b78c5SDr. David Alan Gilbert     VirtIONet *n = opaque;
2902982b78c5SDr. David Alan Gilbert     VirtIODevice *vdev = VIRTIO_DEVICE(n);
2903037dab2fSGreg Kurz     int i, link_down;
2904037dab2fSGreg Kurz 
29059d8c6a25SDr. David Alan Gilbert     trace_virtio_net_post_load_device();
2906982b78c5SDr. David Alan Gilbert     virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs,
290795129d6fSCornelia Huck                                virtio_vdev_has_feature(vdev,
2908e22f0603SYuri Benditovich                                                        VIRTIO_F_VERSION_1),
2909e22f0603SYuri Benditovich                                virtio_vdev_has_feature(vdev,
2910e22f0603SYuri Benditovich                                                        VIRTIO_NET_F_HASH_REPORT));
29116e790746SPaolo Bonzini 
29126e790746SPaolo Bonzini     /* MAC_TABLE_ENTRIES may be different from the saved image */
2913982b78c5SDr. David Alan Gilbert     if (n->mac_table.in_use > MAC_TABLE_ENTRIES) {
29146e790746SPaolo Bonzini         n->mac_table.in_use = 0;
29156e790746SPaolo Bonzini     }
29166e790746SPaolo Bonzini 
2917982b78c5SDr. David Alan Gilbert     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
29186c666823SMichael S. Tsirkin         n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
29196c666823SMichael S. Tsirkin     }
29206c666823SMichael S. Tsirkin 
29217788c3f2SMikhail Sennikovsky     /*
29227788c3f2SMikhail Sennikovsky      * curr_guest_offloads will be later overwritten by the
29237788c3f2SMikhail Sennikovsky      * virtio_set_features_nocheck call done from the virtio_load.
29247788c3f2SMikhail Sennikovsky      * Here we make sure it is preserved and restored accordingly
29257788c3f2SMikhail Sennikovsky      * in the virtio_net_post_load_virtio callback.
29267788c3f2SMikhail Sennikovsky      */
29277788c3f2SMikhail Sennikovsky     n->saved_guest_offloads = n->curr_guest_offloads;
29286c666823SMichael S. Tsirkin 
2929441537f1SJason Wang     virtio_net_set_queue_pairs(n);
29306e790746SPaolo Bonzini 
29316e790746SPaolo Bonzini     /* Find the first multicast entry in the saved MAC filter */
29326e790746SPaolo Bonzini     for (i = 0; i < n->mac_table.in_use; i++) {
29336e790746SPaolo Bonzini         if (n->mac_table.macs[i * ETH_ALEN] & 1) {
29346e790746SPaolo Bonzini             break;
29356e790746SPaolo Bonzini         }
29366e790746SPaolo Bonzini     }
29376e790746SPaolo Bonzini     n->mac_table.first_multi = i;
29386e790746SPaolo Bonzini 
29396e790746SPaolo Bonzini     /* nc.link_down can't be migrated, so infer link_down according
29406e790746SPaolo Bonzini      * to link status bit in n->status */
29416e790746SPaolo Bonzini     link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
2942441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
29436e790746SPaolo Bonzini         qemu_get_subqueue(n->nic, i)->link_down = link_down;
29446e790746SPaolo Bonzini     }
29456e790746SPaolo Bonzini 
29466c666823SMichael S. Tsirkin     if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
29476c666823SMichael S. Tsirkin         virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
29489d8c6a25SDr. David Alan Gilbert         qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
29499d8c6a25SDr. David Alan Gilbert                                   QEMU_CLOCK_VIRTUAL,
29509d8c6a25SDr. David Alan Gilbert                                   virtio_net_announce_timer, n);
29519d8c6a25SDr. David Alan Gilbert         if (n->announce_timer.round) {
29529d8c6a25SDr. David Alan Gilbert             timer_mod(n->announce_timer.tm,
29539d8c6a25SDr. David Alan Gilbert                       qemu_clock_get_ms(n->announce_timer.type));
29549d8c6a25SDr. David Alan Gilbert         } else {
2955944458b6SDr. David Alan Gilbert             qemu_announce_timer_del(&n->announce_timer, false);
29569d8c6a25SDr. David Alan Gilbert         }
29576c666823SMichael S. Tsirkin     }
29586c666823SMichael S. Tsirkin 
2959e41b7114SYuri Benditovich     if (n->rss_data.enabled) {
29600145c393SAndrew Melnychenko         n->rss_data.enabled_software_rss = n->rss_data.populate_hash;
29610145c393SAndrew Melnychenko         if (!n->rss_data.populate_hash) {
29620145c393SAndrew Melnychenko             if (!virtio_net_attach_epbf_rss(n)) {
29630145c393SAndrew Melnychenko                 if (get_vhost_net(qemu_get_queue(n->nic)->peer)) {
29640145c393SAndrew Melnychenko                     warn_report("Can't post-load eBPF RSS for vhost");
29650145c393SAndrew Melnychenko                 } else {
29660145c393SAndrew Melnychenko                     warn_report("Can't post-load eBPF RSS - "
29670145c393SAndrew Melnychenko                                 "fallback to software RSS");
29680145c393SAndrew Melnychenko                     n->rss_data.enabled_software_rss = true;
29690145c393SAndrew Melnychenko                 }
29700145c393SAndrew Melnychenko             }
29710145c393SAndrew Melnychenko         }
29720145c393SAndrew Melnychenko 
2973e41b7114SYuri Benditovich         trace_virtio_net_rss_enable(n->rss_data.hash_types,
2974e41b7114SYuri Benditovich                                     n->rss_data.indirections_len,
2975e41b7114SYuri Benditovich                                     sizeof(n->rss_data.key));
2976e41b7114SYuri Benditovich     } else {
2977e41b7114SYuri Benditovich         trace_virtio_net_rss_disable();
2978e41b7114SYuri Benditovich     }
29796e790746SPaolo Bonzini     return 0;
29806e790746SPaolo Bonzini }
29816e790746SPaolo Bonzini 
29827788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev)
29837788c3f2SMikhail Sennikovsky {
29847788c3f2SMikhail Sennikovsky     VirtIONet *n = VIRTIO_NET(vdev);
29857788c3f2SMikhail Sennikovsky     /*
29867788c3f2SMikhail Sennikovsky      * The actual needed state is now in saved_guest_offloads,
29877788c3f2SMikhail Sennikovsky      * see virtio_net_post_load_device for detail.
29887788c3f2SMikhail Sennikovsky      * Restore it back and apply the desired offloads.
29897788c3f2SMikhail Sennikovsky      */
29907788c3f2SMikhail Sennikovsky     n->curr_guest_offloads = n->saved_guest_offloads;
29917788c3f2SMikhail Sennikovsky     if (peer_has_vnet_hdr(n)) {
29927788c3f2SMikhail Sennikovsky         virtio_net_apply_guest_offloads(n);
29937788c3f2SMikhail Sennikovsky     }
29947788c3f2SMikhail Sennikovsky 
29957788c3f2SMikhail Sennikovsky     return 0;
29967788c3f2SMikhail Sennikovsky }
29977788c3f2SMikhail Sennikovsky 
2998982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */
2999982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = {
3000982b78c5SDr. David Alan Gilbert     .name = "virtio-net-queue-tx_waiting",
3001982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
3002982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(tx_waiting, VirtIONetQueue),
3003982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3004982b78c5SDr. David Alan Gilbert    },
3005982b78c5SDr. David Alan Gilbert };
3006982b78c5SDr. David Alan Gilbert 
3007441537f1SJason Wang static bool max_queue_pairs_gt_1(void *opaque, int version_id)
3008982b78c5SDr. David Alan Gilbert {
3009441537f1SJason Wang     return VIRTIO_NET(opaque)->max_queue_pairs > 1;
3010982b78c5SDr. David Alan Gilbert }
3011982b78c5SDr. David Alan Gilbert 
3012982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id)
3013982b78c5SDr. David Alan Gilbert {
3014982b78c5SDr. David Alan Gilbert     return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque),
3015982b78c5SDr. David Alan Gilbert                                    VIRTIO_NET_F_CTRL_GUEST_OFFLOADS);
3016982b78c5SDr. David Alan Gilbert }
3017982b78c5SDr. David Alan Gilbert 
3018982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id)
3019982b78c5SDr. David Alan Gilbert {
3020982b78c5SDr. David Alan Gilbert     return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES;
3021982b78c5SDr. David Alan Gilbert }
3022982b78c5SDr. David Alan Gilbert 
/*
 * VMState field test: exact complement of mac_table_fits(), so that one
 * and only one of the two guarded MAC table fields is active.
 */
static bool mac_table_doesnt_fit(void *opaque, int version_id)
{
    bool fits = mac_table_fits(opaque, version_id);

    return !fits;
}
3027982b78c5SDr. David Alan Gilbert 
3028982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods
3029982b78c5SDr. David Alan Gilbert  * although only some fields are used by each.
3030982b78c5SDr. David Alan Gilbert  */
3031982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp {
3032982b78c5SDr. David Alan Gilbert     VirtIONet      *parent;
3033982b78c5SDr. David Alan Gilbert     VirtIONetQueue *vqs_1;
3034441537f1SJason Wang     uint16_t        curr_queue_pairs_1;
3035982b78c5SDr. David Alan Gilbert     uint8_t         has_ufo;
3036982b78c5SDr. David Alan Gilbert     uint32_t        has_vnet_hdr;
3037982b78c5SDr. David Alan Gilbert };
3038982b78c5SDr. David Alan Gilbert 
3039982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than
3040441537f1SJason Wang  * the 1st entry in the queue_pairs and only if there's more than one
3041982b78c5SDr. David Alan Gilbert  * entry.  We use the tmp mechanism to calculate a temporary
3042982b78c5SDr. David Alan Gilbert  * pointer and count and also validate the count.
3043982b78c5SDr. David Alan Gilbert  */
3044982b78c5SDr. David Alan Gilbert 
304544b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque)
3046982b78c5SDr. David Alan Gilbert {
3047982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3048982b78c5SDr. David Alan Gilbert 
3049982b78c5SDr. David Alan Gilbert     tmp->vqs_1 = tmp->parent->vqs + 1;
3050441537f1SJason Wang     tmp->curr_queue_pairs_1 = tmp->parent->curr_queue_pairs - 1;
3051441537f1SJason Wang     if (tmp->parent->curr_queue_pairs == 0) {
3052441537f1SJason Wang         tmp->curr_queue_pairs_1 = 0;
3053982b78c5SDr. David Alan Gilbert     }
305444b1ff31SDr. David Alan Gilbert 
305544b1ff31SDr. David Alan Gilbert     return 0;
3056982b78c5SDr. David Alan Gilbert }
3057982b78c5SDr. David Alan Gilbert 
3058982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque)
3059982b78c5SDr. David Alan Gilbert {
3060982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3061982b78c5SDr. David Alan Gilbert 
3062982b78c5SDr. David Alan Gilbert     /* Reuse the pointer setup from save */
3063982b78c5SDr. David Alan Gilbert     virtio_net_tx_waiting_pre_save(opaque);
3064982b78c5SDr. David Alan Gilbert 
3065441537f1SJason Wang     if (tmp->parent->curr_queue_pairs > tmp->parent->max_queue_pairs) {
3066441537f1SJason Wang         error_report("virtio-net: curr_queue_pairs %x > max_queue_pairs %x",
3067441537f1SJason Wang             tmp->parent->curr_queue_pairs, tmp->parent->max_queue_pairs);
3068982b78c5SDr. David Alan Gilbert 
3069982b78c5SDr. David Alan Gilbert         return -EINVAL;
3070982b78c5SDr. David Alan Gilbert     }
3071982b78c5SDr. David Alan Gilbert 
3072982b78c5SDr. David Alan Gilbert     return 0; /* all good */
3073982b78c5SDr. David Alan Gilbert }
3074982b78c5SDr. David Alan Gilbert 
3075982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = {
3076982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-tx_waiting",
3077982b78c5SDr. David Alan Gilbert     .pre_load  = virtio_net_tx_waiting_pre_load,
3078982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_tx_waiting_pre_save,
3079982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3080982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp,
3081441537f1SJason Wang                                      curr_queue_pairs_1,
3082982b78c5SDr. David Alan Gilbert                                      vmstate_virtio_net_queue_tx_waiting,
3083982b78c5SDr. David Alan Gilbert                                      struct VirtIONetQueue),
3084982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3085982b78c5SDr. David Alan Gilbert     },
3086982b78c5SDr. David Alan Gilbert };
3087982b78c5SDr. David Alan Gilbert 
3088982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the
3089982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
3090982b78c5SDr. David Alan Gilbert  */
3091982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id)
3092982b78c5SDr. David Alan Gilbert {
3093982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3094982b78c5SDr. David Alan Gilbert 
3095982b78c5SDr. David Alan Gilbert     if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) {
3096982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires TUN_F_UFO support");
3097982b78c5SDr. David Alan Gilbert         return -EINVAL;
3098982b78c5SDr. David Alan Gilbert     }
3099982b78c5SDr. David Alan Gilbert 
3100982b78c5SDr. David Alan Gilbert     return 0;
3101982b78c5SDr. David Alan Gilbert }
3102982b78c5SDr. David Alan Gilbert 
310344b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque)
3104982b78c5SDr. David Alan Gilbert {
3105982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3106982b78c5SDr. David Alan Gilbert 
3107982b78c5SDr. David Alan Gilbert     tmp->has_ufo = tmp->parent->has_ufo;
310844b1ff31SDr. David Alan Gilbert 
310944b1ff31SDr. David Alan Gilbert     return 0;
3110982b78c5SDr. David Alan Gilbert }
3111982b78c5SDr. David Alan Gilbert 
3112982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = {
3113982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-ufo",
3114982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_ufo_post_load,
3115982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_ufo_pre_save,
3116982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3117982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp),
3118982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3119982b78c5SDr. David Alan Gilbert     },
3120982b78c5SDr. David Alan Gilbert };
3121982b78c5SDr. David Alan Gilbert 
3122982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the
3123982b78c5SDr. David Alan Gilbert  * flag set we need to check that we have it
3124982b78c5SDr. David Alan Gilbert  */
3125982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id)
3126982b78c5SDr. David Alan Gilbert {
3127982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3128982b78c5SDr. David Alan Gilbert 
3129982b78c5SDr. David Alan Gilbert     if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) {
3130982b78c5SDr. David Alan Gilbert         error_report("virtio-net: saved image requires vnet_hdr=on");
3131982b78c5SDr. David Alan Gilbert         return -EINVAL;
3132982b78c5SDr. David Alan Gilbert     }
3133982b78c5SDr. David Alan Gilbert 
3134982b78c5SDr. David Alan Gilbert     return 0;
3135982b78c5SDr. David Alan Gilbert }
3136982b78c5SDr. David Alan Gilbert 
313744b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque)
3138982b78c5SDr. David Alan Gilbert {
3139982b78c5SDr. David Alan Gilbert     struct VirtIONetMigTmp *tmp = opaque;
3140982b78c5SDr. David Alan Gilbert 
3141982b78c5SDr. David Alan Gilbert     tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr;
314244b1ff31SDr. David Alan Gilbert 
314344b1ff31SDr. David Alan Gilbert     return 0;
3144982b78c5SDr. David Alan Gilbert }
3145982b78c5SDr. David Alan Gilbert 
3146982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = {
3147982b78c5SDr. David Alan Gilbert     .name      = "virtio-net-vnet",
3148982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_vnet_post_load,
3149982b78c5SDr. David Alan Gilbert     .pre_save  = virtio_net_vnet_pre_save,
3150982b78c5SDr. David Alan Gilbert     .fields    = (VMStateField[]) {
3151982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp),
3152982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3153982b78c5SDr. David Alan Gilbert     },
3154982b78c5SDr. David Alan Gilbert };
3155982b78c5SDr. David Alan Gilbert 
3156e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque)
3157e41b7114SYuri Benditovich {
3158e41b7114SYuri Benditovich     return VIRTIO_NET(opaque)->rss_data.enabled;
3159e41b7114SYuri Benditovich }
3160e41b7114SYuri Benditovich 
3161e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = {
3162e41b7114SYuri Benditovich     .name      = "virtio-net-device/rss",
3163e41b7114SYuri Benditovich     .version_id = 1,
3164e41b7114SYuri Benditovich     .minimum_version_id = 1,
3165e41b7114SYuri Benditovich     .needed = virtio_net_rss_needed,
3166e41b7114SYuri Benditovich     .fields = (VMStateField[]) {
3167e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.enabled, VirtIONet),
3168e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.redirect, VirtIONet),
3169e41b7114SYuri Benditovich         VMSTATE_BOOL(rss_data.populate_hash, VirtIONet),
3170e41b7114SYuri Benditovich         VMSTATE_UINT32(rss_data.hash_types, VirtIONet),
3171e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.indirections_len, VirtIONet),
3172e41b7114SYuri Benditovich         VMSTATE_UINT16(rss_data.default_queue, VirtIONet),
3173e41b7114SYuri Benditovich         VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet,
3174e41b7114SYuri Benditovich                             VIRTIO_NET_RSS_MAX_KEY_SIZE),
3175e41b7114SYuri Benditovich         VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet,
3176e41b7114SYuri Benditovich                                     rss_data.indirections_len, 0,
3177e41b7114SYuri Benditovich                                     vmstate_info_uint16, uint16_t),
3178e41b7114SYuri Benditovich         VMSTATE_END_OF_LIST()
3179e41b7114SYuri Benditovich     },
3180e41b7114SYuri Benditovich };
3181e41b7114SYuri Benditovich 
3182982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = {
3183982b78c5SDr. David Alan Gilbert     .name = "virtio-net-device",
3184982b78c5SDr. David Alan Gilbert     .version_id = VIRTIO_NET_VM_VERSION,
3185982b78c5SDr. David Alan Gilbert     .minimum_version_id = VIRTIO_NET_VM_VERSION,
3186982b78c5SDr. David Alan Gilbert     .post_load = virtio_net_post_load_device,
3187982b78c5SDr. David Alan Gilbert     .fields = (VMStateField[]) {
3188982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN),
3189982b78c5SDr. David Alan Gilbert         VMSTATE_STRUCT_POINTER(vqs, VirtIONet,
3190982b78c5SDr. David Alan Gilbert                                vmstate_virtio_net_queue_tx_waiting,
3191982b78c5SDr. David Alan Gilbert                                VirtIONetQueue),
3192982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet),
3193982b78c5SDr. David Alan Gilbert         VMSTATE_UINT16(status, VirtIONet),
3194982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(promisc, VirtIONet),
3195982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(allmulti, VirtIONet),
3196982b78c5SDr. David Alan Gilbert         VMSTATE_UINT32(mac_table.in_use, VirtIONet),
3197982b78c5SDr. David Alan Gilbert 
3198982b78c5SDr. David Alan Gilbert         /* Guarded pair: If it fits we load it, else we throw it away
3199982b78c5SDr. David Alan Gilbert          * - can happen if source has a larger MAC table.; post-load
3200982b78c5SDr. David Alan Gilbert          *  sets flags in this case.
3201982b78c5SDr. David Alan Gilbert          */
3202982b78c5SDr. David Alan Gilbert         VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet,
3203982b78c5SDr. David Alan Gilbert                                 0, mac_table_fits, mac_table.in_use,
3204982b78c5SDr. David Alan Gilbert                                  ETH_ALEN),
3205982b78c5SDr. David Alan Gilbert         VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0,
3206982b78c5SDr. David Alan Gilbert                                      mac_table.in_use, ETH_ALEN),
3207982b78c5SDr. David Alan Gilbert 
3208982b78c5SDr. David Alan Gilbert         /* Note: This is an array of uint32's that's always been saved as a
3209982b78c5SDr. David Alan Gilbert          * buffer; hold onto your endiannesses; it's actually used as a bitmap
3210982b78c5SDr. David Alan Gilbert          * but based on the uint.
3211982b78c5SDr. David Alan Gilbert          */
3212982b78c5SDr. David Alan Gilbert         VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3),
3213982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3214982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_vnet),
3215982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet),
3216982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet),
3217982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(alluni, VirtIONet),
3218982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nomulti, VirtIONet),
3219982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nouni, VirtIONet),
3220982b78c5SDr. David Alan Gilbert         VMSTATE_UINT8(nobcast, VirtIONet),
3221982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3222982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_has_ufo),
3223441537f1SJason Wang         VMSTATE_SINGLE_TEST(max_queue_pairs, VirtIONet, max_queue_pairs_gt_1, 0,
3224982b78c5SDr. David Alan Gilbert                             vmstate_info_uint16_equal, uint16_t),
3225441537f1SJason Wang         VMSTATE_UINT16_TEST(curr_queue_pairs, VirtIONet, max_queue_pairs_gt_1),
3226982b78c5SDr. David Alan Gilbert         VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp,
3227982b78c5SDr. David Alan Gilbert                          vmstate_virtio_net_tx_waiting),
3228982b78c5SDr. David Alan Gilbert         VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet,
3229982b78c5SDr. David Alan Gilbert                             has_ctrl_guest_offloads),
3230982b78c5SDr. David Alan Gilbert         VMSTATE_END_OF_LIST()
3231982b78c5SDr. David Alan Gilbert    },
3232e41b7114SYuri Benditovich     .subsections = (const VMStateDescription * []) {
3233e41b7114SYuri Benditovich         &vmstate_virtio_net_rss,
3234e41b7114SYuri Benditovich         NULL
3235e41b7114SYuri Benditovich     }
3236982b78c5SDr. David Alan Gilbert };
3237982b78c5SDr. David Alan Gilbert 
32386e790746SPaolo Bonzini static NetClientInfo net_virtio_info = {
3239f394b2e2SEric Blake     .type = NET_CLIENT_DRIVER_NIC,
32406e790746SPaolo Bonzini     .size = sizeof(NICState),
32416e790746SPaolo Bonzini     .can_receive = virtio_net_can_receive,
32426e790746SPaolo Bonzini     .receive = virtio_net_receive,
32436e790746SPaolo Bonzini     .link_status_changed = virtio_net_set_link_status,
3244b1be4280SAmos Kong     .query_rx_filter = virtio_net_query_rxfilter,
3245b2c929f0SDr. David Alan Gilbert     .announce = virtio_net_announce,
32466e790746SPaolo Bonzini };
32476e790746SPaolo Bonzini 
32486e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
32496e790746SPaolo Bonzini {
325017a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
325168b0a639SSi-Wei Liu     NetClientState *nc;
32526e790746SPaolo Bonzini     assert(n->vhost_started);
325368b0a639SSi-Wei Liu     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ) && idx == 2) {
325468b0a639SSi-Wei Liu         /* Must guard against invalid features and bogus queue index
325568b0a639SSi-Wei Liu          * from being set by malicious guest, or penetrated through
325668b0a639SSi-Wei Liu          * buggy migration stream.
325768b0a639SSi-Wei Liu          */
325868b0a639SSi-Wei Liu         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
325968b0a639SSi-Wei Liu             qemu_log_mask(LOG_GUEST_ERROR,
326068b0a639SSi-Wei Liu                           "%s: bogus vq index ignored\n", __func__);
326168b0a639SSi-Wei Liu             return false;
326268b0a639SSi-Wei Liu         }
326368b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, n->max_queue_pairs);
326468b0a639SSi-Wei Liu     } else {
326568b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, vq2q(idx));
326668b0a639SSi-Wei Liu     }
3267ed8b4afeSNikolay Nikolaev     return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx);
32686e790746SPaolo Bonzini }
32696e790746SPaolo Bonzini 
32706e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
32716e790746SPaolo Bonzini                                            bool mask)
32726e790746SPaolo Bonzini {
327317a0ca55SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(vdev);
327468b0a639SSi-Wei Liu     NetClientState *nc;
32756e790746SPaolo Bonzini     assert(n->vhost_started);
327668b0a639SSi-Wei Liu     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ) && idx == 2) {
327768b0a639SSi-Wei Liu         /* Must guard against invalid features and bogus queue index
327868b0a639SSi-Wei Liu          * from being set by malicious guest, or penetrated through
327968b0a639SSi-Wei Liu          * buggy migration stream.
328068b0a639SSi-Wei Liu          */
328168b0a639SSi-Wei Liu         if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
328268b0a639SSi-Wei Liu             qemu_log_mask(LOG_GUEST_ERROR,
328368b0a639SSi-Wei Liu                           "%s: bogus vq index ignored\n", __func__);
328468b0a639SSi-Wei Liu             return;
328568b0a639SSi-Wei Liu         }
328668b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, n->max_queue_pairs);
328768b0a639SSi-Wei Liu     } else {
328868b0a639SSi-Wei Liu         nc = qemu_get_subqueue(n->nic, vq2q(idx));
328968b0a639SSi-Wei Liu     }
3290a882b571SMichael S. Tsirkin     vhost_net_virtqueue_mask(get_vhost_net(nc->peer),
3291a882b571SMichael S. Tsirkin                              vdev, idx, mask);
32926e790746SPaolo Bonzini }
32936e790746SPaolo Bonzini 
3294019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features)
32956e790746SPaolo Bonzini {
32960cd09c3aSCornelia Huck     virtio_add_feature(&host_features, VIRTIO_NET_F_MAC);
3297a93e599dSMaxime Coquelin 
3298d74c30c8SDaniil Tatianin     n->config_size = virtio_get_config_size(&cfg_size_params, host_features);
329917ec5a86SKONRAD Frederic }
33006e790746SPaolo Bonzini 
33018a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
33028a253ec2SKONRAD Frederic                                    const char *type)
33038a253ec2SKONRAD Frederic {
33048a253ec2SKONRAD Frederic     /*
33058a253ec2SKONRAD Frederic      * The name can be NULL, the netclient name will be type.x.
33068a253ec2SKONRAD Frederic      */
33078a253ec2SKONRAD Frederic     assert(type != NULL);
33088a253ec2SKONRAD Frederic 
33098a253ec2SKONRAD Frederic     g_free(n->netclient_name);
33108a253ec2SKONRAD Frederic     g_free(n->netclient_type);
33118a253ec2SKONRAD Frederic     n->netclient_name = g_strdup(name);
33128a253ec2SKONRAD Frederic     n->netclient_type = g_strdup(type);
33138a253ec2SKONRAD Frederic }
33148a253ec2SKONRAD Frederic 
33150e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev)
33169711cd0dSJens Freimann {
33179711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
33189711cd0dSJens Freimann     PCIDevice *pci_dev;
33199711cd0dSJens Freimann     Error *err = NULL;
33209711cd0dSJens Freimann 
33210e9a65c5SJuan Quintela     hotplug_ctrl = qdev_get_hotplug_handler(dev);
33229711cd0dSJens Freimann     if (hotplug_ctrl) {
33230e9a65c5SJuan Quintela         pci_dev = PCI_DEVICE(dev);
33249711cd0dSJens Freimann         pci_dev->partially_hotplugged = true;
33250e9a65c5SJuan Quintela         hotplug_handler_unplug_request(hotplug_ctrl, dev, &err);
33269711cd0dSJens Freimann         if (err) {
33279711cd0dSJens Freimann             error_report_err(err);
33289711cd0dSJens Freimann             return false;
33299711cd0dSJens Freimann         }
33309711cd0dSJens Freimann     } else {
33319711cd0dSJens Freimann         return false;
33329711cd0dSJens Freimann     }
33339711cd0dSJens Freimann     return true;
33349711cd0dSJens Freimann }
33359711cd0dSJens Freimann 
33360e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev,
33370e9a65c5SJuan Quintela                                     Error **errp)
33389711cd0dSJens Freimann {
33395a0948d3SMarkus Armbruster     Error *err = NULL;
33409711cd0dSJens Freimann     HotplugHandler *hotplug_ctrl;
33410e9a65c5SJuan Quintela     PCIDevice *pdev = PCI_DEVICE(dev);
334278274682SJuan Quintela     BusState *primary_bus;
33439711cd0dSJens Freimann 
33449711cd0dSJens Freimann     if (!pdev->partially_hotplugged) {
33459711cd0dSJens Freimann         return true;
33469711cd0dSJens Freimann     }
33470e9a65c5SJuan Quintela     primary_bus = dev->parent_bus;
334878274682SJuan Quintela     if (!primary_bus) {
3349150ab54aSJens Freimann         error_setg(errp, "virtio_net: couldn't find primary bus");
33505a0948d3SMarkus Armbruster         return false;
33519711cd0dSJens Freimann     }
33520e9a65c5SJuan Quintela     qdev_set_parent_bus(dev, primary_bus, &error_abort);
3353e2bde83eSJuan Quintela     qatomic_set(&n->failover_primary_hidden, false);
33540e9a65c5SJuan Quintela     hotplug_ctrl = qdev_get_hotplug_handler(dev);
33559711cd0dSJens Freimann     if (hotplug_ctrl) {
33560e9a65c5SJuan Quintela         hotplug_handler_pre_plug(hotplug_ctrl, dev, &err);
33575a0948d3SMarkus Armbruster         if (err) {
33585a0948d3SMarkus Armbruster             goto out;
33595a0948d3SMarkus Armbruster         }
33600e9a65c5SJuan Quintela         hotplug_handler_plug(hotplug_ctrl, dev, &err);
33619711cd0dSJens Freimann     }
3362109c20eaSLaurent Vivier     pdev->partially_hotplugged = false;
3363150ab54aSJens Freimann 
3364150ab54aSJens Freimann out:
33655a0948d3SMarkus Armbruster     error_propagate(errp, err);
33665a0948d3SMarkus Armbruster     return !err;
33679711cd0dSJens Freimann }
33689711cd0dSJens Freimann 
336907a5d816SJuan Quintela static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationState *s)
33709711cd0dSJens Freimann {
33719711cd0dSJens Freimann     bool should_be_hidden;
33729711cd0dSJens Freimann     Error *err = NULL;
337307a5d816SJuan Quintela     DeviceState *dev = failover_find_primary_device(n);
337407a5d816SJuan Quintela 
337507a5d816SJuan Quintela     if (!dev) {
337607a5d816SJuan Quintela         return;
337707a5d816SJuan Quintela     }
33789711cd0dSJens Freimann 
3379e2bde83eSJuan Quintela     should_be_hidden = qatomic_read(&n->failover_primary_hidden);
33809711cd0dSJens Freimann 
33814dbac1aeSMarkus Armbruster     if (migration_in_setup(s) && !should_be_hidden) {
338207a5d816SJuan Quintela         if (failover_unplug_primary(n, dev)) {
338307a5d816SJuan Quintela             vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev);
338407a5d816SJuan Quintela             qapi_event_send_unplug_primary(dev->id);
3385e2bde83eSJuan Quintela             qatomic_set(&n->failover_primary_hidden, true);
33869711cd0dSJens Freimann         } else {
33879711cd0dSJens Freimann             warn_report("couldn't unplug primary device");
33889711cd0dSJens Freimann         }
33899711cd0dSJens Freimann     } else if (migration_has_failed(s)) {
3390150ab54aSJens Freimann         /* We already unplugged the device let's plug it back */
339107a5d816SJuan Quintela         if (!failover_replug_primary(n, dev, &err)) {
33929711cd0dSJens Freimann             if (err) {
33939711cd0dSJens Freimann                 error_report_err(err);
33949711cd0dSJens Freimann             }
33959711cd0dSJens Freimann         }
33969711cd0dSJens Freimann     }
33979711cd0dSJens Freimann }
33989711cd0dSJens Freimann 
33999711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data)
34009711cd0dSJens Freimann {
34019711cd0dSJens Freimann     MigrationState *s = data;
34029711cd0dSJens Freimann     VirtIONet *n = container_of(notifier, VirtIONet, migration_state);
34039711cd0dSJens Freimann     virtio_net_handle_migration_primary(n, s);
34049711cd0dSJens Freimann }
34059711cd0dSJens Freimann 
3406b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener,
3407f3558b1bSKevin Wolf                                          const QDict *device_opts,
3408f3558b1bSKevin Wolf                                          bool from_json,
3409f3558b1bSKevin Wolf                                          Error **errp)
34109711cd0dSJens Freimann {
34119711cd0dSJens Freimann     VirtIONet *n = container_of(listener, VirtIONet, primary_listener);
34124f0303aeSJuan Quintela     const char *standby_id;
34139711cd0dSJens Freimann 
34144d0e59acSJens Freimann     if (!device_opts) {
341589631fedSJuan Quintela         return false;
34164d0e59acSJens Freimann     }
3417bcfc906bSLaurent Vivier 
3418bcfc906bSLaurent Vivier     if (!qdict_haskey(device_opts, "failover_pair_id")) {
3419bcfc906bSLaurent Vivier         return false;
3420bcfc906bSLaurent Vivier     }
3421bcfc906bSLaurent Vivier 
3422bcfc906bSLaurent Vivier     if (!qdict_haskey(device_opts, "id")) {
3423bcfc906bSLaurent Vivier         error_setg(errp, "Device with failover_pair_id needs to have id");
3424bcfc906bSLaurent Vivier         return false;
3425bcfc906bSLaurent Vivier     }
3426bcfc906bSLaurent Vivier 
3427bcfc906bSLaurent Vivier     standby_id = qdict_get_str(device_opts, "failover_pair_id");
342889631fedSJuan Quintela     if (g_strcmp0(standby_id, n->netclient_name) != 0) {
342989631fedSJuan Quintela         return false;
34309711cd0dSJens Freimann     }
34319711cd0dSJens Freimann 
34327fe7791eSLaurent Vivier     /*
34337fe7791eSLaurent Vivier      * The hide helper can be called several times for a given device.
34347fe7791eSLaurent Vivier      * Check there is only one primary for a virtio-net device but
34357fe7791eSLaurent Vivier      * don't duplicate the qdict several times if it's called for the same
34367fe7791eSLaurent Vivier      * device.
34377fe7791eSLaurent Vivier      */
3438259a10dbSKevin Wolf     if (n->primary_opts) {
34397fe7791eSLaurent Vivier         const char *old, *new;
34407fe7791eSLaurent Vivier         /* devices with failover_pair_id always have an id */
34417fe7791eSLaurent Vivier         old = qdict_get_str(n->primary_opts, "id");
34427fe7791eSLaurent Vivier         new = qdict_get_str(device_opts, "id");
34437fe7791eSLaurent Vivier         if (strcmp(old, new) != 0) {
34447fe7791eSLaurent Vivier             error_setg(errp, "Cannot attach more than one primary device to "
34457fe7791eSLaurent Vivier                        "'%s': '%s' and '%s'", n->netclient_name, old, new);
3446259a10dbSKevin Wolf             return false;
3447259a10dbSKevin Wolf         }
34487fe7791eSLaurent Vivier     } else {
3449f3558b1bSKevin Wolf         n->primary_opts = qdict_clone_shallow(device_opts);
3450f3558b1bSKevin Wolf         n->primary_opts_from_json = from_json;
34517fe7791eSLaurent Vivier     }
3452259a10dbSKevin Wolf 
3453e2bde83eSJuan Quintela     /* failover_primary_hidden is set during feature negotiation */
34543abad4a2SJuan Quintela     return qatomic_read(&n->failover_primary_hidden);
34559711cd0dSJens Freimann }
34569711cd0dSJens Freimann 
3457e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp)
345817ec5a86SKONRAD Frederic {
3459e6f746b3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3460284a32f0SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3461284a32f0SAndreas Färber     NetClientState *nc;
34621773d9eeSKONRAD Frederic     int i;
346317ec5a86SKONRAD Frederic 
3464a93e599dSMaxime Coquelin     if (n->net_conf.mtu) {
3465127833eeSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_MTU);
3466a93e599dSMaxime Coquelin     }
3467a93e599dSMaxime Coquelin 
34689473939eSJason Baron     if (n->net_conf.duplex_str) {
34699473939eSJason Baron         if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) {
34709473939eSJason Baron             n->net_conf.duplex = DUPLEX_HALF;
34719473939eSJason Baron         } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) {
34729473939eSJason Baron             n->net_conf.duplex = DUPLEX_FULL;
34739473939eSJason Baron         } else {
34749473939eSJason Baron             error_setg(errp, "'duplex' must be 'half' or 'full'");
3475843c4cfcSMarkus Armbruster             return;
34769473939eSJason Baron         }
34779473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
34789473939eSJason Baron     } else {
34799473939eSJason Baron         n->net_conf.duplex = DUPLEX_UNKNOWN;
34809473939eSJason Baron     }
34819473939eSJason Baron 
34829473939eSJason Baron     if (n->net_conf.speed < SPEED_UNKNOWN) {
34839473939eSJason Baron         error_setg(errp, "'speed' must be between 0 and INT_MAX");
3484843c4cfcSMarkus Armbruster         return;
3485843c4cfcSMarkus Armbruster     }
3486843c4cfcSMarkus Armbruster     if (n->net_conf.speed >= 0) {
34879473939eSJason Baron         n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX);
34889473939eSJason Baron     }
34899473939eSJason Baron 
34909711cd0dSJens Freimann     if (n->failover) {
3491b91ad981SJuan Quintela         n->primary_listener.hide_device = failover_hide_primary_device;
3492e2bde83eSJuan Quintela         qatomic_set(&n->failover_primary_hidden, true);
34939711cd0dSJens Freimann         device_listener_register(&n->primary_listener);
34949711cd0dSJens Freimann         n->migration_state.notify = virtio_net_migration_state_notifier;
34959711cd0dSJens Freimann         add_migration_state_change_notifier(&n->migration_state);
34969711cd0dSJens Freimann         n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY);
34979711cd0dSJens Freimann     }
34989711cd0dSJens Freimann 
3499da3e8a23SShannon Zhao     virtio_net_set_config_size(n, n->host_features);
35003857cd5cSJonah Palmer     virtio_init(vdev, VIRTIO_ID_NET, n->config_size);
350117ec5a86SKONRAD Frederic 
35021c0fbfa3SMichael S. Tsirkin     /*
35031c0fbfa3SMichael S. Tsirkin      * We set a lower limit on RX queue size to what it always was.
35041c0fbfa3SMichael S. Tsirkin      * Guests that want a smaller ring can always resize it without
35051c0fbfa3SMichael S. Tsirkin      * help from us (using virtio 1 and up).
35061c0fbfa3SMichael S. Tsirkin      */
35071c0fbfa3SMichael S. Tsirkin     if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE ||
35081c0fbfa3SMichael S. Tsirkin         n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE ||
35095f997fd1SMichal Privoznik         !is_power_of_2(n->net_conf.rx_queue_size)) {
35101c0fbfa3SMichael S. Tsirkin         error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), "
35111c0fbfa3SMichael S. Tsirkin                    "must be a power of 2 between %d and %d.",
35121c0fbfa3SMichael S. Tsirkin                    n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE,
35131c0fbfa3SMichael S. Tsirkin                    VIRTQUEUE_MAX_SIZE);
35141c0fbfa3SMichael S. Tsirkin         virtio_cleanup(vdev);
35151c0fbfa3SMichael S. Tsirkin         return;
35161c0fbfa3SMichael S. Tsirkin     }
35171c0fbfa3SMichael S. Tsirkin 
35189b02e161SWei Wang     if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE ||
35199b02e161SWei Wang         n->net_conf.tx_queue_size > VIRTQUEUE_MAX_SIZE ||
35209b02e161SWei Wang         !is_power_of_2(n->net_conf.tx_queue_size)) {
35219b02e161SWei Wang         error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), "
35229b02e161SWei Wang                    "must be a power of 2 between %d and %d",
35239b02e161SWei Wang                    n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE,
35249b02e161SWei Wang                    VIRTQUEUE_MAX_SIZE);
35259b02e161SWei Wang         virtio_cleanup(vdev);
35269b02e161SWei Wang         return;
35279b02e161SWei Wang     }
35289b02e161SWei Wang 
352922288fe5SJason Wang     n->max_ncs = MAX(n->nic_conf.peers.queues, 1);
353022288fe5SJason Wang 
353122288fe5SJason Wang     /*
353222288fe5SJason Wang      * Figure out the datapath queue pairs since the backend could
353322288fe5SJason Wang      * provide control queue via peers as well.
353422288fe5SJason Wang      */
353522288fe5SJason Wang     if (n->nic_conf.peers.queues) {
353622288fe5SJason Wang         for (i = 0; i < n->max_ncs; i++) {
353722288fe5SJason Wang             if (n->nic_conf.peers.ncs[i]->is_datapath) {
353822288fe5SJason Wang                 ++n->max_queue_pairs;
353922288fe5SJason Wang             }
354022288fe5SJason Wang         }
354122288fe5SJason Wang     }
354222288fe5SJason Wang     n->max_queue_pairs = MAX(n->max_queue_pairs, 1);
354322288fe5SJason Wang 
3544441537f1SJason Wang     if (n->max_queue_pairs * 2 + 1 > VIRTIO_QUEUE_MAX) {
354522288fe5SJason Wang         error_setg(errp, "Invalid number of queue pairs (= %" PRIu32 "), "
3546631b22eaSStefan Weil                    "must be a positive integer less than %d.",
3547441537f1SJason Wang                    n->max_queue_pairs, (VIRTIO_QUEUE_MAX - 1) / 2);
35487e0e736eSJason Wang         virtio_cleanup(vdev);
35497e0e736eSJason Wang         return;
35507e0e736eSJason Wang     }
3551b21e2380SMarkus Armbruster     n->vqs = g_new0(VirtIONetQueue, n->max_queue_pairs);
3552441537f1SJason Wang     n->curr_queue_pairs = 1;
35531773d9eeSKONRAD Frederic     n->tx_timeout = n->net_conf.txtimer;
35546e790746SPaolo Bonzini 
35551773d9eeSKONRAD Frederic     if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
35561773d9eeSKONRAD Frederic                        && strcmp(n->net_conf.tx, "bh")) {
35570765691eSMarkus Armbruster         warn_report("virtio-net: "
35586e790746SPaolo Bonzini                     "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
35591773d9eeSKONRAD Frederic                     n->net_conf.tx);
35600765691eSMarkus Armbruster         error_printf("Defaulting to \"bh\"");
35616e790746SPaolo Bonzini     }
35626e790746SPaolo Bonzini 
35632eef278bSMichael S. Tsirkin     n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n),
35642eef278bSMichael S. Tsirkin                                     n->net_conf.tx_queue_size);
35659b02e161SWei Wang 
3566441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
3567f9d6dbf0SWen Congyang         virtio_net_add_queue(n, i);
3568da51a335SJason Wang     }
3569da51a335SJason Wang 
357017a0ca55SKONRAD Frederic     n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
35711773d9eeSKONRAD Frederic     qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
35721773d9eeSKONRAD Frederic     memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
35736e790746SPaolo Bonzini     n->status = VIRTIO_NET_S_LINK_UP;
35749d8c6a25SDr. David Alan Gilbert     qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(),
35759d8c6a25SDr. David Alan Gilbert                               QEMU_CLOCK_VIRTUAL,
3576f57fcf70SJason Wang                               virtio_net_announce_timer, n);
3577b2c929f0SDr. David Alan Gilbert     n->announce_timer.round = 0;
35786e790746SPaolo Bonzini 
35798a253ec2SKONRAD Frederic     if (n->netclient_type) {
35808a253ec2SKONRAD Frederic         /*
35818a253ec2SKONRAD Frederic          * Happen when virtio_net_set_netclient_name has been called.
35828a253ec2SKONRAD Frederic          */
35838a253ec2SKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
35848a253ec2SKONRAD Frederic                               n->netclient_type, n->netclient_name, n);
35858a253ec2SKONRAD Frederic     } else {
35861773d9eeSKONRAD Frederic         n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
3587284a32f0SAndreas Färber                               object_get_typename(OBJECT(dev)), dev->id, n);
35888a253ec2SKONRAD Frederic     }
35898a253ec2SKONRAD Frederic 
3590441537f1SJason Wang     for (i = 0; i < n->max_queue_pairs; i++) {
3591d4c62930SBin Meng         n->nic->ncs[i].do_not_pad = true;
3592d4c62930SBin Meng     }
3593d4c62930SBin Meng 
35946e790746SPaolo Bonzini     peer_test_vnet_hdr(n);
35956e790746SPaolo Bonzini     if (peer_has_vnet_hdr(n)) {
3596441537f1SJason Wang         for (i = 0; i < n->max_queue_pairs; i++) {
3597d6085e3aSStefan Hajnoczi             qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
35986e790746SPaolo Bonzini         }
35996e790746SPaolo Bonzini         n->host_hdr_len = sizeof(struct virtio_net_hdr);
36006e790746SPaolo Bonzini     } else {
36016e790746SPaolo Bonzini         n->host_hdr_len = 0;
36026e790746SPaolo Bonzini     }
36036e790746SPaolo Bonzini 
36041773d9eeSKONRAD Frederic     qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
36056e790746SPaolo Bonzini 
36066e790746SPaolo Bonzini     n->vqs[0].tx_waiting = 0;
36071773d9eeSKONRAD Frederic     n->tx_burst = n->net_conf.txburst;
3608e22f0603SYuri Benditovich     virtio_net_set_mrg_rx_bufs(n, 0, 0, 0);
36096e790746SPaolo Bonzini     n->promisc = 1; /* for compatibility */
36106e790746SPaolo Bonzini 
36116e790746SPaolo Bonzini     n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
36126e790746SPaolo Bonzini 
36136e790746SPaolo Bonzini     n->vlans = g_malloc0(MAX_VLAN >> 3);
36146e790746SPaolo Bonzini 
3615b1be4280SAmos Kong     nc = qemu_get_queue(n->nic);
3616b1be4280SAmos Kong     nc->rxfilter_notify_enabled = 1;
3617b1be4280SAmos Kong 
3618e87936eaSCindy Lu    if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) {
3619e87936eaSCindy Lu         struct virtio_net_config netcfg = {};
3620e87936eaSCindy Lu         memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN);
3621e87936eaSCindy Lu         vhost_net_set_config(get_vhost_net(nc->peer),
3622e87936eaSCindy Lu             (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_MASTER);
3623e87936eaSCindy Lu     }
36242974e916SYuri Benditovich     QTAILQ_INIT(&n->rsc_chains);
3625284a32f0SAndreas Färber     n->qdev = dev;
36264474e37aSYuri Benditovich 
36274474e37aSYuri Benditovich     net_rx_pkt_init(&n->rx_pkt, false);
36280145c393SAndrew Melnychenko 
36290145c393SAndrew Melnychenko     if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) {
36300145c393SAndrew Melnychenko         virtio_net_load_ebpf(n);
36310145c393SAndrew Melnychenko     }
363217ec5a86SKONRAD Frederic }
363317ec5a86SKONRAD Frederic 
3634b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev)
363517ec5a86SKONRAD Frederic {
3636306ec6c3SAndreas Färber     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
3637306ec6c3SAndreas Färber     VirtIONet *n = VIRTIO_NET(dev);
3638441537f1SJason Wang     int i, max_queue_pairs;
363917ec5a86SKONRAD Frederic 
36400145c393SAndrew Melnychenko     if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) {
36410145c393SAndrew Melnychenko         virtio_net_unload_ebpf(n);
36420145c393SAndrew Melnychenko     }
36430145c393SAndrew Melnychenko 
364417ec5a86SKONRAD Frederic     /* This will stop vhost backend if appropriate. */
364517ec5a86SKONRAD Frederic     virtio_net_set_status(vdev, 0);
364617ec5a86SKONRAD Frederic 
36478a253ec2SKONRAD Frederic     g_free(n->netclient_name);
36488a253ec2SKONRAD Frederic     n->netclient_name = NULL;
36498a253ec2SKONRAD Frederic     g_free(n->netclient_type);
36508a253ec2SKONRAD Frederic     n->netclient_type = NULL;
36518a253ec2SKONRAD Frederic 
365217ec5a86SKONRAD Frederic     g_free(n->mac_table.macs);
365317ec5a86SKONRAD Frederic     g_free(n->vlans);
365417ec5a86SKONRAD Frederic 
36559711cd0dSJens Freimann     if (n->failover) {
3656f3558b1bSKevin Wolf         qobject_unref(n->primary_opts);
365765018100SJuan Quintela         device_listener_unregister(&n->primary_listener);
36581e157667SLaurent Vivier         remove_migration_state_change_notifier(&n->migration_state);
3659f3558b1bSKevin Wolf     } else {
3660f3558b1bSKevin Wolf         assert(n->primary_opts == NULL);
36619711cd0dSJens Freimann     }
36629711cd0dSJens Freimann 
3663441537f1SJason Wang     max_queue_pairs = n->multiqueue ? n->max_queue_pairs : 1;
3664441537f1SJason Wang     for (i = 0; i < max_queue_pairs; i++) {
3665f9d6dbf0SWen Congyang         virtio_net_del_queue(n, i);
366617ec5a86SKONRAD Frederic     }
3667d945d9f1SYuri Benditovich     /* delete also control vq */
3668441537f1SJason Wang     virtio_del_queue(vdev, max_queue_pairs * 2);
3669944458b6SDr. David Alan Gilbert     qemu_announce_timer_del(&n->announce_timer, false);
367017ec5a86SKONRAD Frederic     g_free(n->vqs);
367117ec5a86SKONRAD Frederic     qemu_del_nic(n->nic);
36722974e916SYuri Benditovich     virtio_net_rsc_cleanup(n);
367359079029SYuri Benditovich     g_free(n->rss_data.indirections_table);
36744474e37aSYuri Benditovich     net_rx_pkt_uninit(n->rx_pkt);
36756a1a8cc7SKONRAD Frederic     virtio_cleanup(vdev);
367617ec5a86SKONRAD Frederic }
367717ec5a86SKONRAD Frederic 
367817ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj)
367917ec5a86SKONRAD Frederic {
368017ec5a86SKONRAD Frederic     VirtIONet *n = VIRTIO_NET(obj);
368117ec5a86SKONRAD Frederic 
368217ec5a86SKONRAD Frederic     /*
368317ec5a86SKONRAD Frederic      * The default config_size is sizeof(struct virtio_net_config).
368417ec5a86SKONRAD Frederic      * Can be overriden with virtio_net_set_config_size.
368517ec5a86SKONRAD Frederic      */
368617ec5a86SKONRAD Frederic     n->config_size = sizeof(struct virtio_net_config);
3687aa4197c3SGonglei     device_add_bootindex_property(obj, &n->nic_conf.bootindex,
3688aa4197c3SGonglei                                   "bootindex", "/ethernet-phy@0",
368940c2281cSMarkus Armbruster                                   DEVICE(n));
36900145c393SAndrew Melnychenko 
36910145c393SAndrew Melnychenko     ebpf_rss_init(&n->ebpf_rss);
369217ec5a86SKONRAD Frederic }
369317ec5a86SKONRAD Frederic 
369444b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque)
36954d45dcfbSHalil Pasic {
36964d45dcfbSHalil Pasic     VirtIONet *n = opaque;
36974d45dcfbSHalil Pasic 
36984d45dcfbSHalil Pasic     /* At this point, backend must be stopped, otherwise
36994d45dcfbSHalil Pasic      * it might keep writing to memory. */
37004d45dcfbSHalil Pasic     assert(!n->vhost_started);
370144b1ff31SDr. David Alan Gilbert 
370244b1ff31SDr. David Alan Gilbert     return 0;
37034d45dcfbSHalil Pasic }
37044d45dcfbSHalil Pasic 
37059711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque)
37069711cd0dSJens Freimann {
37079711cd0dSJens Freimann     DeviceState *dev = opaque;
370821e8709bSJuan Quintela     DeviceState *primary;
37099711cd0dSJens Freimann     VirtIODevice *vdev = VIRTIO_DEVICE(dev);
37109711cd0dSJens Freimann     VirtIONet *n = VIRTIO_NET(vdev);
37119711cd0dSJens Freimann 
3712284f42a5SJens Freimann     if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) {
3713284f42a5SJens Freimann         return false;
3714284f42a5SJens Freimann     }
371521e8709bSJuan Quintela     primary = failover_find_primary_device(n);
371621e8709bSJuan Quintela     return primary ? primary->pending_deleted_event : false;
37179711cd0dSJens Freimann }
37189711cd0dSJens Freimann 
37199711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque)
37209711cd0dSJens Freimann {
37219711cd0dSJens Freimann     DeviceState *dev = opaque;
37229711cd0dSJens Freimann     VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev);
37239711cd0dSJens Freimann 
37249711cd0dSJens Freimann     return vdc->primary_unplug_pending(dev);
37259711cd0dSJens Freimann }
37269711cd0dSJens Freimann 
3727c255488dSJonah Palmer static struct vhost_dev *virtio_net_get_vhost(VirtIODevice *vdev)
3728c255488dSJonah Palmer {
3729c255488dSJonah Palmer     VirtIONet *n = VIRTIO_NET(vdev);
3730c255488dSJonah Palmer     NetClientState *nc = qemu_get_queue(n->nic);
3731c255488dSJonah Palmer     struct vhost_net *net = get_vhost_net(nc->peer);
3732c255488dSJonah Palmer     return &net->dev;
3733c255488dSJonah Palmer }
3734c255488dSJonah Palmer 
37354d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = {
37364d45dcfbSHalil Pasic     .name = "virtio-net",
37374d45dcfbSHalil Pasic     .minimum_version_id = VIRTIO_NET_VM_VERSION,
37384d45dcfbSHalil Pasic     .version_id = VIRTIO_NET_VM_VERSION,
37394d45dcfbSHalil Pasic     .fields = (VMStateField[]) {
37404d45dcfbSHalil Pasic         VMSTATE_VIRTIO_DEVICE,
37414d45dcfbSHalil Pasic         VMSTATE_END_OF_LIST()
37424d45dcfbSHalil Pasic     },
37434d45dcfbSHalil Pasic     .pre_save = virtio_net_pre_save,
37449711cd0dSJens Freimann     .dev_unplug_pending = dev_unplug_pending,
37454d45dcfbSHalil Pasic };
3746290c2428SDr. David Alan Gilbert 
374717ec5a86SKONRAD Frederic static Property virtio_net_properties[] = {
3748127833eeSJason Baron     DEFINE_PROP_BIT64("csum", VirtIONet, host_features,
3749127833eeSJason Baron                     VIRTIO_NET_F_CSUM, true),
3750127833eeSJason Baron     DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features,
375187108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_CSUM, true),
3752127833eeSJason Baron     DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true),
3753127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features,
375487108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO4, true),
3755127833eeSJason Baron     DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features,
375687108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_TSO6, true),
3757127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features,
375887108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ECN, true),
3759127833eeSJason Baron     DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features,
376087108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_UFO, true),
3761127833eeSJason Baron     DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features,
376287108bb2SShannon Zhao                     VIRTIO_NET_F_GUEST_ANNOUNCE, true),
3763127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features,
376487108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO4, true),
3765127833eeSJason Baron     DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features,
376687108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_TSO6, true),
3767127833eeSJason Baron     DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features,
376887108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_ECN, true),
3769127833eeSJason Baron     DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features,
377087108bb2SShannon Zhao                     VIRTIO_NET_F_HOST_UFO, true),
3771127833eeSJason Baron     DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features,
377287108bb2SShannon Zhao                     VIRTIO_NET_F_MRG_RXBUF, true),
3773127833eeSJason Baron     DEFINE_PROP_BIT64("status", VirtIONet, host_features,
377487108bb2SShannon Zhao                     VIRTIO_NET_F_STATUS, true),
3775127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features,
377687108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VQ, true),
3777127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features,
377887108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX, true),
3779127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features,
378087108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_VLAN, true),
3781127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features,
378287108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_RX_EXTRA, true),
3783127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features,
378487108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_MAC_ADDR, true),
3785127833eeSJason Baron     DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features,
378687108bb2SShannon Zhao                     VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true),
3787127833eeSJason Baron     DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false),
378859079029SYuri Benditovich     DEFINE_PROP_BIT64("rss", VirtIONet, host_features,
378959079029SYuri Benditovich                     VIRTIO_NET_F_RSS, false),
3790e22f0603SYuri Benditovich     DEFINE_PROP_BIT64("hash", VirtIONet, host_features,
3791e22f0603SYuri Benditovich                     VIRTIO_NET_F_HASH_REPORT, false),
37922974e916SYuri Benditovich     DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features,
37932974e916SYuri Benditovich                     VIRTIO_NET_F_RSC_EXT, false),
37942974e916SYuri Benditovich     DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout,
37952974e916SYuri Benditovich                        VIRTIO_NET_RSC_DEFAULT_INTERVAL),
379617ec5a86SKONRAD Frederic     DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
379717ec5a86SKONRAD Frederic     DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
379817ec5a86SKONRAD Frederic                        TX_TIMER_INTERVAL),
379917ec5a86SKONRAD Frederic     DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
380017ec5a86SKONRAD Frederic     DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
38011c0fbfa3SMichael S. Tsirkin     DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size,
38021c0fbfa3SMichael S. Tsirkin                        VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE),
38039b02e161SWei Wang     DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size,
38049b02e161SWei Wang                        VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE),
3805a93e599dSMaxime Coquelin     DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0),
380675ebec11SMaxime Coquelin     DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend,
380775ebec11SMaxime Coquelin                      true),
38089473939eSJason Baron     DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN),
38099473939eSJason Baron     DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str),
38109711cd0dSJens Freimann     DEFINE_PROP_BOOL("failover", VirtIONet, failover, false),
381117ec5a86SKONRAD Frederic     DEFINE_PROP_END_OF_LIST(),
381217ec5a86SKONRAD Frederic };
381317ec5a86SKONRAD Frederic 
381417ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data)
381517ec5a86SKONRAD Frederic {
381617ec5a86SKONRAD Frederic     DeviceClass *dc = DEVICE_CLASS(klass);
381717ec5a86SKONRAD Frederic     VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
3818e6f746b3SAndreas Färber 
38194f67d30bSMarc-André Lureau     device_class_set_props(dc, virtio_net_properties);
3820290c2428SDr. David Alan Gilbert     dc->vmsd = &vmstate_virtio_net;
3821125ee0edSMarcel Apfelbaum     set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
3822e6f746b3SAndreas Färber     vdc->realize = virtio_net_device_realize;
3823306ec6c3SAndreas Färber     vdc->unrealize = virtio_net_device_unrealize;
382417ec5a86SKONRAD Frederic     vdc->get_config = virtio_net_get_config;
382517ec5a86SKONRAD Frederic     vdc->set_config = virtio_net_set_config;
382617ec5a86SKONRAD Frederic     vdc->get_features = virtio_net_get_features;
382717ec5a86SKONRAD Frederic     vdc->set_features = virtio_net_set_features;
382817ec5a86SKONRAD Frederic     vdc->bad_features = virtio_net_bad_features;
382917ec5a86SKONRAD Frederic     vdc->reset = virtio_net_reset;
383017ec5a86SKONRAD Frederic     vdc->set_status = virtio_net_set_status;
383117ec5a86SKONRAD Frederic     vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
383217ec5a86SKONRAD Frederic     vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
38332a083ffdSMichael S. Tsirkin     vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO);
38347788c3f2SMikhail Sennikovsky     vdc->post_load = virtio_net_post_load_virtio;
3835982b78c5SDr. David Alan Gilbert     vdc->vmsd = &vmstate_virtio_net_device;
38369711cd0dSJens Freimann     vdc->primary_unplug_pending = primary_unplug_pending;
3837c255488dSJonah Palmer     vdc->get_vhost = virtio_net_get_vhost;
383817ec5a86SKONRAD Frederic }
383917ec5a86SKONRAD Frederic 
384017ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = {
384117ec5a86SKONRAD Frederic     .name = TYPE_VIRTIO_NET,
384217ec5a86SKONRAD Frederic     .parent = TYPE_VIRTIO_DEVICE,
384317ec5a86SKONRAD Frederic     .instance_size = sizeof(VirtIONet),
384417ec5a86SKONRAD Frederic     .instance_init = virtio_net_instance_init,
384517ec5a86SKONRAD Frederic     .class_init = virtio_net_class_init,
384617ec5a86SKONRAD Frederic };
384717ec5a86SKONRAD Frederic 
384817ec5a86SKONRAD Frederic static void virtio_register_types(void)
384917ec5a86SKONRAD Frederic {
385017ec5a86SKONRAD Frederic     type_register_static(&virtio_net_info);
385117ec5a86SKONRAD Frederic }
385217ec5a86SKONRAD Frederic 
385317ec5a86SKONRAD Frederic type_init(virtio_register_types)
3854