16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Network Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 149b8bfe21SPeter Maydell #include "qemu/osdep.h" 159711cd0dSJens Freimann #include "qemu/atomic.h" 166e790746SPaolo Bonzini #include "qemu/iov.h" 1768b0a639SSi-Wei Liu #include "qemu/log.h" 18db725815SMarkus Armbruster #include "qemu/main-loop.h" 190b8fa32fSMarkus Armbruster #include "qemu/module.h" 206e790746SPaolo Bonzini #include "hw/virtio/virtio.h" 216e790746SPaolo Bonzini #include "net/net.h" 226e790746SPaolo Bonzini #include "net/checksum.h" 236e790746SPaolo Bonzini #include "net/tap.h" 246e790746SPaolo Bonzini #include "qemu/error-report.h" 256e790746SPaolo Bonzini #include "qemu/timer.h" 269711cd0dSJens Freimann #include "qemu/option.h" 279711cd0dSJens Freimann #include "qemu/option_int.h" 289711cd0dSJens Freimann #include "qemu/config-file.h" 299711cd0dSJens Freimann #include "qapi/qmp/qdict.h" 306e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h" 316e790746SPaolo Bonzini #include "net/vhost_net.h" 329d8c6a25SDr. David Alan Gilbert #include "net/announce.h" 3317ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h" 34e688df6bSMarkus Armbruster #include "qapi/error.h" 359af23989SMarkus Armbruster #include "qapi/qapi-events-net.h" 36a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h" 379711cd0dSJens Freimann #include "qapi/qapi-types-migration.h" 389711cd0dSJens Freimann #include "qapi/qapi-events-migration.h" 391399c60dSRusty Russell #include "hw/virtio/virtio-access.h" 40f8d806c9SJuan Quintela #include "migration/misc.h" 419473939eSJason Baron #include "standard-headers/linux/ethtool.h" 422f780b6aSMarkus Armbruster #include "sysemu/sysemu.h" 439d8c6a25SDr. David Alan Gilbert #include "trace.h" 449711cd0dSJens Freimann #include "monitor/qdev.h" 45edf5ca5dSMarkus Armbruster #include "hw/pci/pci_device.h" 464474e37aSYuri Benditovich #include "net_rx_pkt.h" 47108a6481SCindy Lu #include "hw/virtio/vhost.h" 481b529d90SLaurent Vivier #include "sysemu/qtest.h" 496e790746SPaolo Bonzini 506e790746SPaolo Bonzini #define VIRTIO_NET_VM_VERSION 11 516e790746SPaolo Bonzini 521c0fbfa3SMichael S. Tsirkin /* previously fixed value */ 531c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256 549b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256 559b02e161SWei Wang 56441537f1SJason Wang /* for now, only allow larger queue_pairs; with virtio-1, guest can downsize */ 571c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 589b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 591c0fbfa3SMichael S. Tsirkin 602974e916SYuri Benditovich #define VIRTIO_NET_IP4_ADDR_SIZE 8 /* ipv4 saddr + daddr */ 612974e916SYuri Benditovich 622974e916SYuri Benditovich #define VIRTIO_NET_TCP_FLAG 0x3F 632974e916SYuri Benditovich #define VIRTIO_NET_TCP_HDR_LENGTH 0xF000 642974e916SYuri Benditovich 652974e916SYuri Benditovich /* IPv4 max payload, 16 bits in the header */ 662974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header)) 672974e916SYuri Benditovich #define VIRTIO_NET_MAX_TCP_PAYLOAD 65535 682974e916SYuri Benditovich 692974e916SYuri Benditovich /* header length value in ip header without option */ 702974e916SYuri Benditovich #define VIRTIO_NET_IP4_HEADER_LENGTH 5 712974e916SYuri Benditovich 722974e916SYuri Benditovich #define VIRTIO_NET_IP6_ADDR_SIZE 32 /* ipv6 saddr + daddr */ 732974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD 742974e916SYuri Benditovich 752974e916SYuri Benditovich /* Purge coalesced packets timer interval, This value affects the performance 762974e916SYuri Benditovich a lot, and should be tuned carefully, '300000'(300us) is the recommended 772974e916SYuri Benditovich value to pass the WHQL test, '50000' can gain 2x netperf throughput with 782974e916SYuri Benditovich tso/gso/gro 'off'. */ 792974e916SYuri Benditovich #define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000 802974e916SYuri Benditovich 8159079029SYuri Benditovich #define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \ 8259079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \ 8359079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \ 8459079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \ 8559079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \ 8659079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \ 8759079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \ 8859079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \ 8959079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) 9059079029SYuri Benditovich 91ad6461adSPhilippe Mathieu-Daudé static const VirtIOFeature feature_sizes[] = { 92127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MAC, 935d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mac)}, 94127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_STATUS, 955d5b33c0SMax Reitz .end = endof(struct virtio_net_config, status)}, 96127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MQ, 975d5b33c0SMax Reitz .end = endof(struct virtio_net_config, max_virtqueue_pairs)}, 98127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MTU, 995d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mtu)}, 1009473939eSJason Baron {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX, 1015d5b33c0SMax Reitz .end = endof(struct virtio_net_config, duplex)}, 102e22f0603SYuri Benditovich {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT), 10359079029SYuri Benditovich .end = endof(struct virtio_net_config, supported_hash_types)}, 1046e790746SPaolo Bonzini {} 1056e790746SPaolo Bonzini }; 1066e790746SPaolo Bonzini 107d74c30c8SDaniil Tatianin static const VirtIOConfigSizeParams cfg_size_params = { 108d74c30c8SDaniil Tatianin .min_size = endof(struct virtio_net_config, mac), 109d74c30c8SDaniil Tatianin .max_size = sizeof(struct virtio_net_config), 110d74c30c8SDaniil Tatianin .feature_sizes = feature_sizes 111d74c30c8SDaniil Tatianin }; 112d74c30c8SDaniil Tatianin 1136e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc) 1146e790746SPaolo Bonzini { 1156e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1166e790746SPaolo Bonzini 1176e790746SPaolo Bonzini return &n->vqs[nc->queue_index]; 1186e790746SPaolo Bonzini } 1196e790746SPaolo Bonzini 1206e790746SPaolo Bonzini static int vq2q(int queue_index) 1216e790746SPaolo Bonzini { 1226e790746SPaolo Bonzini return queue_index / 2; 1236e790746SPaolo Bonzini } 1246e790746SPaolo Bonzini 1254fdf69abSKangjie Xu static void flush_or_purge_queued_packets(NetClientState *nc) 1264fdf69abSKangjie Xu { 1274fdf69abSKangjie Xu if (!nc->peer) { 1284fdf69abSKangjie Xu return; 1294fdf69abSKangjie Xu } 1304fdf69abSKangjie Xu 1314fdf69abSKangjie Xu qemu_flush_or_purge_queued_packets(nc->peer, true); 1324fdf69abSKangjie Xu assert(!virtio_net_get_subqueue(nc)->async_tx.elem); 1334fdf69abSKangjie Xu } 1344fdf69abSKangjie Xu 1356e790746SPaolo Bonzini /* TODO 1366e790746SPaolo Bonzini * - we could suppress RX interrupt if we were so inclined. 1376e790746SPaolo Bonzini */ 1386e790746SPaolo Bonzini 1396e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config) 1406e790746SPaolo Bonzini { 14117a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1426e790746SPaolo Bonzini struct virtio_net_config netcfg; 143c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 144fb592882SCindy Lu static const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } }; 1456e790746SPaolo Bonzini 146108a6481SCindy Lu int ret = 0; 147108a6481SCindy Lu memset(&netcfg, 0 , sizeof(struct virtio_net_config)); 1481399c60dSRusty Russell virtio_stw_p(vdev, &netcfg.status, n->status); 149441537f1SJason Wang virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queue_pairs); 150a93e599dSMaxime Coquelin virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu); 1516e790746SPaolo Bonzini memcpy(netcfg.mac, n->mac, ETH_ALEN); 1529473939eSJason Baron virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed); 1539473939eSJason Baron netcfg.duplex = n->net_conf.duplex; 15459079029SYuri Benditovich netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE; 15559079029SYuri Benditovich virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length, 156e22f0603SYuri Benditovich virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ? 157e22f0603SYuri Benditovich VIRTIO_NET_RSS_MAX_TABLE_LEN : 1); 15859079029SYuri Benditovich virtio_stl_p(vdev, &netcfg.supported_hash_types, 15959079029SYuri Benditovich VIRTIO_NET_RSS_SUPPORTED_HASHES); 1606e790746SPaolo Bonzini memcpy(config, &netcfg, n->config_size); 161108a6481SCindy Lu 162c546ecf2SJason Wang /* 163c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 164c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 165c546ecf2SJason Wang */ 166c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 167108a6481SCindy Lu ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg, 168108a6481SCindy Lu n->config_size); 169ebc141a6SEugenio Pérez if (ret == -1) { 170ebc141a6SEugenio Pérez return; 171ebc141a6SEugenio Pérez } 172ebc141a6SEugenio Pérez 173fb592882SCindy Lu /* 174ebc141a6SEugenio Pérez * Some NIC/kernel combinations present 0 as the mac address. As that 175ebc141a6SEugenio Pérez * is not a legal address, try to proceed with the address from the 176ebc141a6SEugenio Pérez * QEMU command line in the hope that the address has been configured 177ebc141a6SEugenio Pérez * correctly elsewhere - just not reported by the device. 178fb592882SCindy Lu */ 179fb592882SCindy Lu if (memcmp(&netcfg.mac, &zero, sizeof(zero)) == 0) { 180fb592882SCindy Lu info_report("Zero hardware mac address detected. Ignoring."); 181fb592882SCindy Lu memcpy(netcfg.mac, n->mac, ETH_ALEN); 182fb592882SCindy Lu } 183ebc141a6SEugenio Pérez 1844f93aafcSEugenio Pérez netcfg.status |= virtio_tswap16(vdev, 1854f93aafcSEugenio Pérez n->status & VIRTIO_NET_S_ANNOUNCE); 186108a6481SCindy Lu memcpy(config, &netcfg, n->config_size); 187108a6481SCindy Lu } 188108a6481SCindy Lu } 1896e790746SPaolo Bonzini 1906e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config) 1916e790746SPaolo Bonzini { 19217a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1936e790746SPaolo Bonzini struct virtio_net_config netcfg = {}; 194c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 1956e790746SPaolo Bonzini 1966e790746SPaolo Bonzini memcpy(&netcfg, config, n->config_size); 1976e790746SPaolo Bonzini 19895129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) && 19995129d6fSCornelia Huck !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) && 2006e790746SPaolo Bonzini memcmp(netcfg.mac, n->mac, ETH_ALEN)) { 2016e790746SPaolo Bonzini memcpy(n->mac, netcfg.mac, ETH_ALEN); 2026e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 2036e790746SPaolo Bonzini } 204108a6481SCindy Lu 205c546ecf2SJason Wang /* 206c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 207c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 208c546ecf2SJason Wang */ 209c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 210c546ecf2SJason Wang vhost_net_set_config(get_vhost_net(nc->peer), 211c546ecf2SJason Wang (uint8_t *)&netcfg, 0, n->config_size, 212f8ed3648SManos Pitsidianakis VHOST_SET_CONFIG_TYPE_FRONTEND); 213108a6481SCindy Lu } 2146e790746SPaolo Bonzini } 2156e790746SPaolo Bonzini 2166e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status) 2176e790746SPaolo Bonzini { 21817a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2196e790746SPaolo Bonzini return (status & VIRTIO_CONFIG_S_DRIVER_OK) && 22017a0ca55SKONRAD Frederic (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running; 2216e790746SPaolo Bonzini } 2226e790746SPaolo Bonzini 223b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net) 224b2c929f0SDr. David Alan Gilbert { 225b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(net); 226b2c929f0SDr. David Alan Gilbert trace_virtio_net_announce_notify(); 227b2c929f0SDr. David Alan Gilbert 228b2c929f0SDr. David Alan Gilbert net->status |= VIRTIO_NET_S_ANNOUNCE; 229b2c929f0SDr. David Alan Gilbert virtio_notify_config(vdev); 230b2c929f0SDr. David Alan Gilbert } 231b2c929f0SDr. David Alan Gilbert 232f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque) 233f57fcf70SJason Wang { 234f57fcf70SJason Wang VirtIONet *n = opaque; 2359d8c6a25SDr. David Alan Gilbert trace_virtio_net_announce_timer(n->announce_timer.round); 236f57fcf70SJason Wang 2379d8c6a25SDr. David Alan Gilbert n->announce_timer.round--; 238b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 239b2c929f0SDr. David Alan Gilbert } 240b2c929f0SDr. David Alan Gilbert 241b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc) 242b2c929f0SDr. David Alan Gilbert { 243b2c929f0SDr. David Alan Gilbert VirtIONet *n = qemu_get_nic_opaque(nc); 244b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 245b2c929f0SDr. David Alan Gilbert 246b2c929f0SDr. David Alan Gilbert /* 247b2c929f0SDr. David Alan Gilbert * Make sure the virtio migration announcement timer isn't running 248b2c929f0SDr. David Alan Gilbert * If it is, let it trigger announcement so that we do not cause 249b2c929f0SDr. David Alan Gilbert * confusion. 250b2c929f0SDr. David Alan Gilbert */ 251b2c929f0SDr. David Alan Gilbert if (n->announce_timer.round) { 252b2c929f0SDr. David Alan Gilbert return; 253b2c929f0SDr. David Alan Gilbert } 254b2c929f0SDr. David Alan Gilbert 255b2c929f0SDr. David Alan Gilbert if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 256b2c929f0SDr. David Alan Gilbert virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 257b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 258b2c929f0SDr. David Alan Gilbert } 259f57fcf70SJason Wang } 260f57fcf70SJason Wang 2616e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status) 2626e790746SPaolo Bonzini { 26317a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2646e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 265441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 266aa858194SSi-Wei Liu int cvq = virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ) ? 267aa858194SSi-Wei Liu n->max_ncs - n->max_queue_pairs : 0; 2686e790746SPaolo Bonzini 269ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 2706e790746SPaolo Bonzini return; 2716e790746SPaolo Bonzini } 2726e790746SPaolo Bonzini 2738c1ac475SRadim Krčmář if ((virtio_net_started(n, status) && !nc->peer->link_down) == 2748c1ac475SRadim Krčmář !!n->vhost_started) { 2756e790746SPaolo Bonzini return; 2766e790746SPaolo Bonzini } 2776e790746SPaolo Bonzini if (!n->vhost_started) { 278086abc1cSMichael S. Tsirkin int r, i; 279086abc1cSMichael S. Tsirkin 2801bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 2811bfa316cSGreg Kurz error_report("backend does not support %s vnet headers; " 2821bfa316cSGreg Kurz "falling back on userspace virtio", 2831bfa316cSGreg Kurz virtio_is_big_endian(vdev) ? "BE" : "LE"); 2841bfa316cSGreg Kurz return; 2851bfa316cSGreg Kurz } 2861bfa316cSGreg Kurz 287086abc1cSMichael S. Tsirkin /* Any packets outstanding? Purge them to avoid touching rings 288086abc1cSMichael S. Tsirkin * when vhost is running. 289086abc1cSMichael S. Tsirkin */ 290441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 291086abc1cSMichael S. Tsirkin NetClientState *qnc = qemu_get_subqueue(n->nic, i); 292086abc1cSMichael S. Tsirkin 293086abc1cSMichael S. Tsirkin /* Purge both directions: TX and RX. */ 294086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->peer->incoming_queue, qnc); 295086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->incoming_queue, qnc->peer); 296086abc1cSMichael S. Tsirkin } 297086abc1cSMichael S. Tsirkin 298a93e599dSMaxime Coquelin if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) { 299a93e599dSMaxime Coquelin r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu); 300a93e599dSMaxime Coquelin if (r < 0) { 301a93e599dSMaxime Coquelin error_report("%uBytes MTU not supported by the backend", 302a93e599dSMaxime Coquelin n->net_conf.mtu); 303a93e599dSMaxime Coquelin 304a93e599dSMaxime Coquelin return; 305a93e599dSMaxime Coquelin } 306a93e599dSMaxime Coquelin } 307a93e599dSMaxime Coquelin 3086e790746SPaolo Bonzini n->vhost_started = 1; 30922288fe5SJason Wang r = vhost_net_start(vdev, n->nic->ncs, queue_pairs, cvq); 3106e790746SPaolo Bonzini if (r < 0) { 3116e790746SPaolo Bonzini error_report("unable to start vhost net: %d: " 3126e790746SPaolo Bonzini "falling back on userspace virtio", -r); 3136e790746SPaolo Bonzini n->vhost_started = 0; 3146e790746SPaolo Bonzini } 3156e790746SPaolo Bonzini } else { 31622288fe5SJason Wang vhost_net_stop(vdev, n->nic->ncs, queue_pairs, cvq); 3176e790746SPaolo Bonzini n->vhost_started = 0; 3186e790746SPaolo Bonzini } 3196e790746SPaolo Bonzini } 3206e790746SPaolo Bonzini 3211bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev, 3221bfa316cSGreg Kurz NetClientState *peer, 3231bfa316cSGreg Kurz bool enable) 3241bfa316cSGreg Kurz { 3251bfa316cSGreg Kurz if (virtio_is_big_endian(vdev)) { 3261bfa316cSGreg Kurz return qemu_set_vnet_be(peer, enable); 3271bfa316cSGreg Kurz } else { 3281bfa316cSGreg Kurz return qemu_set_vnet_le(peer, enable); 3291bfa316cSGreg Kurz } 3301bfa316cSGreg Kurz } 3311bfa316cSGreg Kurz 3321bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs, 333441537f1SJason Wang int queue_pairs, bool enable) 3341bfa316cSGreg Kurz { 3351bfa316cSGreg Kurz int i; 3361bfa316cSGreg Kurz 337441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 3381bfa316cSGreg Kurz if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 && 3391bfa316cSGreg Kurz enable) { 3401bfa316cSGreg Kurz while (--i >= 0) { 3411bfa316cSGreg Kurz virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false); 3421bfa316cSGreg Kurz } 3431bfa316cSGreg Kurz 3441bfa316cSGreg Kurz return true; 3451bfa316cSGreg Kurz } 3461bfa316cSGreg Kurz } 3471bfa316cSGreg Kurz 3481bfa316cSGreg Kurz return false; 3491bfa316cSGreg Kurz } 3501bfa316cSGreg Kurz 3511bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status) 3521bfa316cSGreg Kurz { 3531bfa316cSGreg Kurz VirtIODevice *vdev = VIRTIO_DEVICE(n); 354441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3551bfa316cSGreg Kurz 3561bfa316cSGreg Kurz if (virtio_net_started(n, status)) { 3571bfa316cSGreg Kurz /* Before using the device, we tell the network backend about the 3581bfa316cSGreg Kurz * endianness to use when parsing vnet headers. If the backend 3591bfa316cSGreg Kurz * can't do it, we fallback onto fixing the headers in the core 3601bfa316cSGreg Kurz * virtio-net code. 3611bfa316cSGreg Kurz */ 3621bfa316cSGreg Kurz n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs, 363441537f1SJason Wang queue_pairs, true); 3641bfa316cSGreg Kurz } else if (virtio_net_started(n, vdev->status)) { 3651bfa316cSGreg Kurz /* After using the device, we need to reset the network backend to 3661bfa316cSGreg Kurz * the default (guest native endianness), otherwise the guest may 3671bfa316cSGreg Kurz * lose network connectivity if it is rebooted into a different 3681bfa316cSGreg Kurz * endianness. 3691bfa316cSGreg Kurz */ 370441537f1SJason Wang virtio_net_set_vnet_endian(vdev, n->nic->ncs, queue_pairs, false); 3711bfa316cSGreg Kurz } 3721bfa316cSGreg Kurz } 3731bfa316cSGreg Kurz 374283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq) 375283e2c2aSYuri Benditovich { 376283e2c2aSYuri Benditovich unsigned int dropped = virtqueue_drop_all(vq); 377283e2c2aSYuri Benditovich if (dropped) { 378283e2c2aSYuri Benditovich virtio_notify(vdev, vq); 379283e2c2aSYuri Benditovich } 380283e2c2aSYuri Benditovich } 381283e2c2aSYuri Benditovich 3826e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status) 3836e790746SPaolo Bonzini { 38417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 3856e790746SPaolo Bonzini VirtIONetQueue *q; 3866e790746SPaolo Bonzini int i; 3876e790746SPaolo Bonzini uint8_t queue_status; 3886e790746SPaolo Bonzini 3891bfa316cSGreg Kurz virtio_net_vnet_endian_status(n, status); 3906e790746SPaolo Bonzini virtio_net_vhost_status(n, status); 3916e790746SPaolo Bonzini 392441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 39338705bb5SFam Zheng NetClientState *ncs = qemu_get_subqueue(n->nic, i); 39438705bb5SFam Zheng bool queue_started; 3956e790746SPaolo Bonzini q = &n->vqs[i]; 3966e790746SPaolo Bonzini 397441537f1SJason Wang if ((!n->multiqueue && i != 0) || i >= n->curr_queue_pairs) { 3986e790746SPaolo Bonzini queue_status = 0; 3996e790746SPaolo Bonzini } else { 4006e790746SPaolo Bonzini queue_status = status; 4016e790746SPaolo Bonzini } 40238705bb5SFam Zheng queue_started = 40338705bb5SFam Zheng virtio_net_started(n, queue_status) && !n->vhost_started; 40438705bb5SFam Zheng 40538705bb5SFam Zheng if (queue_started) { 40638705bb5SFam Zheng qemu_flush_queued_packets(ncs); 40738705bb5SFam Zheng } 4086e790746SPaolo Bonzini 4096e790746SPaolo Bonzini if (!q->tx_waiting) { 4106e790746SPaolo Bonzini continue; 4116e790746SPaolo Bonzini } 4126e790746SPaolo Bonzini 41338705bb5SFam Zheng if (queue_started) { 4146e790746SPaolo Bonzini if (q->tx_timer) { 415bc72ad67SAlex Bligh timer_mod(q->tx_timer, 416bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 4176e790746SPaolo Bonzini } else { 4186e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 4196e790746SPaolo Bonzini } 4206e790746SPaolo Bonzini } else { 4216e790746SPaolo Bonzini if (q->tx_timer) { 422bc72ad67SAlex Bligh timer_del(q->tx_timer); 4236e790746SPaolo Bonzini } else { 4246e790746SPaolo Bonzini qemu_bh_cancel(q->tx_bh); 4256e790746SPaolo Bonzini } 426283e2c2aSYuri Benditovich if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 && 42770e53e6eSJason Wang (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) && 42870e53e6eSJason Wang vdev->vm_running) { 429283e2c2aSYuri Benditovich /* if tx is waiting we are likely have some packets in tx queue 430283e2c2aSYuri Benditovich * and disabled notification */ 431283e2c2aSYuri Benditovich q->tx_waiting = 0; 432283e2c2aSYuri Benditovich virtio_queue_set_notification(q->tx_vq, 1); 433283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, q->tx_vq); 434283e2c2aSYuri Benditovich } 4356e790746SPaolo Bonzini } 4366e790746SPaolo Bonzini } 4376e790746SPaolo Bonzini } 4386e790746SPaolo Bonzini 4396e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc) 4406e790746SPaolo Bonzini { 4416e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 44217a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 4436e790746SPaolo Bonzini uint16_t old_status = n->status; 4446e790746SPaolo Bonzini 4456e790746SPaolo Bonzini if (nc->link_down) 4466e790746SPaolo Bonzini n->status &= ~VIRTIO_NET_S_LINK_UP; 4476e790746SPaolo Bonzini else 4486e790746SPaolo Bonzini n->status |= VIRTIO_NET_S_LINK_UP; 4496e790746SPaolo Bonzini 4506e790746SPaolo Bonzini if (n->status != old_status) 45117a0ca55SKONRAD Frederic virtio_notify_config(vdev); 4526e790746SPaolo Bonzini 45317a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 4546e790746SPaolo Bonzini } 4556e790746SPaolo Bonzini 456b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc) 457b1be4280SAmos Kong { 458b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 459b1be4280SAmos Kong 460b1be4280SAmos Kong if (nc->rxfilter_notify_enabled) { 461ddfb0baaSMarkus Armbruster char *path = object_get_canonical_path(OBJECT(n->qdev)); 4627480874aSMarkus Armbruster qapi_event_send_nic_rx_filter_changed(n->netclient_name, path); 46396e35046SAmos Kong g_free(path); 464b1be4280SAmos Kong 465b1be4280SAmos Kong /* disable event notification to avoid events flooding */ 466b1be4280SAmos Kong nc->rxfilter_notify_enabled = 0; 467b1be4280SAmos Kong } 468b1be4280SAmos Kong } 469b1be4280SAmos Kong 470f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n) 471f7bc8ef8SAmos Kong { 47254aa3de7SEric Blake intList *list; 473f7bc8ef8SAmos Kong int i, j; 474f7bc8ef8SAmos Kong 475f7bc8ef8SAmos Kong list = NULL; 476f7bc8ef8SAmos Kong for (i = 0; i < MAX_VLAN >> 5; i++) { 477f7bc8ef8SAmos Kong for (j = 0; n->vlans[i] && j <= 0x1f; j++) { 478f7bc8ef8SAmos Kong if (n->vlans[i] & (1U << j)) { 47954aa3de7SEric Blake QAPI_LIST_PREPEND(list, (i << 5) + j); 480f7bc8ef8SAmos Kong } 481f7bc8ef8SAmos Kong } 482f7bc8ef8SAmos Kong } 483f7bc8ef8SAmos Kong 484f7bc8ef8SAmos Kong return list; 485f7bc8ef8SAmos Kong } 486f7bc8ef8SAmos Kong 487b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc) 488b1be4280SAmos Kong { 489b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 490f7bc8ef8SAmos Kong VirtIODevice *vdev = VIRTIO_DEVICE(n); 491b1be4280SAmos Kong RxFilterInfo *info; 49254aa3de7SEric Blake strList *str_list; 493f7bc8ef8SAmos Kong int i; 494b1be4280SAmos Kong 495b1be4280SAmos Kong info = g_malloc0(sizeof(*info)); 496b1be4280SAmos Kong info->name = g_strdup(nc->name); 497b1be4280SAmos Kong info->promiscuous = n->promisc; 498b1be4280SAmos Kong 499b1be4280SAmos Kong if (n->nouni) { 500b1be4280SAmos Kong info->unicast = RX_STATE_NONE; 501b1be4280SAmos Kong } else if (n->alluni) { 502b1be4280SAmos Kong info->unicast = RX_STATE_ALL; 503b1be4280SAmos Kong } else { 504b1be4280SAmos Kong info->unicast = RX_STATE_NORMAL; 505b1be4280SAmos Kong } 506b1be4280SAmos Kong 507b1be4280SAmos Kong if (n->nomulti) { 508b1be4280SAmos Kong info->multicast = RX_STATE_NONE; 509b1be4280SAmos Kong } else if (n->allmulti) { 510b1be4280SAmos Kong info->multicast = RX_STATE_ALL; 511b1be4280SAmos Kong } else { 512b1be4280SAmos Kong info->multicast = RX_STATE_NORMAL; 513b1be4280SAmos Kong } 514b1be4280SAmos Kong 515b1be4280SAmos Kong info->broadcast_allowed = n->nobcast; 516b1be4280SAmos Kong info->multicast_overflow = n->mac_table.multi_overflow; 517b1be4280SAmos Kong info->unicast_overflow = n->mac_table.uni_overflow; 518b1be4280SAmos Kong 519b0575ba4SScott Feldman info->main_mac = qemu_mac_strdup_printf(n->mac); 520b1be4280SAmos Kong 521b1be4280SAmos Kong str_list = NULL; 522b1be4280SAmos Kong for (i = 0; i < n->mac_table.first_multi; i++) { 52354aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 52454aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 525b1be4280SAmos Kong } 526b1be4280SAmos Kong info->unicast_table = str_list; 527b1be4280SAmos Kong 528b1be4280SAmos Kong str_list = NULL; 529b1be4280SAmos Kong for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 53054aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 53154aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 532b1be4280SAmos Kong } 533b1be4280SAmos Kong info->multicast_table = str_list; 534f7bc8ef8SAmos Kong info->vlan_table = get_vlan_table(n); 535b1be4280SAmos Kong 53695129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) { 537f7bc8ef8SAmos Kong info->vlan = RX_STATE_ALL; 538f7bc8ef8SAmos Kong } else if (!info->vlan_table) { 539f7bc8ef8SAmos Kong info->vlan = RX_STATE_NONE; 540f7bc8ef8SAmos Kong } else { 541f7bc8ef8SAmos Kong info->vlan = RX_STATE_NORMAL; 542b1be4280SAmos Kong } 543b1be4280SAmos Kong 544b1be4280SAmos Kong /* enable event notification after query */ 545b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 546b1be4280SAmos Kong 547b1be4280SAmos Kong return info; 548b1be4280SAmos Kong } 549b1be4280SAmos Kong 5507dc6be52SXuan Zhuo static void virtio_net_queue_reset(VirtIODevice *vdev, uint32_t queue_index) 5517dc6be52SXuan Zhuo { 5527dc6be52SXuan Zhuo VirtIONet *n = VIRTIO_NET(vdev); 553f47af0afSXuan Zhuo NetClientState *nc; 554f47af0afSXuan Zhuo 555f47af0afSXuan Zhuo /* validate queue_index and skip for cvq */ 556f47af0afSXuan Zhuo if (queue_index >= n->max_queue_pairs * 2) { 557f47af0afSXuan Zhuo return; 558f47af0afSXuan Zhuo } 559f47af0afSXuan Zhuo 560f47af0afSXuan Zhuo nc = qemu_get_subqueue(n->nic, vq2q(queue_index)); 5617dc6be52SXuan Zhuo 5627dc6be52SXuan Zhuo if (!nc->peer) { 5637dc6be52SXuan Zhuo return; 5647dc6be52SXuan Zhuo } 5657dc6be52SXuan Zhuo 5667dc6be52SXuan Zhuo if (get_vhost_net(nc->peer) && 5677dc6be52SXuan Zhuo nc->peer->info->type == NET_CLIENT_DRIVER_TAP) { 5687dc6be52SXuan Zhuo vhost_net_virtqueue_reset(vdev, nc, queue_index); 5697dc6be52SXuan Zhuo } 5707dc6be52SXuan Zhuo 5717dc6be52SXuan Zhuo flush_or_purge_queued_packets(nc); 5727dc6be52SXuan Zhuo } 5737dc6be52SXuan Zhuo 5747f863302SKangjie Xu static void virtio_net_queue_enable(VirtIODevice *vdev, uint32_t queue_index) 5757f863302SKangjie Xu { 5767f863302SKangjie Xu VirtIONet *n = VIRTIO_NET(vdev); 577f47af0afSXuan Zhuo NetClientState *nc; 5787f863302SKangjie Xu int r; 5797f863302SKangjie Xu 580f47af0afSXuan Zhuo /* validate queue_index and skip for cvq */ 581f47af0afSXuan Zhuo if (queue_index >= n->max_queue_pairs * 2) { 582f47af0afSXuan Zhuo return; 583f47af0afSXuan Zhuo } 584f47af0afSXuan Zhuo 585f47af0afSXuan Zhuo nc = qemu_get_subqueue(n->nic, vq2q(queue_index)); 586f47af0afSXuan Zhuo 5877f863302SKangjie Xu if (!nc->peer || !vdev->vhost_started) { 5887f863302SKangjie Xu return; 5897f863302SKangjie Xu } 5907f863302SKangjie Xu 5917f863302SKangjie Xu if (get_vhost_net(nc->peer) && 5927f863302SKangjie Xu nc->peer->info->type == NET_CLIENT_DRIVER_TAP) { 5937f863302SKangjie Xu r = vhost_net_virtqueue_restart(vdev, nc, queue_index); 5947f863302SKangjie Xu if (r < 0) { 5957f863302SKangjie Xu error_report("unable to restart vhost net virtqueue: %d, " 5967f863302SKangjie Xu "when resetting the queue", queue_index); 5977f863302SKangjie Xu } 5987f863302SKangjie Xu } 5997f863302SKangjie Xu } 6007f863302SKangjie Xu 6016e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev) 6026e790746SPaolo Bonzini { 60317a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 60494b52958SGreg Kurz int i; 6056e790746SPaolo Bonzini 6066e790746SPaolo Bonzini /* Reset back to compatibility mode */ 6076e790746SPaolo Bonzini n->promisc = 1; 6086e790746SPaolo Bonzini n->allmulti = 0; 6096e790746SPaolo Bonzini n->alluni = 0; 6106e790746SPaolo Bonzini n->nomulti = 0; 6116e790746SPaolo Bonzini n->nouni = 0; 6126e790746SPaolo Bonzini n->nobcast = 0; 6136e790746SPaolo Bonzini /* multiqueue is disabled by default */ 614441537f1SJason Wang n->curr_queue_pairs = 1; 6159d8c6a25SDr. David Alan Gilbert timer_del(n->announce_timer.tm); 6169d8c6a25SDr. David Alan Gilbert n->announce_timer.round = 0; 617f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 6186e790746SPaolo Bonzini 6196e790746SPaolo Bonzini /* Flush any MAC and VLAN filter table state */ 6206e790746SPaolo Bonzini n->mac_table.in_use = 0; 6216e790746SPaolo Bonzini n->mac_table.first_multi = 0; 6226e790746SPaolo Bonzini n->mac_table.multi_overflow = 0; 6236e790746SPaolo Bonzini n->mac_table.uni_overflow = 0; 6246e790746SPaolo Bonzini memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN); 6256e790746SPaolo Bonzini memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac)); 626702d66a8SMichael S. Tsirkin qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 6276e790746SPaolo Bonzini memset(n->vlans, 0, MAX_VLAN >> 3); 62894b52958SGreg Kurz 62994b52958SGreg Kurz /* Flush any async TX */ 630441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 6314fdf69abSKangjie Xu flush_or_purge_queued_packets(qemu_get_subqueue(n->nic, i)); 63294b52958SGreg Kurz } 6336e790746SPaolo Bonzini } 6346e790746SPaolo Bonzini 6356e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n) 6366e790746SPaolo Bonzini { 6376e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 6386e790746SPaolo Bonzini if (!nc->peer) { 6396e790746SPaolo Bonzini return; 6406e790746SPaolo Bonzini } 6416e790746SPaolo Bonzini 642d6085e3aSStefan Hajnoczi n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer); 6436e790746SPaolo Bonzini } 6446e790746SPaolo Bonzini 6456e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n) 6466e790746SPaolo Bonzini { 6476e790746SPaolo Bonzini return n->has_vnet_hdr; 6486e790746SPaolo Bonzini } 6496e790746SPaolo Bonzini 6506e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n) 6516e790746SPaolo Bonzini { 6526e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) 6536e790746SPaolo Bonzini return 0; 6546e790746SPaolo Bonzini 655d6085e3aSStefan Hajnoczi n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer); 6566e790746SPaolo Bonzini 6576e790746SPaolo Bonzini return n->has_ufo; 6586e790746SPaolo Bonzini } 6596e790746SPaolo Bonzini 66053da8b5aSYuri Benditovich static int peer_has_uso(VirtIONet *n) 66153da8b5aSYuri Benditovich { 66253da8b5aSYuri Benditovich if (!peer_has_vnet_hdr(n)) { 66353da8b5aSYuri Benditovich return 0; 66453da8b5aSYuri Benditovich } 66553da8b5aSYuri Benditovich 66653da8b5aSYuri Benditovich return qemu_has_uso(qemu_get_queue(n->nic)->peer); 66753da8b5aSYuri Benditovich } 66853da8b5aSYuri Benditovich 669bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs, 670e22f0603SYuri Benditovich int version_1, int hash_report) 6716e790746SPaolo Bonzini { 6726e790746SPaolo Bonzini int i; 6736e790746SPaolo Bonzini NetClientState *nc; 6746e790746SPaolo Bonzini 6756e790746SPaolo Bonzini n->mergeable_rx_bufs = mergeable_rx_bufs; 6766e790746SPaolo Bonzini 677bb9d17f8SCornelia Huck if (version_1) { 678e22f0603SYuri Benditovich n->guest_hdr_len = hash_report ? 679e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_v1_hash) : 680e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_mrg_rxbuf); 681e22f0603SYuri Benditovich n->rss_data.populate_hash = !!hash_report; 682bb9d17f8SCornelia Huck } else { 6836e790746SPaolo Bonzini n->guest_hdr_len = n->mergeable_rx_bufs ? 684bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr_mrg_rxbuf) : 685bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr); 686bb9d17f8SCornelia Huck } 6876e790746SPaolo Bonzini 688441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 6896e790746SPaolo Bonzini nc = qemu_get_subqueue(n->nic, i); 6906e790746SPaolo Bonzini 6916e790746SPaolo Bonzini if (peer_has_vnet_hdr(n) && 692d6085e3aSStefan Hajnoczi qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) { 693d6085e3aSStefan Hajnoczi qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len); 6946e790746SPaolo Bonzini n->host_hdr_len = n->guest_hdr_len; 6956e790746SPaolo Bonzini } 6966e790746SPaolo Bonzini } 6976e790746SPaolo Bonzini } 6986e790746SPaolo Bonzini 6992eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n) 7002eef278bSMichael S. Tsirkin { 7012eef278bSMichael S. Tsirkin NetClientState *peer = n->nic_conf.peers.ncs[0]; 7022eef278bSMichael S. Tsirkin 7032eef278bSMichael S. Tsirkin /* 7040ea5778fSEugenio Pérez * Backends other than vhost-user or vhost-vdpa don't support max queue 7050ea5778fSEugenio Pérez * size. 7062eef278bSMichael S. Tsirkin */ 7072eef278bSMichael S. Tsirkin if (!peer) { 7082eef278bSMichael S. Tsirkin return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 7092eef278bSMichael S. Tsirkin } 7102eef278bSMichael S. Tsirkin 7110ea5778fSEugenio Pérez switch(peer->info->type) { 7120ea5778fSEugenio Pérez case NET_CLIENT_DRIVER_VHOST_USER: 7130ea5778fSEugenio Pérez case NET_CLIENT_DRIVER_VHOST_VDPA: 7142eef278bSMichael S. Tsirkin return VIRTQUEUE_MAX_SIZE; 7150ea5778fSEugenio Pérez default: 7160ea5778fSEugenio Pérez return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 7170ea5778fSEugenio Pérez }; 7182eef278bSMichael S. Tsirkin } 7192eef278bSMichael S. Tsirkin 7206e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index) 7216e790746SPaolo Bonzini { 7226e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 7236e790746SPaolo Bonzini 7246e790746SPaolo Bonzini if (!nc->peer) { 7256e790746SPaolo Bonzini return 0; 7266e790746SPaolo Bonzini } 7276e790746SPaolo Bonzini 728f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 7297263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 1); 7307263a0adSChangchun Ouyang } 7317263a0adSChangchun Ouyang 732f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 7336e790746SPaolo Bonzini return 0; 7346e790746SPaolo Bonzini } 7356e790746SPaolo Bonzini 736441537f1SJason Wang if (n->max_queue_pairs == 1) { 7371074b879SJason Wang return 0; 7381074b879SJason Wang } 7391074b879SJason Wang 7406e790746SPaolo Bonzini return tap_enable(nc->peer); 7416e790746SPaolo Bonzini } 7426e790746SPaolo Bonzini 7436e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index) 7446e790746SPaolo Bonzini { 7456e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 7466e790746SPaolo Bonzini 7476e790746SPaolo Bonzini if (!nc->peer) { 7486e790746SPaolo Bonzini return 0; 7496e790746SPaolo Bonzini } 7506e790746SPaolo Bonzini 751f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 7527263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 0); 7537263a0adSChangchun Ouyang } 7547263a0adSChangchun Ouyang 755f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 7566e790746SPaolo Bonzini return 0; 7576e790746SPaolo Bonzini } 7586e790746SPaolo Bonzini 7596e790746SPaolo Bonzini return tap_disable(nc->peer); 7606e790746SPaolo Bonzini } 7616e790746SPaolo Bonzini 762441537f1SJason Wang static void virtio_net_set_queue_pairs(VirtIONet *n) 7636e790746SPaolo Bonzini { 7646e790746SPaolo Bonzini int i; 765ddfa83eaSJoel Stanley int r; 7666e790746SPaolo Bonzini 76768b5f314SYuri Benditovich if (n->nic->peer_deleted) { 76868b5f314SYuri Benditovich return; 76968b5f314SYuri Benditovich } 77068b5f314SYuri Benditovich 771441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 772441537f1SJason Wang if (i < n->curr_queue_pairs) { 773ddfa83eaSJoel Stanley r = peer_attach(n, i); 774ddfa83eaSJoel Stanley assert(!r); 7756e790746SPaolo Bonzini } else { 776ddfa83eaSJoel Stanley r = peer_detach(n, i); 777ddfa83eaSJoel Stanley assert(!r); 7786e790746SPaolo Bonzini } 7796e790746SPaolo Bonzini } 7806e790746SPaolo Bonzini } 7816e790746SPaolo Bonzini 782ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue); 7836e790746SPaolo Bonzini 7849d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features, 7859d5b731dSJason Wang Error **errp) 7866e790746SPaolo Bonzini { 78717a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 7886e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 7896e790746SPaolo Bonzini 790da3e8a23SShannon Zhao /* Firstly sync all virtio-net possible supported features */ 791da3e8a23SShannon Zhao features |= n->host_features; 792da3e8a23SShannon Zhao 7930cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 7946e790746SPaolo Bonzini 7956e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) { 7960cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_CSUM); 7970cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4); 7980cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6); 7990cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN); 8006e790746SPaolo Bonzini 8010cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM); 8020cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4); 8030cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6); 8040cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN); 805e22f0603SYuri Benditovich 80653da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HOST_USO); 80753da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO4); 80853da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO6); 80953da8b5aSYuri Benditovich 810e22f0603SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT); 8116e790746SPaolo Bonzini } 8126e790746SPaolo Bonzini 8136e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) { 8140cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO); 8150cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO); 8166e790746SPaolo Bonzini } 8176e790746SPaolo Bonzini 81853da8b5aSYuri Benditovich if (!peer_has_uso(n)) { 81953da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HOST_USO); 82053da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO4); 82153da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO6); 82253da8b5aSYuri Benditovich } 82353da8b5aSYuri Benditovich 824ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 8256e790746SPaolo Bonzini return features; 8266e790746SPaolo Bonzini } 8272974e916SYuri Benditovich 8280145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 82959079029SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_RSS); 8300145c393SAndrew Melnychenko } 83175ebec11SMaxime Coquelin features = vhost_net_get_features(get_vhost_net(nc->peer), features); 83275ebec11SMaxime Coquelin vdev->backend_features = features; 83375ebec11SMaxime Coquelin 83475ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 83575ebec11SMaxime Coquelin (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) { 83675ebec11SMaxime Coquelin features |= (1ULL << VIRTIO_NET_F_MTU); 83775ebec11SMaxime Coquelin } 83875ebec11SMaxime Coquelin 839cd69d47cSEugenio Pérez /* 840cd69d47cSEugenio Pérez * Since GUEST_ANNOUNCE is emulated the feature bit could be set without 841cd69d47cSEugenio Pérez * enabled. This happens in the vDPA case. 842cd69d47cSEugenio Pérez * 843cd69d47cSEugenio Pérez * Make sure the feature set is not incoherent, as the driver could refuse 844cd69d47cSEugenio Pérez * to start. 845cd69d47cSEugenio Pérez * 846cd69d47cSEugenio Pérez * TODO: QEMU is able to emulate a CVQ just for guest_announce purposes, 847cd69d47cSEugenio Pérez * helping guest to notify the new location with vDPA devices that does not 848cd69d47cSEugenio Pérez * support it. 849cd69d47cSEugenio Pérez */ 850cd69d47cSEugenio Pérez if (!virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_CTRL_VQ)) { 851cd69d47cSEugenio Pérez virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ANNOUNCE); 852cd69d47cSEugenio Pérez } 853cd69d47cSEugenio Pérez 85475ebec11SMaxime Coquelin return features; 8556e790746SPaolo Bonzini } 8566e790746SPaolo Bonzini 857019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev) 8586e790746SPaolo Bonzini { 859019a3edbSGerd Hoffmann uint64_t features = 0; 8606e790746SPaolo Bonzini 8616e790746SPaolo Bonzini /* Linux kernel 2.6.25. It understood MAC (as everyone must), 8626e790746SPaolo Bonzini * but also these: */ 8630cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 8640cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_CSUM); 8650cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4); 8660cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6); 8670cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN); 8686e790746SPaolo Bonzini 8696e790746SPaolo Bonzini return features; 8706e790746SPaolo Bonzini } 8716e790746SPaolo Bonzini 872644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n) 873644c9858SDmitry Fleytman { 874ad37bb3bSStefan Hajnoczi qemu_set_offload(qemu_get_queue(n->nic)->peer, 875644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)), 876644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)), 877644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)), 878644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)), 8792ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)), 8802ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_USO4)), 8812ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_USO6))); 882644c9858SDmitry Fleytman } 883644c9858SDmitry Fleytman 88453da8b5aSYuri Benditovich static uint64_t virtio_net_guest_offloads_by_features(uint64_t features) 885644c9858SDmitry Fleytman { 886644c9858SDmitry Fleytman static const uint64_t guest_offloads_mask = 887644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_CSUM) | 888644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO4) | 889644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO6) | 890644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_ECN) | 89153da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_UFO) | 89253da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_USO4) | 89353da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_USO6); 894644c9858SDmitry Fleytman 895644c9858SDmitry Fleytman return guest_offloads_mask & features; 896644c9858SDmitry Fleytman } 897644c9858SDmitry Fleytman 8980b545b1eSHawkins Jiawei uint64_t virtio_net_supported_guest_offloads(const VirtIONet *n) 899644c9858SDmitry Fleytman { 900644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 901644c9858SDmitry Fleytman return virtio_net_guest_offloads_by_features(vdev->guest_features); 902644c9858SDmitry Fleytman } 903644c9858SDmitry Fleytman 904f5e1847bSJuan Quintela typedef struct { 905f5e1847bSJuan Quintela VirtIONet *n; 90612b2fad7SKevin Wolf DeviceState *dev; 90712b2fad7SKevin Wolf } FailoverDevice; 908f5e1847bSJuan Quintela 909f5e1847bSJuan Quintela /** 91012b2fad7SKevin Wolf * Set the failover primary device 911f5e1847bSJuan Quintela * 912f5e1847bSJuan Quintela * @opaque: FailoverId to setup 913f5e1847bSJuan Quintela * @opts: opts for device we are handling 914f5e1847bSJuan Quintela * @errp: returns an error if this function fails 915f5e1847bSJuan Quintela */ 91612b2fad7SKevin Wolf static int failover_set_primary(DeviceState *dev, void *opaque) 917f5e1847bSJuan Quintela { 91812b2fad7SKevin Wolf FailoverDevice *fdev = opaque; 91912b2fad7SKevin Wolf PCIDevice *pci_dev = (PCIDevice *) 92012b2fad7SKevin Wolf object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE); 921f5e1847bSJuan Quintela 92212b2fad7SKevin Wolf if (!pci_dev) { 92312b2fad7SKevin Wolf return 0; 92412b2fad7SKevin Wolf } 92512b2fad7SKevin Wolf 92612b2fad7SKevin Wolf if (!g_strcmp0(pci_dev->failover_pair_id, fdev->n->netclient_name)) { 92712b2fad7SKevin Wolf fdev->dev = dev; 928f5e1847bSJuan Quintela return 1; 929f5e1847bSJuan Quintela } 930f5e1847bSJuan Quintela 931f5e1847bSJuan Quintela return 0; 932f5e1847bSJuan Quintela } 933f5e1847bSJuan Quintela 934f5e1847bSJuan Quintela /** 93585d3b931SJuan Quintela * Find the primary device for this failover virtio-net 93685d3b931SJuan Quintela * 93785d3b931SJuan Quintela * @n: VirtIONet device 93885d3b931SJuan Quintela * @errp: returns an error if this function fails 93985d3b931SJuan Quintela */ 9400a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n) 9419711cd0dSJens Freimann { 94212b2fad7SKevin Wolf FailoverDevice fdev = { 94312b2fad7SKevin Wolf .n = n, 94412b2fad7SKevin Wolf }; 9459711cd0dSJens Freimann 94612b2fad7SKevin Wolf qbus_walk_children(sysbus_get_default(), failover_set_primary, NULL, 94712b2fad7SKevin Wolf NULL, NULL, &fdev); 94812b2fad7SKevin Wolf return fdev.dev; 9499711cd0dSJens Freimann } 9509711cd0dSJens Freimann 95121e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp) 95221e8709bSJuan Quintela { 95321e8709bSJuan Quintela Error *err = NULL; 95421e8709bSJuan Quintela DeviceState *dev = failover_find_primary_device(n); 95521e8709bSJuan Quintela 95621e8709bSJuan Quintela if (dev) { 95721e8709bSJuan Quintela return; 95821e8709bSJuan Quintela } 95921e8709bSJuan Quintela 960259a10dbSKevin Wolf if (!n->primary_opts) { 96197ca9c59SLaurent Vivier error_setg(errp, "Primary device not found"); 96297ca9c59SLaurent Vivier error_append_hint(errp, "Virtio-net failover will not work. Make " 96397ca9c59SLaurent Vivier "sure primary device has parameter" 96497ca9c59SLaurent Vivier " failover_pair_id=%s\n", n->netclient_name); 96521e8709bSJuan Quintela return; 96621e8709bSJuan Quintela } 967259a10dbSKevin Wolf 968f3558b1bSKevin Wolf dev = qdev_device_add_from_qdict(n->primary_opts, 969f3558b1bSKevin Wolf n->primary_opts_from_json, 970f3558b1bSKevin Wolf &err); 97121e8709bSJuan Quintela if (err) { 972f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 973259a10dbSKevin Wolf n->primary_opts = NULL; 97400e7b129SLaurent Vivier } else { 97500e7b129SLaurent Vivier object_unref(OBJECT(dev)); 97621e8709bSJuan Quintela } 97721e8709bSJuan Quintela error_propagate(errp, err); 97821e8709bSJuan Quintela } 97921e8709bSJuan Quintela 980d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features) 9816e790746SPaolo Bonzini { 98217a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 9839711cd0dSJens Freimann Error *err = NULL; 9846e790746SPaolo Bonzini int i; 9856e790746SPaolo Bonzini 98675ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 98775ebec11SMaxime Coquelin !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) { 98875ebec11SMaxime Coquelin features &= ~(1ULL << VIRTIO_NET_F_MTU); 98975ebec11SMaxime Coquelin } 99075ebec11SMaxime Coquelin 991ef546f12SCornelia Huck virtio_net_set_multiqueue(n, 99259079029SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_RSS) || 99395129d6fSCornelia Huck virtio_has_feature(features, VIRTIO_NET_F_MQ)); 9946e790746SPaolo Bonzini 995ef546f12SCornelia Huck virtio_net_set_mrg_rx_bufs(n, 99695129d6fSCornelia Huck virtio_has_feature(features, 997bb9d17f8SCornelia Huck VIRTIO_NET_F_MRG_RXBUF), 99895129d6fSCornelia Huck virtio_has_feature(features, 999e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 1000e22f0603SYuri Benditovich virtio_has_feature(features, 1001e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 10026e790746SPaolo Bonzini 10032974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 10042974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4); 10052974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 10062974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6); 1007e22f0603SYuri Benditovich n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS); 10082974e916SYuri Benditovich 10096e790746SPaolo Bonzini if (n->has_vnet_hdr) { 1010644c9858SDmitry Fleytman n->curr_guest_offloads = 1011644c9858SDmitry Fleytman virtio_net_guest_offloads_by_features(features); 1012644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 10136e790746SPaolo Bonzini } 10146e790746SPaolo Bonzini 1015441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 10166e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, i); 10176e790746SPaolo Bonzini 1018ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 10196e790746SPaolo Bonzini continue; 10206e790746SPaolo Bonzini } 1021ed8b4afeSNikolay Nikolaev vhost_net_ack_features(get_vhost_net(nc->peer), features); 1022c9bdc449SHyman Huang(黄勇) 1023c9bdc449SHyman Huang(黄勇) /* 1024c9bdc449SHyman Huang(黄勇) * keep acked_features in NetVhostUserState up-to-date so it 1025c9bdc449SHyman Huang(黄勇) * can't miss any features configured by guest virtio driver. 1026c9bdc449SHyman Huang(黄勇) */ 1027c9bdc449SHyman Huang(黄勇) vhost_net_save_acked_features(nc->peer); 10286e790746SPaolo Bonzini } 10290b1eaa88SStefan Fritsch 103006b636a1SHawkins Jiawei if (!virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) { 10310b1eaa88SStefan Fritsch memset(n->vlans, 0xff, MAX_VLAN >> 3); 10320b1eaa88SStefan Fritsch } 10339711cd0dSJens Freimann 10349711cd0dSJens Freimann if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) { 10359711cd0dSJens Freimann qapi_event_send_failover_negotiated(n->netclient_name); 1036e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 10379711cd0dSJens Freimann failover_add_primary(n, &err); 10389711cd0dSJens Freimann if (err) { 10391b529d90SLaurent Vivier if (!qtest_enabled()) { 10409711cd0dSJens Freimann warn_report_err(err); 10411b529d90SLaurent Vivier } else { 10421b529d90SLaurent Vivier error_free(err); 10431b529d90SLaurent Vivier } 10449711cd0dSJens Freimann } 10456e790746SPaolo Bonzini } 104621e8709bSJuan Quintela } 10476e790746SPaolo Bonzini 10486e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd, 10496e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 10506e790746SPaolo Bonzini { 10516e790746SPaolo Bonzini uint8_t on; 10526e790746SPaolo Bonzini size_t s; 1053b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 10546e790746SPaolo Bonzini 10556e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on)); 10566e790746SPaolo Bonzini if (s != sizeof(on)) { 10576e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10586e790746SPaolo Bonzini } 10596e790746SPaolo Bonzini 10606e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) { 10616e790746SPaolo Bonzini n->promisc = on; 10626e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) { 10636e790746SPaolo Bonzini n->allmulti = on; 10646e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) { 10656e790746SPaolo Bonzini n->alluni = on; 10666e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) { 10676e790746SPaolo Bonzini n->nomulti = on; 10686e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) { 10696e790746SPaolo Bonzini n->nouni = on; 10706e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) { 10716e790746SPaolo Bonzini n->nobcast = on; 10726e790746SPaolo Bonzini } else { 10736e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10746e790746SPaolo Bonzini } 10756e790746SPaolo Bonzini 1076b1be4280SAmos Kong rxfilter_notify(nc); 1077b1be4280SAmos Kong 10786e790746SPaolo Bonzini return VIRTIO_NET_OK; 10796e790746SPaolo Bonzini } 10806e790746SPaolo Bonzini 1081644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd, 1082644c9858SDmitry Fleytman struct iovec *iov, unsigned int iov_cnt) 1083644c9858SDmitry Fleytman { 1084644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 1085644c9858SDmitry Fleytman uint64_t offloads; 1086644c9858SDmitry Fleytman size_t s; 1087644c9858SDmitry Fleytman 108895129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 1089644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1090644c9858SDmitry Fleytman } 1091644c9858SDmitry Fleytman 1092644c9858SDmitry Fleytman s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads)); 1093644c9858SDmitry Fleytman if (s != sizeof(offloads)) { 1094644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1095644c9858SDmitry Fleytman } 1096644c9858SDmitry Fleytman 1097644c9858SDmitry Fleytman if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) { 1098644c9858SDmitry Fleytman uint64_t supported_offloads; 1099644c9858SDmitry Fleytman 1100189ae6bbSJason Wang offloads = virtio_ldq_p(vdev, &offloads); 1101189ae6bbSJason Wang 1102644c9858SDmitry Fleytman if (!n->has_vnet_hdr) { 1103644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1104644c9858SDmitry Fleytman } 1105644c9858SDmitry Fleytman 11062974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 11072974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4); 11082974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 11092974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6); 11102974e916SYuri Benditovich virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT); 11112974e916SYuri Benditovich 1112644c9858SDmitry Fleytman supported_offloads = virtio_net_supported_guest_offloads(n); 1113644c9858SDmitry Fleytman if (offloads & ~supported_offloads) { 1114644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1115644c9858SDmitry Fleytman } 1116644c9858SDmitry Fleytman 1117644c9858SDmitry Fleytman n->curr_guest_offloads = offloads; 1118644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 1119644c9858SDmitry Fleytman 1120644c9858SDmitry Fleytman return VIRTIO_NET_OK; 1121644c9858SDmitry Fleytman } else { 1122644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1123644c9858SDmitry Fleytman } 1124644c9858SDmitry Fleytman } 1125644c9858SDmitry Fleytman 11266e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd, 11276e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 11286e790746SPaolo Bonzini { 11291399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 11306e790746SPaolo Bonzini struct virtio_net_ctrl_mac mac_data; 11316e790746SPaolo Bonzini size_t s; 1132b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 11336e790746SPaolo Bonzini 11346e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) { 11356e790746SPaolo Bonzini if (iov_size(iov, iov_cnt) != sizeof(n->mac)) { 11366e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11376e790746SPaolo Bonzini } 11386e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac)); 11396e790746SPaolo Bonzini assert(s == sizeof(n->mac)); 11406e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 1141b1be4280SAmos Kong rxfilter_notify(nc); 1142b1be4280SAmos Kong 11436e790746SPaolo Bonzini return VIRTIO_NET_OK; 11446e790746SPaolo Bonzini } 11456e790746SPaolo Bonzini 11466e790746SPaolo Bonzini if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) { 11476e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11486e790746SPaolo Bonzini } 11496e790746SPaolo Bonzini 1150cae2e556SAmos Kong int in_use = 0; 1151cae2e556SAmos Kong int first_multi = 0; 1152cae2e556SAmos Kong uint8_t uni_overflow = 0; 1153cae2e556SAmos Kong uint8_t multi_overflow = 0; 1154cae2e556SAmos Kong uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 11556e790746SPaolo Bonzini 11566e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 11576e790746SPaolo Bonzini sizeof(mac_data.entries)); 11581399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 11596e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1160b1be4280SAmos Kong goto error; 11616e790746SPaolo Bonzini } 11626e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 11636e790746SPaolo Bonzini 11646e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) { 1165b1be4280SAmos Kong goto error; 11666e790746SPaolo Bonzini } 11676e790746SPaolo Bonzini 11686e790746SPaolo Bonzini if (mac_data.entries <= MAC_TABLE_ENTRIES) { 1169cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, macs, 11706e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 11716e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1172b1be4280SAmos Kong goto error; 11736e790746SPaolo Bonzini } 1174cae2e556SAmos Kong in_use += mac_data.entries; 11756e790746SPaolo Bonzini } else { 1176cae2e556SAmos Kong uni_overflow = 1; 11776e790746SPaolo Bonzini } 11786e790746SPaolo Bonzini 11796e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN); 11806e790746SPaolo Bonzini 1181cae2e556SAmos Kong first_multi = in_use; 11826e790746SPaolo Bonzini 11836e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 11846e790746SPaolo Bonzini sizeof(mac_data.entries)); 11851399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 11866e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1187b1be4280SAmos Kong goto error; 11886e790746SPaolo Bonzini } 11896e790746SPaolo Bonzini 11906e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 11916e790746SPaolo Bonzini 11926e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) { 1193b1be4280SAmos Kong goto error; 11946e790746SPaolo Bonzini } 11956e790746SPaolo Bonzini 1196edc24385SMichael S. Tsirkin if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) { 1197cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN], 11986e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 11996e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1200b1be4280SAmos Kong goto error; 12016e790746SPaolo Bonzini } 1202cae2e556SAmos Kong in_use += mac_data.entries; 12036e790746SPaolo Bonzini } else { 1204cae2e556SAmos Kong multi_overflow = 1; 12056e790746SPaolo Bonzini } 12066e790746SPaolo Bonzini 1207cae2e556SAmos Kong n->mac_table.in_use = in_use; 1208cae2e556SAmos Kong n->mac_table.first_multi = first_multi; 1209cae2e556SAmos Kong n->mac_table.uni_overflow = uni_overflow; 1210cae2e556SAmos Kong n->mac_table.multi_overflow = multi_overflow; 1211cae2e556SAmos Kong memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN); 1212cae2e556SAmos Kong g_free(macs); 1213b1be4280SAmos Kong rxfilter_notify(nc); 1214b1be4280SAmos Kong 12156e790746SPaolo Bonzini return VIRTIO_NET_OK; 1216b1be4280SAmos Kong 1217b1be4280SAmos Kong error: 1218cae2e556SAmos Kong g_free(macs); 1219b1be4280SAmos Kong return VIRTIO_NET_ERR; 12206e790746SPaolo Bonzini } 12216e790746SPaolo Bonzini 12226e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd, 12236e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 12246e790746SPaolo Bonzini { 12251399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 12266e790746SPaolo Bonzini uint16_t vid; 12276e790746SPaolo Bonzini size_t s; 1228b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 12296e790746SPaolo Bonzini 12306e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid)); 12311399c60dSRusty Russell vid = virtio_lduw_p(vdev, &vid); 12326e790746SPaolo Bonzini if (s != sizeof(vid)) { 12336e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12346e790746SPaolo Bonzini } 12356e790746SPaolo Bonzini 12366e790746SPaolo Bonzini if (vid >= MAX_VLAN) 12376e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12386e790746SPaolo Bonzini 12396e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_VLAN_ADD) 12406e790746SPaolo Bonzini n->vlans[vid >> 5] |= (1U << (vid & 0x1f)); 12416e790746SPaolo Bonzini else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL) 12426e790746SPaolo Bonzini n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f)); 12436e790746SPaolo Bonzini else 12446e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12456e790746SPaolo Bonzini 1246b1be4280SAmos Kong rxfilter_notify(nc); 1247b1be4280SAmos Kong 12486e790746SPaolo Bonzini return VIRTIO_NET_OK; 12496e790746SPaolo Bonzini } 12506e790746SPaolo Bonzini 1251f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd, 1252f57fcf70SJason Wang struct iovec *iov, unsigned int iov_cnt) 1253f57fcf70SJason Wang { 12549d8c6a25SDr. David Alan Gilbert trace_virtio_net_handle_announce(n->announce_timer.round); 1255f57fcf70SJason Wang if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK && 1256f57fcf70SJason Wang n->status & VIRTIO_NET_S_ANNOUNCE) { 1257f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 12589d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 12599d8c6a25SDr. David Alan Gilbert qemu_announce_timer_step(&n->announce_timer); 1260f57fcf70SJason Wang } 1261f57fcf70SJason Wang return VIRTIO_NET_OK; 1262f57fcf70SJason Wang } else { 1263f57fcf70SJason Wang return VIRTIO_NET_ERR; 1264f57fcf70SJason Wang } 1265f57fcf70SJason Wang } 1266f57fcf70SJason Wang 12670145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n); 12680145c393SAndrew Melnychenko 126959079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n) 127059079029SYuri Benditovich { 127159079029SYuri Benditovich if (n->rss_data.enabled) { 127259079029SYuri Benditovich trace_virtio_net_rss_disable(); 127359079029SYuri Benditovich } 127459079029SYuri Benditovich n->rss_data.enabled = false; 12750145c393SAndrew Melnychenko 12760145c393SAndrew Melnychenko virtio_net_detach_epbf_rss(n); 12770145c393SAndrew Melnychenko } 12780145c393SAndrew Melnychenko 12790145c393SAndrew Melnychenko static bool virtio_net_attach_ebpf_to_backend(NICState *nic, int prog_fd) 12800145c393SAndrew Melnychenko { 12810145c393SAndrew Melnychenko NetClientState *nc = qemu_get_peer(qemu_get_queue(nic), 0); 12820145c393SAndrew Melnychenko if (nc == NULL || nc->info->set_steering_ebpf == NULL) { 12830145c393SAndrew Melnychenko return false; 12840145c393SAndrew Melnychenko } 12850145c393SAndrew Melnychenko 12860145c393SAndrew Melnychenko return nc->info->set_steering_ebpf(nc, prog_fd); 12870145c393SAndrew Melnychenko } 12880145c393SAndrew Melnychenko 12890145c393SAndrew Melnychenko static void rss_data_to_rss_config(struct VirtioNetRssData *data, 12900145c393SAndrew Melnychenko struct EBPFRSSConfig *config) 12910145c393SAndrew Melnychenko { 12920145c393SAndrew Melnychenko config->redirect = data->redirect; 12930145c393SAndrew Melnychenko config->populate_hash = data->populate_hash; 12940145c393SAndrew Melnychenko config->hash_types = data->hash_types; 12950145c393SAndrew Melnychenko config->indirections_len = data->indirections_len; 12960145c393SAndrew Melnychenko config->default_queue = data->default_queue; 12970145c393SAndrew Melnychenko } 12980145c393SAndrew Melnychenko 12990145c393SAndrew Melnychenko static bool virtio_net_attach_epbf_rss(VirtIONet *n) 13000145c393SAndrew Melnychenko { 13010145c393SAndrew Melnychenko struct EBPFRSSConfig config = {}; 13020145c393SAndrew Melnychenko 13030145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 13040145c393SAndrew Melnychenko return false; 13050145c393SAndrew Melnychenko } 13060145c393SAndrew Melnychenko 13070145c393SAndrew Melnychenko rss_data_to_rss_config(&n->rss_data, &config); 13080145c393SAndrew Melnychenko 13090145c393SAndrew Melnychenko if (!ebpf_rss_set_all(&n->ebpf_rss, &config, 13100145c393SAndrew Melnychenko n->rss_data.indirections_table, n->rss_data.key)) { 13110145c393SAndrew Melnychenko return false; 13120145c393SAndrew Melnychenko } 13130145c393SAndrew Melnychenko 13140145c393SAndrew Melnychenko if (!virtio_net_attach_ebpf_to_backend(n->nic, n->ebpf_rss.program_fd)) { 13150145c393SAndrew Melnychenko return false; 13160145c393SAndrew Melnychenko } 13170145c393SAndrew Melnychenko 13180145c393SAndrew Melnychenko return true; 13190145c393SAndrew Melnychenko } 13200145c393SAndrew Melnychenko 13210145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n) 13220145c393SAndrew Melnychenko { 13230145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 13240145c393SAndrew Melnychenko } 13250145c393SAndrew Melnychenko 13260145c393SAndrew Melnychenko static bool virtio_net_load_ebpf(VirtIONet *n) 13270145c393SAndrew Melnychenko { 13280145c393SAndrew Melnychenko if (!virtio_net_attach_ebpf_to_backend(n->nic, -1)) { 13292431f4f1SMichael Tokarev /* backend doesn't support steering ebpf */ 13300145c393SAndrew Melnychenko return false; 13310145c393SAndrew Melnychenko } 13320145c393SAndrew Melnychenko 13330145c393SAndrew Melnychenko return ebpf_rss_load(&n->ebpf_rss); 13340145c393SAndrew Melnychenko } 13350145c393SAndrew Melnychenko 13360145c393SAndrew Melnychenko static void virtio_net_unload_ebpf(VirtIONet *n) 13370145c393SAndrew Melnychenko { 13380145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 13390145c393SAndrew Melnychenko ebpf_rss_unload(&n->ebpf_rss); 134059079029SYuri Benditovich } 134159079029SYuri Benditovich 134259079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n, 1343e22f0603SYuri Benditovich struct iovec *iov, 1344e22f0603SYuri Benditovich unsigned int iov_cnt, 1345e22f0603SYuri Benditovich bool do_rss) 134659079029SYuri Benditovich { 134759079029SYuri Benditovich VirtIODevice *vdev = VIRTIO_DEVICE(n); 134859079029SYuri Benditovich struct virtio_net_rss_config cfg; 134959079029SYuri Benditovich size_t s, offset = 0, size_get; 1350441537f1SJason Wang uint16_t queue_pairs, i; 135159079029SYuri Benditovich struct { 135259079029SYuri Benditovich uint16_t us; 135359079029SYuri Benditovich uint8_t b; 135459079029SYuri Benditovich } QEMU_PACKED temp; 135559079029SYuri Benditovich const char *err_msg = ""; 135659079029SYuri Benditovich uint32_t err_value = 0; 135759079029SYuri Benditovich 1358e22f0603SYuri Benditovich if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) { 135959079029SYuri Benditovich err_msg = "RSS is not negotiated"; 136059079029SYuri Benditovich goto error; 136159079029SYuri Benditovich } 1362e22f0603SYuri Benditovich if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) { 1363e22f0603SYuri Benditovich err_msg = "Hash report is not negotiated"; 1364e22f0603SYuri Benditovich goto error; 1365e22f0603SYuri Benditovich } 136659079029SYuri Benditovich size_get = offsetof(struct virtio_net_rss_config, indirection_table); 136759079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get); 136859079029SYuri Benditovich if (s != size_get) { 136959079029SYuri Benditovich err_msg = "Short command buffer"; 137059079029SYuri Benditovich err_value = (uint32_t)s; 137159079029SYuri Benditovich goto error; 137259079029SYuri Benditovich } 137359079029SYuri Benditovich n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types); 137459079029SYuri Benditovich n->rss_data.indirections_len = 137559079029SYuri Benditovich virtio_lduw_p(vdev, &cfg.indirection_table_mask); 137659079029SYuri Benditovich n->rss_data.indirections_len++; 1377e22f0603SYuri Benditovich if (!do_rss) { 1378e22f0603SYuri Benditovich n->rss_data.indirections_len = 1; 1379e22f0603SYuri Benditovich } 138059079029SYuri Benditovich if (!is_power_of_2(n->rss_data.indirections_len)) { 138159079029SYuri Benditovich err_msg = "Invalid size of indirection table"; 138259079029SYuri Benditovich err_value = n->rss_data.indirections_len; 138359079029SYuri Benditovich goto error; 138459079029SYuri Benditovich } 138559079029SYuri Benditovich if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) { 138659079029SYuri Benditovich err_msg = "Too large indirection table"; 138759079029SYuri Benditovich err_value = n->rss_data.indirections_len; 138859079029SYuri Benditovich goto error; 138959079029SYuri Benditovich } 1390e22f0603SYuri Benditovich n->rss_data.default_queue = do_rss ? 1391e22f0603SYuri Benditovich virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0; 1392441537f1SJason Wang if (n->rss_data.default_queue >= n->max_queue_pairs) { 139359079029SYuri Benditovich err_msg = "Invalid default queue"; 139459079029SYuri Benditovich err_value = n->rss_data.default_queue; 139559079029SYuri Benditovich goto error; 139659079029SYuri Benditovich } 139759079029SYuri Benditovich offset += size_get; 139859079029SYuri Benditovich size_get = sizeof(uint16_t) * n->rss_data.indirections_len; 139959079029SYuri Benditovich g_free(n->rss_data.indirections_table); 140059079029SYuri Benditovich n->rss_data.indirections_table = g_malloc(size_get); 140159079029SYuri Benditovich if (!n->rss_data.indirections_table) { 140259079029SYuri Benditovich err_msg = "Can't allocate indirections table"; 140359079029SYuri Benditovich err_value = n->rss_data.indirections_len; 140459079029SYuri Benditovich goto error; 140559079029SYuri Benditovich } 140659079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, 140759079029SYuri Benditovich n->rss_data.indirections_table, size_get); 140859079029SYuri Benditovich if (s != size_get) { 140959079029SYuri Benditovich err_msg = "Short indirection table buffer"; 141059079029SYuri Benditovich err_value = (uint32_t)s; 141159079029SYuri Benditovich goto error; 141259079029SYuri Benditovich } 141359079029SYuri Benditovich for (i = 0; i < n->rss_data.indirections_len; ++i) { 141459079029SYuri Benditovich uint16_t val = n->rss_data.indirections_table[i]; 141559079029SYuri Benditovich n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val); 141659079029SYuri Benditovich } 141759079029SYuri Benditovich offset += size_get; 141859079029SYuri Benditovich size_get = sizeof(temp); 141959079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get); 142059079029SYuri Benditovich if (s != size_get) { 1421441537f1SJason Wang err_msg = "Can't get queue_pairs"; 142259079029SYuri Benditovich err_value = (uint32_t)s; 142359079029SYuri Benditovich goto error; 142459079029SYuri Benditovich } 1425441537f1SJason Wang queue_pairs = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queue_pairs; 1426441537f1SJason Wang if (queue_pairs == 0 || queue_pairs > n->max_queue_pairs) { 1427441537f1SJason Wang err_msg = "Invalid number of queue_pairs"; 1428441537f1SJason Wang err_value = queue_pairs; 142959079029SYuri Benditovich goto error; 143059079029SYuri Benditovich } 143159079029SYuri Benditovich if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) { 143259079029SYuri Benditovich err_msg = "Invalid key size"; 143359079029SYuri Benditovich err_value = temp.b; 143459079029SYuri Benditovich goto error; 143559079029SYuri Benditovich } 143659079029SYuri Benditovich if (!temp.b && n->rss_data.hash_types) { 143759079029SYuri Benditovich err_msg = "No key provided"; 143859079029SYuri Benditovich err_value = 0; 143959079029SYuri Benditovich goto error; 144059079029SYuri Benditovich } 144159079029SYuri Benditovich if (!temp.b && !n->rss_data.hash_types) { 144259079029SYuri Benditovich virtio_net_disable_rss(n); 1443441537f1SJason Wang return queue_pairs; 144459079029SYuri Benditovich } 144559079029SYuri Benditovich offset += size_get; 144659079029SYuri Benditovich size_get = temp.b; 144759079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get); 144859079029SYuri Benditovich if (s != size_get) { 144959079029SYuri Benditovich err_msg = "Can get key buffer"; 145059079029SYuri Benditovich err_value = (uint32_t)s; 145159079029SYuri Benditovich goto error; 145259079029SYuri Benditovich } 145359079029SYuri Benditovich n->rss_data.enabled = true; 14540145c393SAndrew Melnychenko 14550145c393SAndrew Melnychenko if (!n->rss_data.populate_hash) { 14560145c393SAndrew Melnychenko if (!virtio_net_attach_epbf_rss(n)) { 14570145c393SAndrew Melnychenko /* EBPF must be loaded for vhost */ 14580145c393SAndrew Melnychenko if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 14590145c393SAndrew Melnychenko warn_report("Can't load eBPF RSS for vhost"); 14600145c393SAndrew Melnychenko goto error; 14610145c393SAndrew Melnychenko } 14620145c393SAndrew Melnychenko /* fallback to software RSS */ 14630145c393SAndrew Melnychenko warn_report("Can't load eBPF RSS - fallback to software RSS"); 14640145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 14650145c393SAndrew Melnychenko } 14660145c393SAndrew Melnychenko } else { 14670145c393SAndrew Melnychenko /* use software RSS for hash populating */ 14680145c393SAndrew Melnychenko /* and detach eBPF if was loaded before */ 14690145c393SAndrew Melnychenko virtio_net_detach_epbf_rss(n); 14700145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 14710145c393SAndrew Melnychenko } 14720145c393SAndrew Melnychenko 147359079029SYuri Benditovich trace_virtio_net_rss_enable(n->rss_data.hash_types, 147459079029SYuri Benditovich n->rss_data.indirections_len, 147559079029SYuri Benditovich temp.b); 1476441537f1SJason Wang return queue_pairs; 147759079029SYuri Benditovich error: 147859079029SYuri Benditovich trace_virtio_net_rss_error(err_msg, err_value); 147959079029SYuri Benditovich virtio_net_disable_rss(n); 148059079029SYuri Benditovich return 0; 148159079029SYuri Benditovich } 148259079029SYuri Benditovich 14836e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd, 14846e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 14856e790746SPaolo Bonzini { 148617a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1487441537f1SJason Wang uint16_t queue_pairs; 14882a7888ccSSi-Wei Liu NetClientState *nc = qemu_get_queue(n->nic); 14896e790746SPaolo Bonzini 149059079029SYuri Benditovich virtio_net_disable_rss(n); 1491e22f0603SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) { 1492441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, false); 1493441537f1SJason Wang return queue_pairs ? VIRTIO_NET_OK : VIRTIO_NET_ERR; 1494e22f0603SYuri Benditovich } 149559079029SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) { 1496441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, true); 149759079029SYuri Benditovich } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) { 149859079029SYuri Benditovich struct virtio_net_ctrl_mq mq; 149959079029SYuri Benditovich size_t s; 150059079029SYuri Benditovich if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) { 150159079029SYuri Benditovich return VIRTIO_NET_ERR; 150259079029SYuri Benditovich } 15036e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq)); 15046e790746SPaolo Bonzini if (s != sizeof(mq)) { 15056e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15066e790746SPaolo Bonzini } 1507441537f1SJason Wang queue_pairs = virtio_lduw_p(vdev, &mq.virtqueue_pairs); 15086e790746SPaolo Bonzini 150959079029SYuri Benditovich } else { 15106e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15116e790746SPaolo Bonzini } 15126e790746SPaolo Bonzini 1513441537f1SJason Wang if (queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN || 1514441537f1SJason Wang queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX || 1515441537f1SJason Wang queue_pairs > n->max_queue_pairs || 15166e790746SPaolo Bonzini !n->multiqueue) { 15176e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15186e790746SPaolo Bonzini } 15196e790746SPaolo Bonzini 1520441537f1SJason Wang n->curr_queue_pairs = queue_pairs; 1521ca8717f9SEugenio Pérez if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 1522ca8717f9SEugenio Pérez /* 1523ca8717f9SEugenio Pérez * Avoid updating the backend for a vdpa device: We're only interested 1524ca8717f9SEugenio Pérez * in updating the device model queues. 1525ca8717f9SEugenio Pérez */ 1526ca8717f9SEugenio Pérez return VIRTIO_NET_OK; 1527ca8717f9SEugenio Pérez } 1528441537f1SJason Wang /* stop the backend before changing the number of queue_pairs to avoid handling a 15296e790746SPaolo Bonzini * disabled queue */ 153017a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 1531441537f1SJason Wang virtio_net_set_queue_pairs(n); 15326e790746SPaolo Bonzini 15336e790746SPaolo Bonzini return VIRTIO_NET_OK; 15346e790746SPaolo Bonzini } 1535ba7eadb5SGreg Kurz 1536640b8a1cSEugenio Pérez size_t virtio_net_handle_ctrl_iov(VirtIODevice *vdev, 1537640b8a1cSEugenio Pérez const struct iovec *in_sg, unsigned in_num, 1538640b8a1cSEugenio Pérez const struct iovec *out_sg, 1539640b8a1cSEugenio Pérez unsigned out_num) 15406e790746SPaolo Bonzini { 154117a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 15426e790746SPaolo Bonzini struct virtio_net_ctrl_hdr ctrl; 15436e790746SPaolo Bonzini virtio_net_ctrl_ack status = VIRTIO_NET_ERR; 15446e790746SPaolo Bonzini size_t s; 1545771b6ed3SJason Wang struct iovec *iov, *iov2; 1546640b8a1cSEugenio Pérez 1547640b8a1cSEugenio Pérez if (iov_size(in_sg, in_num) < sizeof(status) || 1548640b8a1cSEugenio Pérez iov_size(out_sg, out_num) < sizeof(ctrl)) { 1549640b8a1cSEugenio Pérez virtio_error(vdev, "virtio-net ctrl missing headers"); 1550640b8a1cSEugenio Pérez return 0; 1551640b8a1cSEugenio Pérez } 1552640b8a1cSEugenio Pérez 1553640b8a1cSEugenio Pérez iov2 = iov = g_memdup2(out_sg, sizeof(struct iovec) * out_num); 1554640b8a1cSEugenio Pérez s = iov_to_buf(iov, out_num, 0, &ctrl, sizeof(ctrl)); 1555640b8a1cSEugenio Pérez iov_discard_front(&iov, &out_num, sizeof(ctrl)); 1556640b8a1cSEugenio Pérez if (s != sizeof(ctrl)) { 1557640b8a1cSEugenio Pérez status = VIRTIO_NET_ERR; 1558640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_RX) { 1559640b8a1cSEugenio Pérez status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, out_num); 1560640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) { 1561640b8a1cSEugenio Pérez status = virtio_net_handle_mac(n, ctrl.cmd, iov, out_num); 1562640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) { 1563640b8a1cSEugenio Pérez status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, out_num); 1564640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) { 1565640b8a1cSEugenio Pérez status = virtio_net_handle_announce(n, ctrl.cmd, iov, out_num); 1566640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) { 1567640b8a1cSEugenio Pérez status = virtio_net_handle_mq(n, ctrl.cmd, iov, out_num); 1568640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) { 1569640b8a1cSEugenio Pérez status = virtio_net_handle_offloads(n, ctrl.cmd, iov, out_num); 1570640b8a1cSEugenio Pérez } 1571640b8a1cSEugenio Pérez 1572640b8a1cSEugenio Pérez s = iov_from_buf(in_sg, in_num, 0, &status, sizeof(status)); 1573640b8a1cSEugenio Pérez assert(s == sizeof(status)); 1574640b8a1cSEugenio Pérez 1575640b8a1cSEugenio Pérez g_free(iov2); 1576640b8a1cSEugenio Pérez return sizeof(status); 1577640b8a1cSEugenio Pérez } 1578640b8a1cSEugenio Pérez 1579640b8a1cSEugenio Pérez static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq) 1580640b8a1cSEugenio Pérez { 1581640b8a1cSEugenio Pérez VirtQueueElement *elem; 15826e790746SPaolo Bonzini 158351b19ebeSPaolo Bonzini for (;;) { 1584640b8a1cSEugenio Pérez size_t written; 158551b19ebeSPaolo Bonzini elem = virtqueue_pop(vq, sizeof(VirtQueueElement)); 158651b19ebeSPaolo Bonzini if (!elem) { 158751b19ebeSPaolo Bonzini break; 158851b19ebeSPaolo Bonzini } 1589640b8a1cSEugenio Pérez 1590640b8a1cSEugenio Pérez written = virtio_net_handle_ctrl_iov(vdev, elem->in_sg, elem->in_num, 1591640b8a1cSEugenio Pérez elem->out_sg, elem->out_num); 1592640b8a1cSEugenio Pérez if (written > 0) { 1593640b8a1cSEugenio Pérez virtqueue_push(vq, elem, written); 1594640b8a1cSEugenio Pérez virtio_notify(vdev, vq); 1595640b8a1cSEugenio Pérez g_free(elem); 1596640b8a1cSEugenio Pérez } else { 1597ba7eadb5SGreg Kurz virtqueue_detach_element(vq, elem, 0); 1598ba7eadb5SGreg Kurz g_free(elem); 1599ba7eadb5SGreg Kurz break; 16006e790746SPaolo Bonzini } 16016e790746SPaolo Bonzini } 16026e790746SPaolo Bonzini } 16036e790746SPaolo Bonzini 16046e790746SPaolo Bonzini /* RX */ 16056e790746SPaolo Bonzini 16066e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq) 16076e790746SPaolo Bonzini { 160817a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 16096e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(vq)); 16106e790746SPaolo Bonzini 16116e790746SPaolo Bonzini qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index)); 16126e790746SPaolo Bonzini } 16136e790746SPaolo Bonzini 1614b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc) 16156e790746SPaolo Bonzini { 16166e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 161717a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 16186e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 16196e790746SPaolo Bonzini 162017a0ca55SKONRAD Frederic if (!vdev->vm_running) { 1621b8c4b67eSPhilippe Mathieu-Daudé return false; 16226e790746SPaolo Bonzini } 16236e790746SPaolo Bonzini 1624441537f1SJason Wang if (nc->queue_index >= n->curr_queue_pairs) { 1625b8c4b67eSPhilippe Mathieu-Daudé return false; 16266e790746SPaolo Bonzini } 16276e790746SPaolo Bonzini 16286e790746SPaolo Bonzini if (!virtio_queue_ready(q->rx_vq) || 162917a0ca55SKONRAD Frederic !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 1630b8c4b67eSPhilippe Mathieu-Daudé return false; 16316e790746SPaolo Bonzini } 16326e790746SPaolo Bonzini 1633b8c4b67eSPhilippe Mathieu-Daudé return true; 16346e790746SPaolo Bonzini } 16356e790746SPaolo Bonzini 16366e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize) 16376e790746SPaolo Bonzini { 16386e790746SPaolo Bonzini VirtIONet *n = q->n; 16396e790746SPaolo Bonzini if (virtio_queue_empty(q->rx_vq) || 16406e790746SPaolo Bonzini (n->mergeable_rx_bufs && 16416e790746SPaolo Bonzini !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) { 16426e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 1); 16436e790746SPaolo Bonzini 16446e790746SPaolo Bonzini /* To avoid a race condition where the guest has made some buffers 16456e790746SPaolo Bonzini * available after the above check but before notification was 16466e790746SPaolo Bonzini * enabled, check for available buffers again. 16476e790746SPaolo Bonzini */ 16486e790746SPaolo Bonzini if (virtio_queue_empty(q->rx_vq) || 16496e790746SPaolo Bonzini (n->mergeable_rx_bufs && 16506e790746SPaolo Bonzini !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) { 16516e790746SPaolo Bonzini return 0; 16526e790746SPaolo Bonzini } 16536e790746SPaolo Bonzini } 16546e790746SPaolo Bonzini 16556e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 0); 16566e790746SPaolo Bonzini return 1; 16576e790746SPaolo Bonzini } 16586e790746SPaolo Bonzini 16591399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr) 1660032a74a1SCédric Le Goater { 16611399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->hdr_len); 16621399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->gso_size); 16631399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_start); 16641399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_offset); 1665032a74a1SCédric Le Goater } 1666032a74a1SCédric Le Goater 16676e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so 16686e790746SPaolo Bonzini * it never finds out that the packets don't have valid checksums. This 16696e790746SPaolo Bonzini * causes dhclient to get upset. Fedora's carried a patch for ages to 16706e790746SPaolo Bonzini * fix this with Xen but it hasn't appeared in an upstream release of 16716e790746SPaolo Bonzini * dhclient yet. 16726e790746SPaolo Bonzini * 16736e790746SPaolo Bonzini * To avoid breaking existing guests, we catch udp packets and add 16746e790746SPaolo Bonzini * checksums. This is terrible but it's better than hacking the guest 16756e790746SPaolo Bonzini * kernels. 16766e790746SPaolo Bonzini * 16776e790746SPaolo Bonzini * N.B. if we introduce a zero-copy API, this operation is no longer free so 16786e790746SPaolo Bonzini * we should provide a mechanism to disable it to avoid polluting the host 16796e790746SPaolo Bonzini * cache. 16806e790746SPaolo Bonzini */ 16816e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr, 16826e790746SPaolo Bonzini uint8_t *buf, size_t size) 16836e790746SPaolo Bonzini { 16846e790746SPaolo Bonzini if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */ 16856e790746SPaolo Bonzini (size > 27 && size < 1500) && /* normal sized MTU */ 16866e790746SPaolo Bonzini (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */ 16876e790746SPaolo Bonzini (buf[23] == 17) && /* ip.protocol == UDP */ 16886e790746SPaolo Bonzini (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */ 1689f5746335SBin Meng net_checksum_calculate(buf, size, CSUM_UDP); 16906e790746SPaolo Bonzini hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM; 16916e790746SPaolo Bonzini } 16926e790746SPaolo Bonzini } 16936e790746SPaolo Bonzini 16946e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt, 16956e790746SPaolo Bonzini const void *buf, size_t size) 16966e790746SPaolo Bonzini { 16976e790746SPaolo Bonzini if (n->has_vnet_hdr) { 16986e790746SPaolo Bonzini /* FIXME this cast is evil */ 16996e790746SPaolo Bonzini void *wbuf = (void *)buf; 17006e790746SPaolo Bonzini work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len, 17016e790746SPaolo Bonzini size - n->host_hdr_len); 17021bfa316cSGreg Kurz 17031bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 17041399c60dSRusty Russell virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf); 17051bfa316cSGreg Kurz } 17066e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr)); 17076e790746SPaolo Bonzini } else { 17086e790746SPaolo Bonzini struct virtio_net_hdr hdr = { 17096e790746SPaolo Bonzini .flags = 0, 17106e790746SPaolo Bonzini .gso_type = VIRTIO_NET_HDR_GSO_NONE 17116e790746SPaolo Bonzini }; 17126e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr); 17136e790746SPaolo Bonzini } 17146e790746SPaolo Bonzini } 17156e790746SPaolo Bonzini 17166e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size) 17176e790746SPaolo Bonzini { 17186e790746SPaolo Bonzini static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff}; 17196e790746SPaolo Bonzini static const uint8_t vlan[] = {0x81, 0x00}; 17206e790746SPaolo Bonzini uint8_t *ptr = (uint8_t *)buf; 17216e790746SPaolo Bonzini int i; 17226e790746SPaolo Bonzini 17236e790746SPaolo Bonzini if (n->promisc) 17246e790746SPaolo Bonzini return 1; 17256e790746SPaolo Bonzini 17266e790746SPaolo Bonzini ptr += n->host_hdr_len; 17276e790746SPaolo Bonzini 17286e790746SPaolo Bonzini if (!memcmp(&ptr[12], vlan, sizeof(vlan))) { 17297542d3e7SPeter Maydell int vid = lduw_be_p(ptr + 14) & 0xfff; 17306e790746SPaolo Bonzini if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f)))) 17316e790746SPaolo Bonzini return 0; 17326e790746SPaolo Bonzini } 17336e790746SPaolo Bonzini 17346e790746SPaolo Bonzini if (ptr[0] & 1) { // multicast 17356e790746SPaolo Bonzini if (!memcmp(ptr, bcast, sizeof(bcast))) { 17366e790746SPaolo Bonzini return !n->nobcast; 17376e790746SPaolo Bonzini } else if (n->nomulti) { 17386e790746SPaolo Bonzini return 0; 17396e790746SPaolo Bonzini } else if (n->allmulti || n->mac_table.multi_overflow) { 17406e790746SPaolo Bonzini return 1; 17416e790746SPaolo Bonzini } 17426e790746SPaolo Bonzini 17436e790746SPaolo Bonzini for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 17446e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 17456e790746SPaolo Bonzini return 1; 17466e790746SPaolo Bonzini } 17476e790746SPaolo Bonzini } 17486e790746SPaolo Bonzini } else { // unicast 17496e790746SPaolo Bonzini if (n->nouni) { 17506e790746SPaolo Bonzini return 0; 17516e790746SPaolo Bonzini } else if (n->alluni || n->mac_table.uni_overflow) { 17526e790746SPaolo Bonzini return 1; 17536e790746SPaolo Bonzini } else if (!memcmp(ptr, n->mac, ETH_ALEN)) { 17546e790746SPaolo Bonzini return 1; 17556e790746SPaolo Bonzini } 17566e790746SPaolo Bonzini 17576e790746SPaolo Bonzini for (i = 0; i < n->mac_table.first_multi; i++) { 17586e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 17596e790746SPaolo Bonzini return 1; 17606e790746SPaolo Bonzini } 17616e790746SPaolo Bonzini } 17626e790746SPaolo Bonzini } 17636e790746SPaolo Bonzini 17646e790746SPaolo Bonzini return 0; 17656e790746SPaolo Bonzini } 17666e790746SPaolo Bonzini 176769ff5ef8SAkihiko Odaki static uint8_t virtio_net_get_hash_type(bool hasip4, 176869ff5ef8SAkihiko Odaki bool hasip6, 176965f474bbSAkihiko Odaki EthL4HdrProto l4hdr_proto, 17704474e37aSYuri Benditovich uint32_t types) 17714474e37aSYuri Benditovich { 177269ff5ef8SAkihiko Odaki if (hasip4) { 177365f474bbSAkihiko Odaki switch (l4hdr_proto) { 177465f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_TCP: 177565f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4) { 17764474e37aSYuri Benditovich return NetPktRssIpV4Tcp; 17774474e37aSYuri Benditovich } 177865f474bbSAkihiko Odaki break; 177965f474bbSAkihiko Odaki 178065f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_UDP: 178165f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4) { 17824474e37aSYuri Benditovich return NetPktRssIpV4Udp; 17834474e37aSYuri Benditovich } 178465f474bbSAkihiko Odaki break; 178565f474bbSAkihiko Odaki 178665f474bbSAkihiko Odaki default: 178765f474bbSAkihiko Odaki break; 178865f474bbSAkihiko Odaki } 178965f474bbSAkihiko Odaki 17904474e37aSYuri Benditovich if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) { 17914474e37aSYuri Benditovich return NetPktRssIpV4; 17924474e37aSYuri Benditovich } 179369ff5ef8SAkihiko Odaki } else if (hasip6) { 179465f474bbSAkihiko Odaki switch (l4hdr_proto) { 179565f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_TCP: 179665f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) { 179765f474bbSAkihiko Odaki return NetPktRssIpV6TcpEx; 179865f474bbSAkihiko Odaki } 179965f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv6) { 180065f474bbSAkihiko Odaki return NetPktRssIpV6Tcp; 180165f474bbSAkihiko Odaki } 180265f474bbSAkihiko Odaki break; 18034474e37aSYuri Benditovich 180465f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_UDP: 180565f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) { 180665f474bbSAkihiko Odaki return NetPktRssIpV6UdpEx; 18074474e37aSYuri Benditovich } 180865f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv6) { 180965f474bbSAkihiko Odaki return NetPktRssIpV6Udp; 18104474e37aSYuri Benditovich } 181165f474bbSAkihiko Odaki break; 181265f474bbSAkihiko Odaki 181365f474bbSAkihiko Odaki default: 181465f474bbSAkihiko Odaki break; 181565f474bbSAkihiko Odaki } 181665f474bbSAkihiko Odaki 181765f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) { 181865f474bbSAkihiko Odaki return NetPktRssIpV6Ex; 181965f474bbSAkihiko Odaki } 182065f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv6) { 182165f474bbSAkihiko Odaki return NetPktRssIpV6; 18224474e37aSYuri Benditovich } 18234474e37aSYuri Benditovich } 18244474e37aSYuri Benditovich return 0xff; 18254474e37aSYuri Benditovich } 18264474e37aSYuri Benditovich 1827e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report, 1828e22f0603SYuri Benditovich uint32_t hash) 1829e22f0603SYuri Benditovich { 1830e22f0603SYuri Benditovich struct virtio_net_hdr_v1_hash *hdr = (void *)buf; 1831e22f0603SYuri Benditovich hdr->hash_value = hash; 1832e22f0603SYuri Benditovich hdr->hash_report = report; 1833e22f0603SYuri Benditovich } 1834e22f0603SYuri Benditovich 18354474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf, 183697cd965cSPaolo Bonzini size_t size) 18376e790746SPaolo Bonzini { 18386e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1839e22f0603SYuri Benditovich unsigned int index = nc->queue_index, new_index = index; 18404474e37aSYuri Benditovich struct NetRxPkt *pkt = n->rx_pkt; 18414474e37aSYuri Benditovich uint8_t net_hash_type; 18424474e37aSYuri Benditovich uint32_t hash; 184365f474bbSAkihiko Odaki bool hasip4, hasip6; 184465f474bbSAkihiko Odaki EthL4HdrProto l4hdr_proto; 1845e22f0603SYuri Benditovich static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = { 1846e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv4, 1847e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv4, 1848e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6, 1849e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6, 1850e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6_EX, 1851e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6_EX, 1852e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv4, 1853e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6, 1854e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6_EX 1855e22f0603SYuri Benditovich }; 18562f0fa232SAkihiko Odaki struct iovec iov = { 18572f0fa232SAkihiko Odaki .iov_base = (void *)buf, 18582f0fa232SAkihiko Odaki .iov_len = size 18592f0fa232SAkihiko Odaki }; 18604474e37aSYuri Benditovich 18612f0fa232SAkihiko Odaki net_rx_pkt_set_protocols(pkt, &iov, 1, n->host_hdr_len); 186265f474bbSAkihiko Odaki net_rx_pkt_get_protocols(pkt, &hasip4, &hasip6, &l4hdr_proto); 186365f474bbSAkihiko Odaki net_hash_type = virtio_net_get_hash_type(hasip4, hasip6, l4hdr_proto, 18644474e37aSYuri Benditovich n->rss_data.hash_types); 18654474e37aSYuri Benditovich if (net_hash_type > NetPktRssIpV6UdpEx) { 1866e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1867e22f0603SYuri Benditovich virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0); 1868e22f0603SYuri Benditovich } 1869e22f0603SYuri Benditovich return n->rss_data.redirect ? n->rss_data.default_queue : -1; 18704474e37aSYuri Benditovich } 18714474e37aSYuri Benditovich 18724474e37aSYuri Benditovich hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key); 1873e22f0603SYuri Benditovich 1874e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1875e22f0603SYuri Benditovich virtio_set_packet_hash(buf, reports[net_hash_type], hash); 1876e22f0603SYuri Benditovich } 1877e22f0603SYuri Benditovich 1878e22f0603SYuri Benditovich if (n->rss_data.redirect) { 18794474e37aSYuri Benditovich new_index = hash & (n->rss_data.indirections_len - 1); 18804474e37aSYuri Benditovich new_index = n->rss_data.indirections_table[new_index]; 18814474e37aSYuri Benditovich } 1882e22f0603SYuri Benditovich 1883e22f0603SYuri Benditovich return (index == new_index) ? -1 : new_index; 18844474e37aSYuri Benditovich } 18854474e37aSYuri Benditovich 18864474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf, 18874474e37aSYuri Benditovich size_t size, bool no_rss) 18884474e37aSYuri Benditovich { 18894474e37aSYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 18906e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 189117a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1892bedd7e93SJason Wang VirtQueueElement *elems[VIRTQUEUE_MAX_SIZE]; 1893bedd7e93SJason Wang size_t lens[VIRTQUEUE_MAX_SIZE]; 18946e790746SPaolo Bonzini struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE]; 18956e790746SPaolo Bonzini struct virtio_net_hdr_mrg_rxbuf mhdr; 18966e790746SPaolo Bonzini unsigned mhdr_cnt = 0; 1897bedd7e93SJason Wang size_t offset, i, guest_offset, j; 1898bedd7e93SJason Wang ssize_t err; 18996e790746SPaolo Bonzini 19006e790746SPaolo Bonzini if (!virtio_net_can_receive(nc)) { 19016e790746SPaolo Bonzini return -1; 19026e790746SPaolo Bonzini } 19036e790746SPaolo Bonzini 19040145c393SAndrew Melnychenko if (!no_rss && n->rss_data.enabled && n->rss_data.enabled_software_rss) { 19054474e37aSYuri Benditovich int index = virtio_net_process_rss(nc, buf, size); 19064474e37aSYuri Benditovich if (index >= 0) { 19074474e37aSYuri Benditovich NetClientState *nc2 = qemu_get_subqueue(n->nic, index); 19084474e37aSYuri Benditovich return virtio_net_receive_rcu(nc2, buf, size, true); 19094474e37aSYuri Benditovich } 19104474e37aSYuri Benditovich } 19114474e37aSYuri Benditovich 19126e790746SPaolo Bonzini /* hdr_len refers to the header we supply to the guest */ 19136e790746SPaolo Bonzini if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) { 19146e790746SPaolo Bonzini return 0; 19156e790746SPaolo Bonzini } 19166e790746SPaolo Bonzini 19176e790746SPaolo Bonzini if (!receive_filter(n, buf, size)) 19186e790746SPaolo Bonzini return size; 19196e790746SPaolo Bonzini 19206e790746SPaolo Bonzini offset = i = 0; 19216e790746SPaolo Bonzini 19226e790746SPaolo Bonzini while (offset < size) { 192351b19ebeSPaolo Bonzini VirtQueueElement *elem; 19246e790746SPaolo Bonzini int len, total; 192551b19ebeSPaolo Bonzini const struct iovec *sg; 19266e790746SPaolo Bonzini 19276e790746SPaolo Bonzini total = 0; 19286e790746SPaolo Bonzini 1929bedd7e93SJason Wang if (i == VIRTQUEUE_MAX_SIZE) { 1930bedd7e93SJason Wang virtio_error(vdev, "virtio-net unexpected long buffer chain"); 1931bedd7e93SJason Wang err = size; 1932bedd7e93SJason Wang goto err; 1933bedd7e93SJason Wang } 1934bedd7e93SJason Wang 193551b19ebeSPaolo Bonzini elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement)); 193651b19ebeSPaolo Bonzini if (!elem) { 1937ba10b9c0SGreg Kurz if (i) { 1938ba10b9c0SGreg Kurz virtio_error(vdev, "virtio-net unexpected empty queue: " 19396e790746SPaolo Bonzini "i %zd mergeable %d offset %zd, size %zd, " 1940019a3edbSGerd Hoffmann "guest hdr len %zd, host hdr len %zd " 1941019a3edbSGerd Hoffmann "guest features 0x%" PRIx64, 19426e790746SPaolo Bonzini i, n->mergeable_rx_bufs, offset, size, 1943019a3edbSGerd Hoffmann n->guest_hdr_len, n->host_hdr_len, 1944019a3edbSGerd Hoffmann vdev->guest_features); 1945ba10b9c0SGreg Kurz } 1946bedd7e93SJason Wang err = -1; 1947bedd7e93SJason Wang goto err; 19486e790746SPaolo Bonzini } 19496e790746SPaolo Bonzini 195051b19ebeSPaolo Bonzini if (elem->in_num < 1) { 1951ba10b9c0SGreg Kurz virtio_error(vdev, 1952ba10b9c0SGreg Kurz "virtio-net receive queue contains no in buffers"); 1953ba10b9c0SGreg Kurz virtqueue_detach_element(q->rx_vq, elem, 0); 1954ba10b9c0SGreg Kurz g_free(elem); 1955bedd7e93SJason Wang err = -1; 1956bedd7e93SJason Wang goto err; 19576e790746SPaolo Bonzini } 19586e790746SPaolo Bonzini 195951b19ebeSPaolo Bonzini sg = elem->in_sg; 19606e790746SPaolo Bonzini if (i == 0) { 19616e790746SPaolo Bonzini assert(offset == 0); 19626e790746SPaolo Bonzini if (n->mergeable_rx_bufs) { 19636e790746SPaolo Bonzini mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg), 196451b19ebeSPaolo Bonzini sg, elem->in_num, 19656e790746SPaolo Bonzini offsetof(typeof(mhdr), num_buffers), 19666e790746SPaolo Bonzini sizeof(mhdr.num_buffers)); 19676e790746SPaolo Bonzini } 19686e790746SPaolo Bonzini 196951b19ebeSPaolo Bonzini receive_header(n, sg, elem->in_num, buf, size); 1970e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1971e22f0603SYuri Benditovich offset = sizeof(mhdr); 1972e22f0603SYuri Benditovich iov_from_buf(sg, elem->in_num, offset, 1973e22f0603SYuri Benditovich buf + offset, n->host_hdr_len - sizeof(mhdr)); 1974e22f0603SYuri Benditovich } 19756e790746SPaolo Bonzini offset = n->host_hdr_len; 19766e790746SPaolo Bonzini total += n->guest_hdr_len; 19776e790746SPaolo Bonzini guest_offset = n->guest_hdr_len; 19786e790746SPaolo Bonzini } else { 19796e790746SPaolo Bonzini guest_offset = 0; 19806e790746SPaolo Bonzini } 19816e790746SPaolo Bonzini 19826e790746SPaolo Bonzini /* copy in packet. ugh */ 198351b19ebeSPaolo Bonzini len = iov_from_buf(sg, elem->in_num, guest_offset, 19846e790746SPaolo Bonzini buf + offset, size - offset); 19856e790746SPaolo Bonzini total += len; 19866e790746SPaolo Bonzini offset += len; 19876e790746SPaolo Bonzini /* If buffers can't be merged, at this point we 19886e790746SPaolo Bonzini * must have consumed the complete packet. 19896e790746SPaolo Bonzini * Otherwise, drop it. */ 19906e790746SPaolo Bonzini if (!n->mergeable_rx_bufs && offset < size) { 199127e57efeSLadi Prosek virtqueue_unpop(q->rx_vq, elem, total); 199251b19ebeSPaolo Bonzini g_free(elem); 1993bedd7e93SJason Wang err = size; 1994bedd7e93SJason Wang goto err; 19956e790746SPaolo Bonzini } 19966e790746SPaolo Bonzini 1997bedd7e93SJason Wang elems[i] = elem; 1998bedd7e93SJason Wang lens[i] = total; 1999bedd7e93SJason Wang i++; 20006e790746SPaolo Bonzini } 20016e790746SPaolo Bonzini 20026e790746SPaolo Bonzini if (mhdr_cnt) { 20031399c60dSRusty Russell virtio_stw_p(vdev, &mhdr.num_buffers, i); 20046e790746SPaolo Bonzini iov_from_buf(mhdr_sg, mhdr_cnt, 20056e790746SPaolo Bonzini 0, 20066e790746SPaolo Bonzini &mhdr.num_buffers, sizeof mhdr.num_buffers); 20076e790746SPaolo Bonzini } 20086e790746SPaolo Bonzini 2009bedd7e93SJason Wang for (j = 0; j < i; j++) { 2010bedd7e93SJason Wang /* signal other side */ 2011bedd7e93SJason Wang virtqueue_fill(q->rx_vq, elems[j], lens[j], j); 2012bedd7e93SJason Wang g_free(elems[j]); 2013bedd7e93SJason Wang } 2014bedd7e93SJason Wang 20156e790746SPaolo Bonzini virtqueue_flush(q->rx_vq, i); 201617a0ca55SKONRAD Frederic virtio_notify(vdev, q->rx_vq); 20176e790746SPaolo Bonzini 20186e790746SPaolo Bonzini return size; 2019bedd7e93SJason Wang 2020bedd7e93SJason Wang err: 2021bedd7e93SJason Wang for (j = 0; j < i; j++) { 2022abe300d9SJason Wang virtqueue_detach_element(q->rx_vq, elems[j], lens[j]); 2023bedd7e93SJason Wang g_free(elems[j]); 2024bedd7e93SJason Wang } 2025bedd7e93SJason Wang 2026bedd7e93SJason Wang return err; 20276e790746SPaolo Bonzini } 20286e790746SPaolo Bonzini 20292974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf, 203097cd965cSPaolo Bonzini size_t size) 203197cd965cSPaolo Bonzini { 2032068ddfa9SDr. David Alan Gilbert RCU_READ_LOCK_GUARD(); 203397cd965cSPaolo Bonzini 20344474e37aSYuri Benditovich return virtio_net_receive_rcu(nc, buf, size, false); 203597cd965cSPaolo Bonzini } 203697cd965cSPaolo Bonzini 20372974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain, 20382974e916SYuri Benditovich const uint8_t *buf, 20392974e916SYuri Benditovich VirtioNetRscUnit *unit) 20402974e916SYuri Benditovich { 20412974e916SYuri Benditovich uint16_t ip_hdrlen; 20422974e916SYuri Benditovich struct ip_header *ip; 20432974e916SYuri Benditovich 20442974e916SYuri Benditovich ip = (struct ip_header *)(buf + chain->n->guest_hdr_len 20452974e916SYuri Benditovich + sizeof(struct eth_header)); 20462974e916SYuri Benditovich unit->ip = (void *)ip; 20472974e916SYuri Benditovich ip_hdrlen = (ip->ip_ver_len & 0xF) << 2; 20482974e916SYuri Benditovich unit->ip_plen = &ip->ip_len; 20492974e916SYuri Benditovich unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen); 20502974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 20512974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen; 20522974e916SYuri Benditovich } 20532974e916SYuri Benditovich 20542974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain, 20552974e916SYuri Benditovich const uint8_t *buf, 20562974e916SYuri Benditovich VirtioNetRscUnit *unit) 20572974e916SYuri Benditovich { 20582974e916SYuri Benditovich struct ip6_header *ip6; 20592974e916SYuri Benditovich 20602974e916SYuri Benditovich ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len 20612974e916SYuri Benditovich + sizeof(struct eth_header)); 20622974e916SYuri Benditovich unit->ip = ip6; 20632974e916SYuri Benditovich unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 206478ee6bd0SPhilippe Mathieu-Daudé unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) 20652974e916SYuri Benditovich + sizeof(struct ip6_header)); 20662974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 20672974e916SYuri Benditovich 20682431f4f1SMichael Tokarev /* There is a difference between payload length in ipv4 and v6, 20692974e916SYuri Benditovich ip header is excluded in ipv6 */ 20702974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen; 20712974e916SYuri Benditovich } 20722974e916SYuri Benditovich 20732974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain, 20742974e916SYuri Benditovich VirtioNetRscSeg *seg) 20752974e916SYuri Benditovich { 20762974e916SYuri Benditovich int ret; 2077dd3d85e8SYuri Benditovich struct virtio_net_hdr_v1 *h; 20782974e916SYuri Benditovich 2079dd3d85e8SYuri Benditovich h = (struct virtio_net_hdr_v1 *)seg->buf; 20802974e916SYuri Benditovich h->flags = 0; 20812974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_NONE; 20822974e916SYuri Benditovich 20832974e916SYuri Benditovich if (seg->is_coalesced) { 2084dd3d85e8SYuri Benditovich h->rsc.segments = seg->packets; 2085dd3d85e8SYuri Benditovich h->rsc.dup_acks = seg->dup_ack; 20862974e916SYuri Benditovich h->flags = VIRTIO_NET_HDR_F_RSC_INFO; 20872974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 20882974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 20892974e916SYuri Benditovich } else { 20902974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 20912974e916SYuri Benditovich } 20922974e916SYuri Benditovich } 20932974e916SYuri Benditovich 20942974e916SYuri Benditovich ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size); 20952974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 20962974e916SYuri Benditovich g_free(seg->buf); 20972974e916SYuri Benditovich g_free(seg); 20982974e916SYuri Benditovich 20992974e916SYuri Benditovich return ret; 21002974e916SYuri Benditovich } 21012974e916SYuri Benditovich 21022974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq) 21032974e916SYuri Benditovich { 21042974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn; 21052974e916SYuri Benditovich VirtioNetRscChain *chain = (VirtioNetRscChain *)opq; 21062974e916SYuri Benditovich 21072974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) { 21082974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 21092974e916SYuri Benditovich chain->stat.purge_failed++; 21102974e916SYuri Benditovich continue; 21112974e916SYuri Benditovich } 21122974e916SYuri Benditovich } 21132974e916SYuri Benditovich 21142974e916SYuri Benditovich chain->stat.timer++; 21152974e916SYuri Benditovich if (!QTAILQ_EMPTY(&chain->buffers)) { 21162974e916SYuri Benditovich timer_mod(chain->drain_timer, 21172974e916SYuri Benditovich qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout); 21182974e916SYuri Benditovich } 21192974e916SYuri Benditovich } 21202974e916SYuri Benditovich 21212974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n) 21222974e916SYuri Benditovich { 21232974e916SYuri Benditovich VirtioNetRscChain *chain, *rn_chain; 21242974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn_seg; 21252974e916SYuri Benditovich 21262974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) { 21272974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) { 21282974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 21292974e916SYuri Benditovich g_free(seg->buf); 21302974e916SYuri Benditovich g_free(seg); 21312974e916SYuri Benditovich } 21322974e916SYuri Benditovich 21332974e916SYuri Benditovich timer_free(chain->drain_timer); 21342974e916SYuri Benditovich QTAILQ_REMOVE(&n->rsc_chains, chain, next); 21352974e916SYuri Benditovich g_free(chain); 21362974e916SYuri Benditovich } 21372974e916SYuri Benditovich } 21382974e916SYuri Benditovich 21392974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain, 21402974e916SYuri Benditovich NetClientState *nc, 21412974e916SYuri Benditovich const uint8_t *buf, size_t size) 21422974e916SYuri Benditovich { 21432974e916SYuri Benditovich uint16_t hdr_len; 21442974e916SYuri Benditovich VirtioNetRscSeg *seg; 21452974e916SYuri Benditovich 21462974e916SYuri Benditovich hdr_len = chain->n->guest_hdr_len; 2147b21e2380SMarkus Armbruster seg = g_new(VirtioNetRscSeg, 1); 21482974e916SYuri Benditovich seg->buf = g_malloc(hdr_len + sizeof(struct eth_header) 21492974e916SYuri Benditovich + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD); 21502974e916SYuri Benditovich memcpy(seg->buf, buf, size); 21512974e916SYuri Benditovich seg->size = size; 21522974e916SYuri Benditovich seg->packets = 1; 21532974e916SYuri Benditovich seg->dup_ack = 0; 21542974e916SYuri Benditovich seg->is_coalesced = 0; 21552974e916SYuri Benditovich seg->nc = nc; 21562974e916SYuri Benditovich 21572974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&chain->buffers, seg, next); 21582974e916SYuri Benditovich chain->stat.cache++; 21592974e916SYuri Benditovich 21602974e916SYuri Benditovich switch (chain->proto) { 21612974e916SYuri Benditovich case ETH_P_IP: 21622974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit); 21632974e916SYuri Benditovich break; 21642974e916SYuri Benditovich case ETH_P_IPV6: 21652974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit); 21662974e916SYuri Benditovich break; 21672974e916SYuri Benditovich default: 21682974e916SYuri Benditovich g_assert_not_reached(); 21692974e916SYuri Benditovich } 21702974e916SYuri Benditovich } 21712974e916SYuri Benditovich 21722974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain, 21732974e916SYuri Benditovich VirtioNetRscSeg *seg, 21742974e916SYuri Benditovich const uint8_t *buf, 21752974e916SYuri Benditovich struct tcp_header *n_tcp, 21762974e916SYuri Benditovich struct tcp_header *o_tcp) 21772974e916SYuri Benditovich { 21782974e916SYuri Benditovich uint32_t nack, oack; 21792974e916SYuri Benditovich uint16_t nwin, owin; 21802974e916SYuri Benditovich 21812974e916SYuri Benditovich nack = htonl(n_tcp->th_ack); 21822974e916SYuri Benditovich nwin = htons(n_tcp->th_win); 21832974e916SYuri Benditovich oack = htonl(o_tcp->th_ack); 21842974e916SYuri Benditovich owin = htons(o_tcp->th_win); 21852974e916SYuri Benditovich 21862974e916SYuri Benditovich if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) { 21872974e916SYuri Benditovich chain->stat.ack_out_of_win++; 21882974e916SYuri Benditovich return RSC_FINAL; 21892974e916SYuri Benditovich } else if (nack == oack) { 21902974e916SYuri Benditovich /* duplicated ack or window probe */ 21912974e916SYuri Benditovich if (nwin == owin) { 21922974e916SYuri Benditovich /* duplicated ack, add dup ack count due to whql test up to 1 */ 21932974e916SYuri Benditovich chain->stat.dup_ack++; 21942974e916SYuri Benditovich return RSC_FINAL; 21952974e916SYuri Benditovich } else { 21962974e916SYuri Benditovich /* Coalesce window update */ 21972974e916SYuri Benditovich o_tcp->th_win = n_tcp->th_win; 21982974e916SYuri Benditovich chain->stat.win_update++; 21992974e916SYuri Benditovich return RSC_COALESCE; 22002974e916SYuri Benditovich } 22012974e916SYuri Benditovich } else { 22022974e916SYuri Benditovich /* pure ack, go to 'C', finalize*/ 22032974e916SYuri Benditovich chain->stat.pure_ack++; 22042974e916SYuri Benditovich return RSC_FINAL; 22052974e916SYuri Benditovich } 22062974e916SYuri Benditovich } 22072974e916SYuri Benditovich 22082974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain, 22092974e916SYuri Benditovich VirtioNetRscSeg *seg, 22102974e916SYuri Benditovich const uint8_t *buf, 22112974e916SYuri Benditovich VirtioNetRscUnit *n_unit) 22122974e916SYuri Benditovich { 22132974e916SYuri Benditovich void *data; 22142974e916SYuri Benditovich uint16_t o_ip_len; 22152974e916SYuri Benditovich uint32_t nseq, oseq; 22162974e916SYuri Benditovich VirtioNetRscUnit *o_unit; 22172974e916SYuri Benditovich 22182974e916SYuri Benditovich o_unit = &seg->unit; 22192974e916SYuri Benditovich o_ip_len = htons(*o_unit->ip_plen); 22202974e916SYuri Benditovich nseq = htonl(n_unit->tcp->th_seq); 22212974e916SYuri Benditovich oseq = htonl(o_unit->tcp->th_seq); 22222974e916SYuri Benditovich 22232974e916SYuri Benditovich /* out of order or retransmitted. */ 22242974e916SYuri Benditovich if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) { 22252974e916SYuri Benditovich chain->stat.data_out_of_win++; 22262974e916SYuri Benditovich return RSC_FINAL; 22272974e916SYuri Benditovich } 22282974e916SYuri Benditovich 22292974e916SYuri Benditovich data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen; 22302974e916SYuri Benditovich if (nseq == oseq) { 22312974e916SYuri Benditovich if ((o_unit->payload == 0) && n_unit->payload) { 22322974e916SYuri Benditovich /* From no payload to payload, normal case, not a dup ack or etc */ 22332974e916SYuri Benditovich chain->stat.data_after_pure_ack++; 22342974e916SYuri Benditovich goto coalesce; 22352974e916SYuri Benditovich } else { 22362974e916SYuri Benditovich return virtio_net_rsc_handle_ack(chain, seg, buf, 22372974e916SYuri Benditovich n_unit->tcp, o_unit->tcp); 22382974e916SYuri Benditovich } 22392974e916SYuri Benditovich } else if ((nseq - oseq) != o_unit->payload) { 22402974e916SYuri Benditovich /* Not a consistent packet, out of order */ 22412974e916SYuri Benditovich chain->stat.data_out_of_order++; 22422974e916SYuri Benditovich return RSC_FINAL; 22432974e916SYuri Benditovich } else { 22442974e916SYuri Benditovich coalesce: 22452974e916SYuri Benditovich if ((o_ip_len + n_unit->payload) > chain->max_payload) { 22462974e916SYuri Benditovich chain->stat.over_size++; 22472974e916SYuri Benditovich return RSC_FINAL; 22482974e916SYuri Benditovich } 22492974e916SYuri Benditovich 22502974e916SYuri Benditovich /* Here comes the right data, the payload length in v4/v6 is different, 22512974e916SYuri Benditovich so use the field value to update and record the new data len */ 22522974e916SYuri Benditovich o_unit->payload += n_unit->payload; /* update new data len */ 22532974e916SYuri Benditovich 22542974e916SYuri Benditovich /* update field in ip header */ 22552974e916SYuri Benditovich *o_unit->ip_plen = htons(o_ip_len + n_unit->payload); 22562974e916SYuri Benditovich 22572974e916SYuri Benditovich /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced 22582974e916SYuri Benditovich for windows guest, while this may change the behavior for linux 22592974e916SYuri Benditovich guest (only if it uses RSC feature). */ 22602974e916SYuri Benditovich o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags; 22612974e916SYuri Benditovich 22622974e916SYuri Benditovich o_unit->tcp->th_ack = n_unit->tcp->th_ack; 22632974e916SYuri Benditovich o_unit->tcp->th_win = n_unit->tcp->th_win; 22642974e916SYuri Benditovich 22652974e916SYuri Benditovich memmove(seg->buf + seg->size, data, n_unit->payload); 22662974e916SYuri Benditovich seg->size += n_unit->payload; 22672974e916SYuri Benditovich seg->packets++; 22682974e916SYuri Benditovich chain->stat.coalesced++; 22692974e916SYuri Benditovich return RSC_COALESCE; 22702974e916SYuri Benditovich } 22712974e916SYuri Benditovich } 22722974e916SYuri Benditovich 22732974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain, 22742974e916SYuri Benditovich VirtioNetRscSeg *seg, 22752974e916SYuri Benditovich const uint8_t *buf, size_t size, 22762974e916SYuri Benditovich VirtioNetRscUnit *unit) 22772974e916SYuri Benditovich { 22782974e916SYuri Benditovich struct ip_header *ip1, *ip2; 22792974e916SYuri Benditovich 22802974e916SYuri Benditovich ip1 = (struct ip_header *)(unit->ip); 22812974e916SYuri Benditovich ip2 = (struct ip_header *)(seg->unit.ip); 22822974e916SYuri Benditovich if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst) 22832974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 22842974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 22852974e916SYuri Benditovich chain->stat.no_match++; 22862974e916SYuri Benditovich return RSC_NO_MATCH; 22872974e916SYuri Benditovich } 22882974e916SYuri Benditovich 22892974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 22902974e916SYuri Benditovich } 22912974e916SYuri Benditovich 22922974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain, 22932974e916SYuri Benditovich VirtioNetRscSeg *seg, 22942974e916SYuri Benditovich const uint8_t *buf, size_t size, 22952974e916SYuri Benditovich VirtioNetRscUnit *unit) 22962974e916SYuri Benditovich { 22972974e916SYuri Benditovich struct ip6_header *ip1, *ip2; 22982974e916SYuri Benditovich 22992974e916SYuri Benditovich ip1 = (struct ip6_header *)(unit->ip); 23002974e916SYuri Benditovich ip2 = (struct ip6_header *)(seg->unit.ip); 23012974e916SYuri Benditovich if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address)) 23022974e916SYuri Benditovich || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address)) 23032974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 23042974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 23052974e916SYuri Benditovich chain->stat.no_match++; 23062974e916SYuri Benditovich return RSC_NO_MATCH; 23072974e916SYuri Benditovich } 23082974e916SYuri Benditovich 23092974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 23102974e916SYuri Benditovich } 23112974e916SYuri Benditovich 23122974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain 23132974e916SYuri Benditovich * to prevent out of order */ 23142974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain, 23152974e916SYuri Benditovich struct tcp_header *tcp) 23162974e916SYuri Benditovich { 23172974e916SYuri Benditovich uint16_t tcp_hdr; 23182974e916SYuri Benditovich uint16_t tcp_flag; 23192974e916SYuri Benditovich 23202974e916SYuri Benditovich tcp_flag = htons(tcp->th_offset_flags); 23212974e916SYuri Benditovich tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10; 23222974e916SYuri Benditovich tcp_flag &= VIRTIO_NET_TCP_FLAG; 23232974e916SYuri Benditovich if (tcp_flag & TH_SYN) { 23242974e916SYuri Benditovich chain->stat.tcp_syn++; 23252974e916SYuri Benditovich return RSC_BYPASS; 23262974e916SYuri Benditovich } 23272974e916SYuri Benditovich 23282974e916SYuri Benditovich if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) { 23292974e916SYuri Benditovich chain->stat.tcp_ctrl_drain++; 23302974e916SYuri Benditovich return RSC_FINAL; 23312974e916SYuri Benditovich } 23322974e916SYuri Benditovich 23332974e916SYuri Benditovich if (tcp_hdr > sizeof(struct tcp_header)) { 23342974e916SYuri Benditovich chain->stat.tcp_all_opt++; 23352974e916SYuri Benditovich return RSC_FINAL; 23362974e916SYuri Benditovich } 23372974e916SYuri Benditovich 23382974e916SYuri Benditovich return RSC_CANDIDATE; 23392974e916SYuri Benditovich } 23402974e916SYuri Benditovich 23412974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain, 23422974e916SYuri Benditovich NetClientState *nc, 23432974e916SYuri Benditovich const uint8_t *buf, size_t size, 23442974e916SYuri Benditovich VirtioNetRscUnit *unit) 23452974e916SYuri Benditovich { 23462974e916SYuri Benditovich int ret; 23472974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 23482974e916SYuri Benditovich 23492974e916SYuri Benditovich if (QTAILQ_EMPTY(&chain->buffers)) { 23502974e916SYuri Benditovich chain->stat.empty_cache++; 23512974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 23522974e916SYuri Benditovich timer_mod(chain->drain_timer, 23532974e916SYuri Benditovich qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout); 23542974e916SYuri Benditovich return size; 23552974e916SYuri Benditovich } 23562974e916SYuri Benditovich 23572974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 23582974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 23592974e916SYuri Benditovich ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit); 23602974e916SYuri Benditovich } else { 23612974e916SYuri Benditovich ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit); 23622974e916SYuri Benditovich } 23632974e916SYuri Benditovich 23642974e916SYuri Benditovich if (ret == RSC_FINAL) { 23652974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 23662974e916SYuri Benditovich /* Send failed */ 23672974e916SYuri Benditovich chain->stat.final_failed++; 23682974e916SYuri Benditovich return 0; 23692974e916SYuri Benditovich } 23702974e916SYuri Benditovich 23712974e916SYuri Benditovich /* Send current packet */ 23722974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23732974e916SYuri Benditovich } else if (ret == RSC_NO_MATCH) { 23742974e916SYuri Benditovich continue; 23752974e916SYuri Benditovich } else { 23762974e916SYuri Benditovich /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */ 23772974e916SYuri Benditovich seg->is_coalesced = 1; 23782974e916SYuri Benditovich return size; 23792974e916SYuri Benditovich } 23802974e916SYuri Benditovich } 23812974e916SYuri Benditovich 23822974e916SYuri Benditovich chain->stat.no_match_cache++; 23832974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 23842974e916SYuri Benditovich return size; 23852974e916SYuri Benditovich } 23862974e916SYuri Benditovich 23872974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */ 23882974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain, 23892974e916SYuri Benditovich NetClientState *nc, 23902974e916SYuri Benditovich const uint8_t *buf, size_t size, 23912974e916SYuri Benditovich uint16_t ip_start, uint16_t ip_size, 23922974e916SYuri Benditovich uint16_t tcp_port) 23932974e916SYuri Benditovich { 23942974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 23952974e916SYuri Benditovich uint32_t ppair1, ppair2; 23962974e916SYuri Benditovich 23972974e916SYuri Benditovich ppair1 = *(uint32_t *)(buf + tcp_port); 23982974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 23992974e916SYuri Benditovich ppair2 = *(uint32_t *)(seg->buf + tcp_port); 24002974e916SYuri Benditovich if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size) 24012974e916SYuri Benditovich || (ppair1 != ppair2)) { 24022974e916SYuri Benditovich continue; 24032974e916SYuri Benditovich } 24042974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 24052974e916SYuri Benditovich chain->stat.drain_failed++; 24062974e916SYuri Benditovich } 24072974e916SYuri Benditovich 24082974e916SYuri Benditovich break; 24092974e916SYuri Benditovich } 24102974e916SYuri Benditovich 24112974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24122974e916SYuri Benditovich } 24132974e916SYuri Benditovich 24142974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain, 24152974e916SYuri Benditovich struct ip_header *ip, 24162974e916SYuri Benditovich const uint8_t *buf, size_t size) 24172974e916SYuri Benditovich { 24182974e916SYuri Benditovich uint16_t ip_len; 24192974e916SYuri Benditovich 24202974e916SYuri Benditovich /* Not an ipv4 packet */ 24212974e916SYuri Benditovich if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) { 24222974e916SYuri Benditovich chain->stat.ip_option++; 24232974e916SYuri Benditovich return RSC_BYPASS; 24242974e916SYuri Benditovich } 24252974e916SYuri Benditovich 24262974e916SYuri Benditovich /* Don't handle packets with ip option */ 24272974e916SYuri Benditovich if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) { 24282974e916SYuri Benditovich chain->stat.ip_option++; 24292974e916SYuri Benditovich return RSC_BYPASS; 24302974e916SYuri Benditovich } 24312974e916SYuri Benditovich 24322974e916SYuri Benditovich if (ip->ip_p != IPPROTO_TCP) { 24332974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 24342974e916SYuri Benditovich return RSC_BYPASS; 24352974e916SYuri Benditovich } 24362974e916SYuri Benditovich 24372974e916SYuri Benditovich /* Don't handle packets with ip fragment */ 24382974e916SYuri Benditovich if (!(htons(ip->ip_off) & IP_DF)) { 24392974e916SYuri Benditovich chain->stat.ip_frag++; 24402974e916SYuri Benditovich return RSC_BYPASS; 24412974e916SYuri Benditovich } 24422974e916SYuri Benditovich 24432974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 24442974e916SYuri Benditovich if (IPTOS_ECN(ip->ip_tos)) { 24452974e916SYuri Benditovich chain->stat.ip_ecn++; 24462974e916SYuri Benditovich return RSC_BYPASS; 24472974e916SYuri Benditovich } 24482974e916SYuri Benditovich 24492974e916SYuri Benditovich ip_len = htons(ip->ip_len); 24502974e916SYuri Benditovich if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header)) 24512974e916SYuri Benditovich || ip_len > (size - chain->n->guest_hdr_len - 24522974e916SYuri Benditovich sizeof(struct eth_header))) { 24532974e916SYuri Benditovich chain->stat.ip_hacked++; 24542974e916SYuri Benditovich return RSC_BYPASS; 24552974e916SYuri Benditovich } 24562974e916SYuri Benditovich 24572974e916SYuri Benditovich return RSC_CANDIDATE; 24582974e916SYuri Benditovich } 24592974e916SYuri Benditovich 24602974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain, 24612974e916SYuri Benditovich NetClientState *nc, 24622974e916SYuri Benditovich const uint8_t *buf, size_t size) 24632974e916SYuri Benditovich { 24642974e916SYuri Benditovich int32_t ret; 24652974e916SYuri Benditovich uint16_t hdr_len; 24662974e916SYuri Benditovich VirtioNetRscUnit unit; 24672974e916SYuri Benditovich 24682974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 24692974e916SYuri Benditovich 24702974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header) 24712974e916SYuri Benditovich + sizeof(struct tcp_header))) { 24722974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 24732974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24742974e916SYuri Benditovich } 24752974e916SYuri Benditovich 24762974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, buf, &unit); 24772974e916SYuri Benditovich if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size) 24782974e916SYuri Benditovich != RSC_CANDIDATE) { 24792974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24802974e916SYuri Benditovich } 24812974e916SYuri Benditovich 24822974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 24832974e916SYuri Benditovich if (ret == RSC_BYPASS) { 24842974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24852974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 24862974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 24872974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 12), 24882974e916SYuri Benditovich VIRTIO_NET_IP4_ADDR_SIZE, 24892974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)); 24902974e916SYuri Benditovich } 24912974e916SYuri Benditovich 24922974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 24932974e916SYuri Benditovich } 24942974e916SYuri Benditovich 24952974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain, 24962974e916SYuri Benditovich struct ip6_header *ip6, 24972974e916SYuri Benditovich const uint8_t *buf, size_t size) 24982974e916SYuri Benditovich { 24992974e916SYuri Benditovich uint16_t ip_len; 25002974e916SYuri Benditovich 25012974e916SYuri Benditovich if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4) 25022974e916SYuri Benditovich != IP_HEADER_VERSION_6) { 25032974e916SYuri Benditovich return RSC_BYPASS; 25042974e916SYuri Benditovich } 25052974e916SYuri Benditovich 25062974e916SYuri Benditovich /* Both option and protocol is checked in this */ 25072974e916SYuri Benditovich if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) { 25082974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 25092974e916SYuri Benditovich return RSC_BYPASS; 25102974e916SYuri Benditovich } 25112974e916SYuri Benditovich 25122974e916SYuri Benditovich ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 25132974e916SYuri Benditovich if (ip_len < sizeof(struct tcp_header) || 25142974e916SYuri Benditovich ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header) 25152974e916SYuri Benditovich - sizeof(struct ip6_header))) { 25162974e916SYuri Benditovich chain->stat.ip_hacked++; 25172974e916SYuri Benditovich return RSC_BYPASS; 25182974e916SYuri Benditovich } 25192974e916SYuri Benditovich 25202974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 25212974e916SYuri Benditovich if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) { 25222974e916SYuri Benditovich chain->stat.ip_ecn++; 25232974e916SYuri Benditovich return RSC_BYPASS; 25242974e916SYuri Benditovich } 25252974e916SYuri Benditovich 25262974e916SYuri Benditovich return RSC_CANDIDATE; 25272974e916SYuri Benditovich } 25282974e916SYuri Benditovich 25292974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc, 25302974e916SYuri Benditovich const uint8_t *buf, size_t size) 25312974e916SYuri Benditovich { 25322974e916SYuri Benditovich int32_t ret; 25332974e916SYuri Benditovich uint16_t hdr_len; 25342974e916SYuri Benditovich VirtioNetRscChain *chain; 25352974e916SYuri Benditovich VirtioNetRscUnit unit; 25362974e916SYuri Benditovich 25373d558330SMarkus Armbruster chain = opq; 25382974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 25392974e916SYuri Benditovich 25402974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header) 25412974e916SYuri Benditovich + sizeof(tcp_header))) { 25422974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25432974e916SYuri Benditovich } 25442974e916SYuri Benditovich 25452974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, buf, &unit); 25462974e916SYuri Benditovich if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain, 25472974e916SYuri Benditovich unit.ip, buf, size)) { 25482974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25492974e916SYuri Benditovich } 25502974e916SYuri Benditovich 25512974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 25522974e916SYuri Benditovich if (ret == RSC_BYPASS) { 25532974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25542974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 25552974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 25562974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 8), 25572974e916SYuri Benditovich VIRTIO_NET_IP6_ADDR_SIZE, 25582974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) 25592974e916SYuri Benditovich + sizeof(struct ip6_header)); 25602974e916SYuri Benditovich } 25612974e916SYuri Benditovich 25622974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 25632974e916SYuri Benditovich } 25642974e916SYuri Benditovich 25652974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n, 25662974e916SYuri Benditovich NetClientState *nc, 25672974e916SYuri Benditovich uint16_t proto) 25682974e916SYuri Benditovich { 25692974e916SYuri Benditovich VirtioNetRscChain *chain; 25702974e916SYuri Benditovich 25712974e916SYuri Benditovich if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) { 25722974e916SYuri Benditovich return NULL; 25732974e916SYuri Benditovich } 25742974e916SYuri Benditovich 25752974e916SYuri Benditovich QTAILQ_FOREACH(chain, &n->rsc_chains, next) { 25762974e916SYuri Benditovich if (chain->proto == proto) { 25772974e916SYuri Benditovich return chain; 25782974e916SYuri Benditovich } 25792974e916SYuri Benditovich } 25802974e916SYuri Benditovich 25812974e916SYuri Benditovich chain = g_malloc(sizeof(*chain)); 25822974e916SYuri Benditovich chain->n = n; 25832974e916SYuri Benditovich chain->proto = proto; 25842974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP) { 25852974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD; 25862974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 25872974e916SYuri Benditovich } else { 25882974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD; 25892974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 25902974e916SYuri Benditovich } 25912974e916SYuri Benditovich chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST, 25922974e916SYuri Benditovich virtio_net_rsc_purge, chain); 25932974e916SYuri Benditovich memset(&chain->stat, 0, sizeof(chain->stat)); 25942974e916SYuri Benditovich 25952974e916SYuri Benditovich QTAILQ_INIT(&chain->buffers); 25962974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next); 25972974e916SYuri Benditovich 25982974e916SYuri Benditovich return chain; 25992974e916SYuri Benditovich } 26002974e916SYuri Benditovich 26012974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc, 26022974e916SYuri Benditovich const uint8_t *buf, 26032974e916SYuri Benditovich size_t size) 26042974e916SYuri Benditovich { 26052974e916SYuri Benditovich uint16_t proto; 26062974e916SYuri Benditovich VirtioNetRscChain *chain; 26072974e916SYuri Benditovich struct eth_header *eth; 26082974e916SYuri Benditovich VirtIONet *n; 26092974e916SYuri Benditovich 26102974e916SYuri Benditovich n = qemu_get_nic_opaque(nc); 26112974e916SYuri Benditovich if (size < (n->host_hdr_len + sizeof(struct eth_header))) { 26122974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26132974e916SYuri Benditovich } 26142974e916SYuri Benditovich 26152974e916SYuri Benditovich eth = (struct eth_header *)(buf + n->guest_hdr_len); 26162974e916SYuri Benditovich proto = htons(eth->h_proto); 26172974e916SYuri Benditovich 26182974e916SYuri Benditovich chain = virtio_net_rsc_lookup_chain(n, nc, proto); 26192974e916SYuri Benditovich if (chain) { 26202974e916SYuri Benditovich chain->stat.received++; 26212974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) { 26222974e916SYuri Benditovich return virtio_net_rsc_receive4(chain, nc, buf, size); 26232974e916SYuri Benditovich } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) { 26242974e916SYuri Benditovich return virtio_net_rsc_receive6(chain, nc, buf, size); 26252974e916SYuri Benditovich } 26262974e916SYuri Benditovich } 26272974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26282974e916SYuri Benditovich } 26292974e916SYuri Benditovich 26302974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, 26312974e916SYuri Benditovich size_t size) 26322974e916SYuri Benditovich { 26332974e916SYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 26342974e916SYuri Benditovich if ((n->rsc4_enabled || n->rsc6_enabled)) { 26352974e916SYuri Benditovich return virtio_net_rsc_receive(nc, buf, size); 26362974e916SYuri Benditovich } else { 26372974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26382974e916SYuri Benditovich } 26392974e916SYuri Benditovich } 26402974e916SYuri Benditovich 26416e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q); 26426e790746SPaolo Bonzini 26436e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len) 26446e790746SPaolo Bonzini { 26456e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 26466e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 264717a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2648df8d0708SLaurent Vivier int ret; 26496e790746SPaolo Bonzini 265051b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, q->async_tx.elem, 0); 265117a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 26526e790746SPaolo Bonzini 265351b19ebeSPaolo Bonzini g_free(q->async_tx.elem); 265451b19ebeSPaolo Bonzini q->async_tx.elem = NULL; 26556e790746SPaolo Bonzini 26566e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 2657df8d0708SLaurent Vivier ret = virtio_net_flush_tx(q); 26587550a822SLaurent Vivier if (ret >= n->tx_burst) { 2659df8d0708SLaurent Vivier /* 2660df8d0708SLaurent Vivier * the flush has been stopped by tx_burst 2661df8d0708SLaurent Vivier * we will not receive notification for the 2662df8d0708SLaurent Vivier * remainining part, so re-schedule 2663df8d0708SLaurent Vivier */ 2664df8d0708SLaurent Vivier virtio_queue_set_notification(q->tx_vq, 0); 26657550a822SLaurent Vivier if (q->tx_bh) { 2666df8d0708SLaurent Vivier qemu_bh_schedule(q->tx_bh); 26677550a822SLaurent Vivier } else { 26687550a822SLaurent Vivier timer_mod(q->tx_timer, 26697550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 26707550a822SLaurent Vivier } 2671df8d0708SLaurent Vivier q->tx_waiting = 1; 2672df8d0708SLaurent Vivier } 26736e790746SPaolo Bonzini } 26746e790746SPaolo Bonzini 26756e790746SPaolo Bonzini /* TX */ 26766e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q) 26776e790746SPaolo Bonzini { 26786e790746SPaolo Bonzini VirtIONet *n = q->n; 267917a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 268051b19ebeSPaolo Bonzini VirtQueueElement *elem; 26816e790746SPaolo Bonzini int32_t num_packets = 0; 26826e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(q->tx_vq)); 268317a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 26846e790746SPaolo Bonzini return num_packets; 26856e790746SPaolo Bonzini } 26866e790746SPaolo Bonzini 268751b19ebeSPaolo Bonzini if (q->async_tx.elem) { 26886e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 26896e790746SPaolo Bonzini return num_packets; 26906e790746SPaolo Bonzini } 26916e790746SPaolo Bonzini 269251b19ebeSPaolo Bonzini for (;;) { 2693bd89dd98SJason Wang ssize_t ret; 269451b19ebeSPaolo Bonzini unsigned int out_num; 269551b19ebeSPaolo Bonzini struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg; 2696feb93f36SJason Wang struct virtio_net_hdr_mrg_rxbuf mhdr; 26976e790746SPaolo Bonzini 269851b19ebeSPaolo Bonzini elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement)); 269951b19ebeSPaolo Bonzini if (!elem) { 270051b19ebeSPaolo Bonzini break; 270151b19ebeSPaolo Bonzini } 270251b19ebeSPaolo Bonzini 270351b19ebeSPaolo Bonzini out_num = elem->out_num; 270451b19ebeSPaolo Bonzini out_sg = elem->out_sg; 27056e790746SPaolo Bonzini if (out_num < 1) { 2706fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header not in first element"); 2707fa5e56c2SGreg Kurz virtqueue_detach_element(q->tx_vq, elem, 0); 2708fa5e56c2SGreg Kurz g_free(elem); 2709fa5e56c2SGreg Kurz return -EINVAL; 27106e790746SPaolo Bonzini } 27116e790746SPaolo Bonzini 2712032a74a1SCédric Le Goater if (n->has_vnet_hdr) { 2713feb93f36SJason Wang if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) < 2714feb93f36SJason Wang n->guest_hdr_len) { 2715fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header incorrect"); 2716fa5e56c2SGreg Kurz virtqueue_detach_element(q->tx_vq, elem, 0); 2717fa5e56c2SGreg Kurz g_free(elem); 2718fa5e56c2SGreg Kurz return -EINVAL; 2719032a74a1SCédric Le Goater } 27201bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 2721feb93f36SJason Wang virtio_net_hdr_swap(vdev, (void *) &mhdr); 2722feb93f36SJason Wang sg2[0].iov_base = &mhdr; 2723feb93f36SJason Wang sg2[0].iov_len = n->guest_hdr_len; 2724feb93f36SJason Wang out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1, 2725feb93f36SJason Wang out_sg, out_num, 2726feb93f36SJason Wang n->guest_hdr_len, -1); 2727feb93f36SJason Wang if (out_num == VIRTQUEUE_MAX_SIZE) { 2728feb93f36SJason Wang goto drop; 2729032a74a1SCédric Le Goater } 2730feb93f36SJason Wang out_num += 1; 2731feb93f36SJason Wang out_sg = sg2; 2732feb93f36SJason Wang } 2733feb93f36SJason Wang } 27346e790746SPaolo Bonzini /* 27356e790746SPaolo Bonzini * If host wants to see the guest header as is, we can 27366e790746SPaolo Bonzini * pass it on unchanged. Otherwise, copy just the parts 27376e790746SPaolo Bonzini * that host is interested in. 27386e790746SPaolo Bonzini */ 27396e790746SPaolo Bonzini assert(n->host_hdr_len <= n->guest_hdr_len); 27406e790746SPaolo Bonzini if (n->host_hdr_len != n->guest_hdr_len) { 27416e790746SPaolo Bonzini unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg), 27426e790746SPaolo Bonzini out_sg, out_num, 27436e790746SPaolo Bonzini 0, n->host_hdr_len); 27446e790746SPaolo Bonzini sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num, 27456e790746SPaolo Bonzini out_sg, out_num, 27466e790746SPaolo Bonzini n->guest_hdr_len, -1); 27476e790746SPaolo Bonzini out_num = sg_num; 27486e790746SPaolo Bonzini out_sg = sg; 27496e790746SPaolo Bonzini } 27506e790746SPaolo Bonzini 27516e790746SPaolo Bonzini ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index), 27526e790746SPaolo Bonzini out_sg, out_num, virtio_net_tx_complete); 27536e790746SPaolo Bonzini if (ret == 0) { 27546e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 27556e790746SPaolo Bonzini q->async_tx.elem = elem; 27566e790746SPaolo Bonzini return -EBUSY; 27576e790746SPaolo Bonzini } 27586e790746SPaolo Bonzini 2759feb93f36SJason Wang drop: 276051b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, elem, 0); 276117a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 276251b19ebeSPaolo Bonzini g_free(elem); 27636e790746SPaolo Bonzini 27646e790746SPaolo Bonzini if (++num_packets >= n->tx_burst) { 27656e790746SPaolo Bonzini break; 27666e790746SPaolo Bonzini } 27676e790746SPaolo Bonzini } 27686e790746SPaolo Bonzini return num_packets; 27696e790746SPaolo Bonzini } 27706e790746SPaolo Bonzini 27717550a822SLaurent Vivier static void virtio_net_tx_timer(void *opaque); 27727550a822SLaurent Vivier 27736e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq) 27746e790746SPaolo Bonzini { 277517a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 27766e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 27776e790746SPaolo Bonzini 2778283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2779283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2780283e2c2aSYuri Benditovich return; 2781283e2c2aSYuri Benditovich } 2782283e2c2aSYuri Benditovich 27836e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 278417a0ca55SKONRAD Frederic if (!vdev->vm_running) { 27856e790746SPaolo Bonzini q->tx_waiting = 1; 27866e790746SPaolo Bonzini return; 27876e790746SPaolo Bonzini } 27886e790746SPaolo Bonzini 27896e790746SPaolo Bonzini if (q->tx_waiting) { 27907550a822SLaurent Vivier /* We already have queued packets, immediately flush */ 2791bc72ad67SAlex Bligh timer_del(q->tx_timer); 27927550a822SLaurent Vivier virtio_net_tx_timer(q); 27936e790746SPaolo Bonzini } else { 27947550a822SLaurent Vivier /* re-arm timer to flush it (and more) on next tick */ 2795bc72ad67SAlex Bligh timer_mod(q->tx_timer, 2796bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 27976e790746SPaolo Bonzini q->tx_waiting = 1; 27986e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 27996e790746SPaolo Bonzini } 28006e790746SPaolo Bonzini } 28016e790746SPaolo Bonzini 28026e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq) 28036e790746SPaolo Bonzini { 280417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 28056e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 28066e790746SPaolo Bonzini 2807283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2808283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2809283e2c2aSYuri Benditovich return; 2810283e2c2aSYuri Benditovich } 2811283e2c2aSYuri Benditovich 28126e790746SPaolo Bonzini if (unlikely(q->tx_waiting)) { 28136e790746SPaolo Bonzini return; 28146e790746SPaolo Bonzini } 28156e790746SPaolo Bonzini q->tx_waiting = 1; 28166e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 281717a0ca55SKONRAD Frederic if (!vdev->vm_running) { 28186e790746SPaolo Bonzini return; 28196e790746SPaolo Bonzini } 28206e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 28216e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 28226e790746SPaolo Bonzini } 28236e790746SPaolo Bonzini 28246e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque) 28256e790746SPaolo Bonzini { 28266e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 28276e790746SPaolo Bonzini VirtIONet *n = q->n; 282817a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 28297550a822SLaurent Vivier int ret; 28307550a822SLaurent Vivier 2831e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2832e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2833e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2834e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2835e8bcf842SMichael S. Tsirkin return; 2836e8bcf842SMichael S. Tsirkin } 28376e790746SPaolo Bonzini 28386e790746SPaolo Bonzini q->tx_waiting = 0; 28396e790746SPaolo Bonzini 28406e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 284117a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 28426e790746SPaolo Bonzini return; 284317a0ca55SKONRAD Frederic } 28446e790746SPaolo Bonzini 28457550a822SLaurent Vivier ret = virtio_net_flush_tx(q); 28467550a822SLaurent Vivier if (ret == -EBUSY || ret == -EINVAL) { 28477550a822SLaurent Vivier return; 28487550a822SLaurent Vivier } 28497550a822SLaurent Vivier /* 28507550a822SLaurent Vivier * If we flush a full burst of packets, assume there are 28517550a822SLaurent Vivier * more coming and immediately rearm 28527550a822SLaurent Vivier */ 28537550a822SLaurent Vivier if (ret >= n->tx_burst) { 28547550a822SLaurent Vivier q->tx_waiting = 1; 28557550a822SLaurent Vivier timer_mod(q->tx_timer, 28567550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 28577550a822SLaurent Vivier return; 28587550a822SLaurent Vivier } 28597550a822SLaurent Vivier /* 28607550a822SLaurent Vivier * If less than a full burst, re-enable notification and flush 28617550a822SLaurent Vivier * anything that may have come in while we weren't looking. If 28627550a822SLaurent Vivier * we find something, assume the guest is still active and rearm 28637550a822SLaurent Vivier */ 28646e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 28657550a822SLaurent Vivier ret = virtio_net_flush_tx(q); 28667550a822SLaurent Vivier if (ret > 0) { 28677550a822SLaurent Vivier virtio_queue_set_notification(q->tx_vq, 0); 28687550a822SLaurent Vivier q->tx_waiting = 1; 28697550a822SLaurent Vivier timer_mod(q->tx_timer, 28707550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 28717550a822SLaurent Vivier } 28726e790746SPaolo Bonzini } 28736e790746SPaolo Bonzini 28746e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque) 28756e790746SPaolo Bonzini { 28766e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 28776e790746SPaolo Bonzini VirtIONet *n = q->n; 287817a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 28796e790746SPaolo Bonzini int32_t ret; 28806e790746SPaolo Bonzini 2881e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2882e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2883e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2884e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2885e8bcf842SMichael S. Tsirkin return; 2886e8bcf842SMichael S. Tsirkin } 28876e790746SPaolo Bonzini 28886e790746SPaolo Bonzini q->tx_waiting = 0; 28896e790746SPaolo Bonzini 28906e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 289117a0ca55SKONRAD Frederic if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) { 28926e790746SPaolo Bonzini return; 289317a0ca55SKONRAD Frederic } 28946e790746SPaolo Bonzini 28956e790746SPaolo Bonzini ret = virtio_net_flush_tx(q); 2896fa5e56c2SGreg Kurz if (ret == -EBUSY || ret == -EINVAL) { 2897fa5e56c2SGreg Kurz return; /* Notification re-enable handled by tx_complete or device 2898fa5e56c2SGreg Kurz * broken */ 28996e790746SPaolo Bonzini } 29006e790746SPaolo Bonzini 29016e790746SPaolo Bonzini /* If we flush a full burst of packets, assume there are 29026e790746SPaolo Bonzini * more coming and immediately reschedule */ 29036e790746SPaolo Bonzini if (ret >= n->tx_burst) { 29046e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 29056e790746SPaolo Bonzini q->tx_waiting = 1; 29066e790746SPaolo Bonzini return; 29076e790746SPaolo Bonzini } 29086e790746SPaolo Bonzini 29096e790746SPaolo Bonzini /* If less than a full burst, re-enable notification and flush 29106e790746SPaolo Bonzini * anything that may have come in while we weren't looking. If 29116e790746SPaolo Bonzini * we find something, assume the guest is still active and reschedule */ 29126e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 2913fa5e56c2SGreg Kurz ret = virtio_net_flush_tx(q); 2914fa5e56c2SGreg Kurz if (ret == -EINVAL) { 2915fa5e56c2SGreg Kurz return; 2916fa5e56c2SGreg Kurz } else if (ret > 0) { 29176e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 29186e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 29196e790746SPaolo Bonzini q->tx_waiting = 1; 29206e790746SPaolo Bonzini } 29216e790746SPaolo Bonzini } 29226e790746SPaolo Bonzini 2923f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index) 2924f9d6dbf0SWen Congyang { 2925f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2926f9d6dbf0SWen Congyang 29271c0fbfa3SMichael S. Tsirkin n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size, 29281c0fbfa3SMichael S. Tsirkin virtio_net_handle_rx); 29299b02e161SWei Wang 2930f9d6dbf0SWen Congyang if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) { 2931f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 29329b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 29339b02e161SWei Wang virtio_net_handle_tx_timer); 2934f9d6dbf0SWen Congyang n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, 2935f9d6dbf0SWen Congyang virtio_net_tx_timer, 2936f9d6dbf0SWen Congyang &n->vqs[index]); 2937f9d6dbf0SWen Congyang } else { 2938f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 29399b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 29409b02e161SWei Wang virtio_net_handle_tx_bh); 2941f63192b0SAlexander Bulekov n->vqs[index].tx_bh = qemu_bh_new_guarded(virtio_net_tx_bh, &n->vqs[index], 2942f63192b0SAlexander Bulekov &DEVICE(vdev)->mem_reentrancy_guard); 2943f9d6dbf0SWen Congyang } 2944f9d6dbf0SWen Congyang 2945f9d6dbf0SWen Congyang n->vqs[index].tx_waiting = 0; 2946f9d6dbf0SWen Congyang n->vqs[index].n = n; 2947f9d6dbf0SWen Congyang } 2948f9d6dbf0SWen Congyang 2949f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index) 2950f9d6dbf0SWen Congyang { 2951f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2952f9d6dbf0SWen Congyang VirtIONetQueue *q = &n->vqs[index]; 2953f9d6dbf0SWen Congyang NetClientState *nc = qemu_get_subqueue(n->nic, index); 2954f9d6dbf0SWen Congyang 2955f9d6dbf0SWen Congyang qemu_purge_queued_packets(nc); 2956f9d6dbf0SWen Congyang 2957f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2); 2958f9d6dbf0SWen Congyang if (q->tx_timer) { 2959f9d6dbf0SWen Congyang timer_free(q->tx_timer); 2960f989c30cSYunjian Wang q->tx_timer = NULL; 2961f9d6dbf0SWen Congyang } else { 2962f9d6dbf0SWen Congyang qemu_bh_delete(q->tx_bh); 2963f989c30cSYunjian Wang q->tx_bh = NULL; 2964f9d6dbf0SWen Congyang } 2965f989c30cSYunjian Wang q->tx_waiting = 0; 2966f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2 + 1); 2967f9d6dbf0SWen Congyang } 2968f9d6dbf0SWen Congyang 2969441537f1SJason Wang static void virtio_net_change_num_queue_pairs(VirtIONet *n, int new_max_queue_pairs) 2970f9d6dbf0SWen Congyang { 2971f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2972f9d6dbf0SWen Congyang int old_num_queues = virtio_get_num_queues(vdev); 2973441537f1SJason Wang int new_num_queues = new_max_queue_pairs * 2 + 1; 2974f9d6dbf0SWen Congyang int i; 2975f9d6dbf0SWen Congyang 2976f9d6dbf0SWen Congyang assert(old_num_queues >= 3); 2977f9d6dbf0SWen Congyang assert(old_num_queues % 2 == 1); 2978f9d6dbf0SWen Congyang 2979f9d6dbf0SWen Congyang if (old_num_queues == new_num_queues) { 2980f9d6dbf0SWen Congyang return; 2981f9d6dbf0SWen Congyang } 2982f9d6dbf0SWen Congyang 2983f9d6dbf0SWen Congyang /* 2984f9d6dbf0SWen Congyang * We always need to remove and add ctrl vq if 2985f9d6dbf0SWen Congyang * old_num_queues != new_num_queues. Remove ctrl_vq first, 298620f86a75SYuval Shaia * and then we only enter one of the following two loops. 2987f9d6dbf0SWen Congyang */ 2988f9d6dbf0SWen Congyang virtio_del_queue(vdev, old_num_queues - 1); 2989f9d6dbf0SWen Congyang 2990f9d6dbf0SWen Congyang for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) { 2991f9d6dbf0SWen Congyang /* new_num_queues < old_num_queues */ 2992f9d6dbf0SWen Congyang virtio_net_del_queue(n, i / 2); 2993f9d6dbf0SWen Congyang } 2994f9d6dbf0SWen Congyang 2995f9d6dbf0SWen Congyang for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) { 2996f9d6dbf0SWen Congyang /* new_num_queues > old_num_queues */ 2997f9d6dbf0SWen Congyang virtio_net_add_queue(n, i / 2); 2998f9d6dbf0SWen Congyang } 2999f9d6dbf0SWen Congyang 3000f9d6dbf0SWen Congyang /* add ctrl_vq last */ 3001f9d6dbf0SWen Congyang n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 3002f9d6dbf0SWen Congyang } 3003f9d6dbf0SWen Congyang 3004ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue) 30056e790746SPaolo Bonzini { 3006441537f1SJason Wang int max = multiqueue ? n->max_queue_pairs : 1; 3007f9d6dbf0SWen Congyang 30086e790746SPaolo Bonzini n->multiqueue = multiqueue; 3009441537f1SJason Wang virtio_net_change_num_queue_pairs(n, max); 30106e790746SPaolo Bonzini 3011441537f1SJason Wang virtio_net_set_queue_pairs(n); 30126e790746SPaolo Bonzini } 30136e790746SPaolo Bonzini 3014982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id) 3015037dab2fSGreg Kurz { 3016982b78c5SDr. David Alan Gilbert VirtIONet *n = opaque; 3017982b78c5SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 3018037dab2fSGreg Kurz int i, link_down; 3019037dab2fSGreg Kurz 30209d8c6a25SDr. David Alan Gilbert trace_virtio_net_post_load_device(); 3021982b78c5SDr. David Alan Gilbert virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs, 302295129d6fSCornelia Huck virtio_vdev_has_feature(vdev, 3023e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 3024e22f0603SYuri Benditovich virtio_vdev_has_feature(vdev, 3025e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 30266e790746SPaolo Bonzini 30276e790746SPaolo Bonzini /* MAC_TABLE_ENTRIES may be different from the saved image */ 3028982b78c5SDr. David Alan Gilbert if (n->mac_table.in_use > MAC_TABLE_ENTRIES) { 30296e790746SPaolo Bonzini n->mac_table.in_use = 0; 30306e790746SPaolo Bonzini } 30316e790746SPaolo Bonzini 3032982b78c5SDr. David Alan Gilbert if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 30336c666823SMichael S. Tsirkin n->curr_guest_offloads = virtio_net_supported_guest_offloads(n); 30346c666823SMichael S. Tsirkin } 30356c666823SMichael S. Tsirkin 30367788c3f2SMikhail Sennikovsky /* 30377788c3f2SMikhail Sennikovsky * curr_guest_offloads will be later overwritten by the 30387788c3f2SMikhail Sennikovsky * virtio_set_features_nocheck call done from the virtio_load. 30397788c3f2SMikhail Sennikovsky * Here we make sure it is preserved and restored accordingly 30407788c3f2SMikhail Sennikovsky * in the virtio_net_post_load_virtio callback. 30417788c3f2SMikhail Sennikovsky */ 30427788c3f2SMikhail Sennikovsky n->saved_guest_offloads = n->curr_guest_offloads; 30436c666823SMichael S. Tsirkin 3044441537f1SJason Wang virtio_net_set_queue_pairs(n); 30456e790746SPaolo Bonzini 30466e790746SPaolo Bonzini /* Find the first multicast entry in the saved MAC filter */ 30476e790746SPaolo Bonzini for (i = 0; i < n->mac_table.in_use; i++) { 30486e790746SPaolo Bonzini if (n->mac_table.macs[i * ETH_ALEN] & 1) { 30496e790746SPaolo Bonzini break; 30506e790746SPaolo Bonzini } 30516e790746SPaolo Bonzini } 30526e790746SPaolo Bonzini n->mac_table.first_multi = i; 30536e790746SPaolo Bonzini 30546e790746SPaolo Bonzini /* nc.link_down can't be migrated, so infer link_down according 30556e790746SPaolo Bonzini * to link status bit in n->status */ 30566e790746SPaolo Bonzini link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0; 3057441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 30586e790746SPaolo Bonzini qemu_get_subqueue(n->nic, i)->link_down = link_down; 30596e790746SPaolo Bonzini } 30606e790746SPaolo Bonzini 30616c666823SMichael S. Tsirkin if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 30626c666823SMichael S. Tsirkin virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 30639d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 30649d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 30659d8c6a25SDr. David Alan Gilbert virtio_net_announce_timer, n); 30669d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 30679d8c6a25SDr. David Alan Gilbert timer_mod(n->announce_timer.tm, 30689d8c6a25SDr. David Alan Gilbert qemu_clock_get_ms(n->announce_timer.type)); 30699d8c6a25SDr. David Alan Gilbert } else { 3070944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 30719d8c6a25SDr. David Alan Gilbert } 30726c666823SMichael S. Tsirkin } 30736c666823SMichael S. Tsirkin 3074e41b7114SYuri Benditovich if (n->rss_data.enabled) { 30750145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = n->rss_data.populate_hash; 30760145c393SAndrew Melnychenko if (!n->rss_data.populate_hash) { 30770145c393SAndrew Melnychenko if (!virtio_net_attach_epbf_rss(n)) { 30780145c393SAndrew Melnychenko if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 30790145c393SAndrew Melnychenko warn_report("Can't post-load eBPF RSS for vhost"); 30800145c393SAndrew Melnychenko } else { 30810145c393SAndrew Melnychenko warn_report("Can't post-load eBPF RSS - " 30820145c393SAndrew Melnychenko "fallback to software RSS"); 30830145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 30840145c393SAndrew Melnychenko } 30850145c393SAndrew Melnychenko } 30860145c393SAndrew Melnychenko } 30870145c393SAndrew Melnychenko 3088e41b7114SYuri Benditovich trace_virtio_net_rss_enable(n->rss_data.hash_types, 3089e41b7114SYuri Benditovich n->rss_data.indirections_len, 3090e41b7114SYuri Benditovich sizeof(n->rss_data.key)); 3091e41b7114SYuri Benditovich } else { 3092e41b7114SYuri Benditovich trace_virtio_net_rss_disable(); 3093e41b7114SYuri Benditovich } 30946e790746SPaolo Bonzini return 0; 30956e790746SPaolo Bonzini } 30966e790746SPaolo Bonzini 30977788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev) 30987788c3f2SMikhail Sennikovsky { 30997788c3f2SMikhail Sennikovsky VirtIONet *n = VIRTIO_NET(vdev); 31007788c3f2SMikhail Sennikovsky /* 31017788c3f2SMikhail Sennikovsky * The actual needed state is now in saved_guest_offloads, 31027788c3f2SMikhail Sennikovsky * see virtio_net_post_load_device for detail. 31037788c3f2SMikhail Sennikovsky * Restore it back and apply the desired offloads. 31047788c3f2SMikhail Sennikovsky */ 31057788c3f2SMikhail Sennikovsky n->curr_guest_offloads = n->saved_guest_offloads; 31067788c3f2SMikhail Sennikovsky if (peer_has_vnet_hdr(n)) { 31077788c3f2SMikhail Sennikovsky virtio_net_apply_guest_offloads(n); 31087788c3f2SMikhail Sennikovsky } 31097788c3f2SMikhail Sennikovsky 31107788c3f2SMikhail Sennikovsky return 0; 31117788c3f2SMikhail Sennikovsky } 31127788c3f2SMikhail Sennikovsky 3113982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */ 3114982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = { 3115982b78c5SDr. David Alan Gilbert .name = "virtio-net-queue-tx_waiting", 3116982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3117982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(tx_waiting, VirtIONetQueue), 3118982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3119982b78c5SDr. David Alan Gilbert }, 3120982b78c5SDr. David Alan Gilbert }; 3121982b78c5SDr. David Alan Gilbert 3122441537f1SJason Wang static bool max_queue_pairs_gt_1(void *opaque, int version_id) 3123982b78c5SDr. David Alan Gilbert { 3124441537f1SJason Wang return VIRTIO_NET(opaque)->max_queue_pairs > 1; 3125982b78c5SDr. David Alan Gilbert } 3126982b78c5SDr. David Alan Gilbert 3127982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id) 3128982b78c5SDr. David Alan Gilbert { 3129982b78c5SDr. David Alan Gilbert return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque), 3130982b78c5SDr. David Alan Gilbert VIRTIO_NET_F_CTRL_GUEST_OFFLOADS); 3131982b78c5SDr. David Alan Gilbert } 3132982b78c5SDr. David Alan Gilbert 3133982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id) 3134982b78c5SDr. David Alan Gilbert { 3135982b78c5SDr. David Alan Gilbert return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES; 3136982b78c5SDr. David Alan Gilbert } 3137982b78c5SDr. David Alan Gilbert 3138982b78c5SDr. David Alan Gilbert static bool mac_table_doesnt_fit(void *opaque, int version_id) 3139982b78c5SDr. David Alan Gilbert { 3140982b78c5SDr. David Alan Gilbert return !mac_table_fits(opaque, version_id); 3141982b78c5SDr. David Alan Gilbert } 3142982b78c5SDr. David Alan Gilbert 3143982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods 3144982b78c5SDr. David Alan Gilbert * although only some fields are used by each. 3145982b78c5SDr. David Alan Gilbert */ 3146982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp { 3147982b78c5SDr. David Alan Gilbert VirtIONet *parent; 3148982b78c5SDr. David Alan Gilbert VirtIONetQueue *vqs_1; 3149441537f1SJason Wang uint16_t curr_queue_pairs_1; 3150982b78c5SDr. David Alan Gilbert uint8_t has_ufo; 3151982b78c5SDr. David Alan Gilbert uint32_t has_vnet_hdr; 3152982b78c5SDr. David Alan Gilbert }; 3153982b78c5SDr. David Alan Gilbert 3154982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than 3155441537f1SJason Wang * the 1st entry in the queue_pairs and only if there's more than one 3156982b78c5SDr. David Alan Gilbert * entry. We use the tmp mechanism to calculate a temporary 3157982b78c5SDr. David Alan Gilbert * pointer and count and also validate the count. 3158982b78c5SDr. David Alan Gilbert */ 3159982b78c5SDr. David Alan Gilbert 316044b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque) 3161982b78c5SDr. David Alan Gilbert { 3162982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3163982b78c5SDr. David Alan Gilbert 3164982b78c5SDr. David Alan Gilbert tmp->vqs_1 = tmp->parent->vqs + 1; 3165441537f1SJason Wang tmp->curr_queue_pairs_1 = tmp->parent->curr_queue_pairs - 1; 3166441537f1SJason Wang if (tmp->parent->curr_queue_pairs == 0) { 3167441537f1SJason Wang tmp->curr_queue_pairs_1 = 0; 3168982b78c5SDr. David Alan Gilbert } 316944b1ff31SDr. David Alan Gilbert 317044b1ff31SDr. David Alan Gilbert return 0; 3171982b78c5SDr. David Alan Gilbert } 3172982b78c5SDr. David Alan Gilbert 3173982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque) 3174982b78c5SDr. David Alan Gilbert { 3175982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3176982b78c5SDr. David Alan Gilbert 3177982b78c5SDr. David Alan Gilbert /* Reuse the pointer setup from save */ 3178982b78c5SDr. David Alan Gilbert virtio_net_tx_waiting_pre_save(opaque); 3179982b78c5SDr. David Alan Gilbert 3180441537f1SJason Wang if (tmp->parent->curr_queue_pairs > tmp->parent->max_queue_pairs) { 3181441537f1SJason Wang error_report("virtio-net: curr_queue_pairs %x > max_queue_pairs %x", 3182441537f1SJason Wang tmp->parent->curr_queue_pairs, tmp->parent->max_queue_pairs); 3183982b78c5SDr. David Alan Gilbert 3184982b78c5SDr. David Alan Gilbert return -EINVAL; 3185982b78c5SDr. David Alan Gilbert } 3186982b78c5SDr. David Alan Gilbert 3187982b78c5SDr. David Alan Gilbert return 0; /* all good */ 3188982b78c5SDr. David Alan Gilbert } 3189982b78c5SDr. David Alan Gilbert 3190982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = { 3191982b78c5SDr. David Alan Gilbert .name = "virtio-net-tx_waiting", 3192982b78c5SDr. David Alan Gilbert .pre_load = virtio_net_tx_waiting_pre_load, 3193982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_tx_waiting_pre_save, 3194982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3195982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp, 3196441537f1SJason Wang curr_queue_pairs_1, 3197982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3198982b78c5SDr. David Alan Gilbert struct VirtIONetQueue), 3199982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3200982b78c5SDr. David Alan Gilbert }, 3201982b78c5SDr. David Alan Gilbert }; 3202982b78c5SDr. David Alan Gilbert 3203982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the 3204982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3205982b78c5SDr. David Alan Gilbert */ 3206982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id) 3207982b78c5SDr. David Alan Gilbert { 3208982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3209982b78c5SDr. David Alan Gilbert 3210982b78c5SDr. David Alan Gilbert if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) { 3211982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires TUN_F_UFO support"); 3212982b78c5SDr. David Alan Gilbert return -EINVAL; 3213982b78c5SDr. David Alan Gilbert } 3214982b78c5SDr. David Alan Gilbert 3215982b78c5SDr. David Alan Gilbert return 0; 3216982b78c5SDr. David Alan Gilbert } 3217982b78c5SDr. David Alan Gilbert 321844b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque) 3219982b78c5SDr. David Alan Gilbert { 3220982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3221982b78c5SDr. David Alan Gilbert 3222982b78c5SDr. David Alan Gilbert tmp->has_ufo = tmp->parent->has_ufo; 322344b1ff31SDr. David Alan Gilbert 322444b1ff31SDr. David Alan Gilbert return 0; 3225982b78c5SDr. David Alan Gilbert } 3226982b78c5SDr. David Alan Gilbert 3227982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = { 3228982b78c5SDr. David Alan Gilbert .name = "virtio-net-ufo", 3229982b78c5SDr. David Alan Gilbert .post_load = virtio_net_ufo_post_load, 3230982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_ufo_pre_save, 3231982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3232982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp), 3233982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3234982b78c5SDr. David Alan Gilbert }, 3235982b78c5SDr. David Alan Gilbert }; 3236982b78c5SDr. David Alan Gilbert 3237982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the 3238982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3239982b78c5SDr. David Alan Gilbert */ 3240982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id) 3241982b78c5SDr. David Alan Gilbert { 3242982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3243982b78c5SDr. David Alan Gilbert 3244982b78c5SDr. David Alan Gilbert if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) { 3245982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires vnet_hdr=on"); 3246982b78c5SDr. David Alan Gilbert return -EINVAL; 3247982b78c5SDr. David Alan Gilbert } 3248982b78c5SDr. David Alan Gilbert 3249982b78c5SDr. David Alan Gilbert return 0; 3250982b78c5SDr. David Alan Gilbert } 3251982b78c5SDr. David Alan Gilbert 325244b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque) 3253982b78c5SDr. David Alan Gilbert { 3254982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3255982b78c5SDr. David Alan Gilbert 3256982b78c5SDr. David Alan Gilbert tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr; 325744b1ff31SDr. David Alan Gilbert 325844b1ff31SDr. David Alan Gilbert return 0; 3259982b78c5SDr. David Alan Gilbert } 3260982b78c5SDr. David Alan Gilbert 3261982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = { 3262982b78c5SDr. David Alan Gilbert .name = "virtio-net-vnet", 3263982b78c5SDr. David Alan Gilbert .post_load = virtio_net_vnet_post_load, 3264982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_vnet_pre_save, 3265982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3266982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp), 3267982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3268982b78c5SDr. David Alan Gilbert }, 3269982b78c5SDr. David Alan Gilbert }; 3270982b78c5SDr. David Alan Gilbert 3271e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque) 3272e41b7114SYuri Benditovich { 3273e41b7114SYuri Benditovich return VIRTIO_NET(opaque)->rss_data.enabled; 3274e41b7114SYuri Benditovich } 3275e41b7114SYuri Benditovich 3276e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = { 3277e41b7114SYuri Benditovich .name = "virtio-net-device/rss", 3278e41b7114SYuri Benditovich .version_id = 1, 3279e41b7114SYuri Benditovich .minimum_version_id = 1, 3280e41b7114SYuri Benditovich .needed = virtio_net_rss_needed, 3281e41b7114SYuri Benditovich .fields = (VMStateField[]) { 3282e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.enabled, VirtIONet), 3283e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.redirect, VirtIONet), 3284e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.populate_hash, VirtIONet), 3285e41b7114SYuri Benditovich VMSTATE_UINT32(rss_data.hash_types, VirtIONet), 3286e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.indirections_len, VirtIONet), 3287e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.default_queue, VirtIONet), 3288e41b7114SYuri Benditovich VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet, 3289e41b7114SYuri Benditovich VIRTIO_NET_RSS_MAX_KEY_SIZE), 3290e41b7114SYuri Benditovich VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet, 3291e41b7114SYuri Benditovich rss_data.indirections_len, 0, 3292e41b7114SYuri Benditovich vmstate_info_uint16, uint16_t), 3293e41b7114SYuri Benditovich VMSTATE_END_OF_LIST() 3294e41b7114SYuri Benditovich }, 3295e41b7114SYuri Benditovich }; 3296e41b7114SYuri Benditovich 3297982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = { 3298982b78c5SDr. David Alan Gilbert .name = "virtio-net-device", 3299982b78c5SDr. David Alan Gilbert .version_id = VIRTIO_NET_VM_VERSION, 3300982b78c5SDr. David Alan Gilbert .minimum_version_id = VIRTIO_NET_VM_VERSION, 3301982b78c5SDr. David Alan Gilbert .post_load = virtio_net_post_load_device, 3302982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3303982b78c5SDr. David Alan Gilbert VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN), 3304982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_POINTER(vqs, VirtIONet, 3305982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3306982b78c5SDr. David Alan Gilbert VirtIONetQueue), 3307982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet), 3308982b78c5SDr. David Alan Gilbert VMSTATE_UINT16(status, VirtIONet), 3309982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(promisc, VirtIONet), 3310982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(allmulti, VirtIONet), 3311982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mac_table.in_use, VirtIONet), 3312982b78c5SDr. David Alan Gilbert 3313982b78c5SDr. David Alan Gilbert /* Guarded pair: If it fits we load it, else we throw it away 3314982b78c5SDr. David Alan Gilbert * - can happen if source has a larger MAC table.; post-load 3315982b78c5SDr. David Alan Gilbert * sets flags in this case. 3316982b78c5SDr. David Alan Gilbert */ 3317982b78c5SDr. David Alan Gilbert VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet, 3318982b78c5SDr. David Alan Gilbert 0, mac_table_fits, mac_table.in_use, 3319982b78c5SDr. David Alan Gilbert ETH_ALEN), 3320982b78c5SDr. David Alan Gilbert VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0, 3321982b78c5SDr. David Alan Gilbert mac_table.in_use, ETH_ALEN), 3322982b78c5SDr. David Alan Gilbert 3323982b78c5SDr. David Alan Gilbert /* Note: This is an array of uint32's that's always been saved as a 3324982b78c5SDr. David Alan Gilbert * buffer; hold onto your endiannesses; it's actually used as a bitmap 3325982b78c5SDr. David Alan Gilbert * but based on the uint. 3326982b78c5SDr. David Alan Gilbert */ 3327982b78c5SDr. David Alan Gilbert VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3), 3328982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3329982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_vnet), 3330982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet), 3331982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet), 3332982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(alluni, VirtIONet), 3333982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nomulti, VirtIONet), 3334982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nouni, VirtIONet), 3335982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nobcast, VirtIONet), 3336982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3337982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_ufo), 3338441537f1SJason Wang VMSTATE_SINGLE_TEST(max_queue_pairs, VirtIONet, max_queue_pairs_gt_1, 0, 3339982b78c5SDr. David Alan Gilbert vmstate_info_uint16_equal, uint16_t), 3340441537f1SJason Wang VMSTATE_UINT16_TEST(curr_queue_pairs, VirtIONet, max_queue_pairs_gt_1), 3341982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3342982b78c5SDr. David Alan Gilbert vmstate_virtio_net_tx_waiting), 3343982b78c5SDr. David Alan Gilbert VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet, 3344982b78c5SDr. David Alan Gilbert has_ctrl_guest_offloads), 3345982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3346982b78c5SDr. David Alan Gilbert }, 3347e41b7114SYuri Benditovich .subsections = (const VMStateDescription * []) { 3348e41b7114SYuri Benditovich &vmstate_virtio_net_rss, 3349e41b7114SYuri Benditovich NULL 3350e41b7114SYuri Benditovich } 3351982b78c5SDr. David Alan Gilbert }; 3352982b78c5SDr. David Alan Gilbert 33536e790746SPaolo Bonzini static NetClientInfo net_virtio_info = { 3354f394b2e2SEric Blake .type = NET_CLIENT_DRIVER_NIC, 33556e790746SPaolo Bonzini .size = sizeof(NICState), 33566e790746SPaolo Bonzini .can_receive = virtio_net_can_receive, 33576e790746SPaolo Bonzini .receive = virtio_net_receive, 33586e790746SPaolo Bonzini .link_status_changed = virtio_net_set_link_status, 3359b1be4280SAmos Kong .query_rx_filter = virtio_net_query_rxfilter, 3360b2c929f0SDr. David Alan Gilbert .announce = virtio_net_announce, 33616e790746SPaolo Bonzini }; 33626e790746SPaolo Bonzini 33636e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx) 33646e790746SPaolo Bonzini { 336517a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 336668b0a639SSi-Wei Liu NetClientState *nc; 33676e790746SPaolo Bonzini assert(n->vhost_started); 336868b0a639SSi-Wei Liu if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ) && idx == 2) { 336968b0a639SSi-Wei Liu /* Must guard against invalid features and bogus queue index 337068b0a639SSi-Wei Liu * from being set by malicious guest, or penetrated through 337168b0a639SSi-Wei Liu * buggy migration stream. 337268b0a639SSi-Wei Liu */ 337368b0a639SSi-Wei Liu if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 337468b0a639SSi-Wei Liu qemu_log_mask(LOG_GUEST_ERROR, 337568b0a639SSi-Wei Liu "%s: bogus vq index ignored\n", __func__); 337668b0a639SSi-Wei Liu return false; 337768b0a639SSi-Wei Liu } 337868b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, n->max_queue_pairs); 337968b0a639SSi-Wei Liu } else { 338068b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, vq2q(idx)); 338168b0a639SSi-Wei Liu } 3382544f0278SCindy Lu /* 3383544f0278SCindy Lu * Add the check for configure interrupt, Use VIRTIO_CONFIG_IRQ_IDX -1 33847e8094f0SAlex Bennée * as the macro of configure interrupt's IDX, If this driver does not 3385544f0278SCindy Lu * support, the function will return false 3386544f0278SCindy Lu */ 3387544f0278SCindy Lu 3388544f0278SCindy Lu if (idx == VIRTIO_CONFIG_IRQ_IDX) { 33898aab0d1dSCindy Lu return vhost_net_config_pending(get_vhost_net(nc->peer)); 3390544f0278SCindy Lu } 3391ed8b4afeSNikolay Nikolaev return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx); 33926e790746SPaolo Bonzini } 33936e790746SPaolo Bonzini 33946e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx, 33956e790746SPaolo Bonzini bool mask) 33966e790746SPaolo Bonzini { 339717a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 339868b0a639SSi-Wei Liu NetClientState *nc; 33996e790746SPaolo Bonzini assert(n->vhost_started); 340068b0a639SSi-Wei Liu if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ) && idx == 2) { 340168b0a639SSi-Wei Liu /* Must guard against invalid features and bogus queue index 340268b0a639SSi-Wei Liu * from being set by malicious guest, or penetrated through 340368b0a639SSi-Wei Liu * buggy migration stream. 340468b0a639SSi-Wei Liu */ 340568b0a639SSi-Wei Liu if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 340668b0a639SSi-Wei Liu qemu_log_mask(LOG_GUEST_ERROR, 340768b0a639SSi-Wei Liu "%s: bogus vq index ignored\n", __func__); 340868b0a639SSi-Wei Liu return; 340968b0a639SSi-Wei Liu } 341068b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, n->max_queue_pairs); 341168b0a639SSi-Wei Liu } else { 341268b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, vq2q(idx)); 341368b0a639SSi-Wei Liu } 3414544f0278SCindy Lu /* 3415544f0278SCindy Lu *Add the check for configure interrupt, Use VIRTIO_CONFIG_IRQ_IDX -1 34167e8094f0SAlex Bennée * as the macro of configure interrupt's IDX, If this driver does not 3417544f0278SCindy Lu * support, the function will return 3418544f0278SCindy Lu */ 3419544f0278SCindy Lu 3420544f0278SCindy Lu if (idx == VIRTIO_CONFIG_IRQ_IDX) { 34218aab0d1dSCindy Lu vhost_net_config_mask(get_vhost_net(nc->peer), vdev, mask); 3422544f0278SCindy Lu return; 3423544f0278SCindy Lu } 3424544f0278SCindy Lu vhost_net_virtqueue_mask(get_vhost_net(nc->peer), vdev, idx, mask); 34256e790746SPaolo Bonzini } 34266e790746SPaolo Bonzini 3427019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features) 34286e790746SPaolo Bonzini { 34290cd09c3aSCornelia Huck virtio_add_feature(&host_features, VIRTIO_NET_F_MAC); 3430a93e599dSMaxime Coquelin 3431d74c30c8SDaniil Tatianin n->config_size = virtio_get_config_size(&cfg_size_params, host_features); 343217ec5a86SKONRAD Frederic } 34336e790746SPaolo Bonzini 34348a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name, 34358a253ec2SKONRAD Frederic const char *type) 34368a253ec2SKONRAD Frederic { 34378a253ec2SKONRAD Frederic /* 34388a253ec2SKONRAD Frederic * The name can be NULL, the netclient name will be type.x. 34398a253ec2SKONRAD Frederic */ 34408a253ec2SKONRAD Frederic assert(type != NULL); 34418a253ec2SKONRAD Frederic 34428a253ec2SKONRAD Frederic g_free(n->netclient_name); 34438a253ec2SKONRAD Frederic g_free(n->netclient_type); 34448a253ec2SKONRAD Frederic n->netclient_name = g_strdup(name); 34458a253ec2SKONRAD Frederic n->netclient_type = g_strdup(type); 34468a253ec2SKONRAD Frederic } 34478a253ec2SKONRAD Frederic 34480e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev) 34499711cd0dSJens Freimann { 34509711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 34519711cd0dSJens Freimann PCIDevice *pci_dev; 34529711cd0dSJens Freimann Error *err = NULL; 34539711cd0dSJens Freimann 34540e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 34559711cd0dSJens Freimann if (hotplug_ctrl) { 34560e9a65c5SJuan Quintela pci_dev = PCI_DEVICE(dev); 34579711cd0dSJens Freimann pci_dev->partially_hotplugged = true; 34580e9a65c5SJuan Quintela hotplug_handler_unplug_request(hotplug_ctrl, dev, &err); 34599711cd0dSJens Freimann if (err) { 34609711cd0dSJens Freimann error_report_err(err); 34619711cd0dSJens Freimann return false; 34629711cd0dSJens Freimann } 34639711cd0dSJens Freimann } else { 34649711cd0dSJens Freimann return false; 34659711cd0dSJens Freimann } 34669711cd0dSJens Freimann return true; 34679711cd0dSJens Freimann } 34689711cd0dSJens Freimann 34690e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev, 34700e9a65c5SJuan Quintela Error **errp) 34719711cd0dSJens Freimann { 34725a0948d3SMarkus Armbruster Error *err = NULL; 34739711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 34740e9a65c5SJuan Quintela PCIDevice *pdev = PCI_DEVICE(dev); 347578274682SJuan Quintela BusState *primary_bus; 34769711cd0dSJens Freimann 34779711cd0dSJens Freimann if (!pdev->partially_hotplugged) { 34789711cd0dSJens Freimann return true; 34799711cd0dSJens Freimann } 34800e9a65c5SJuan Quintela primary_bus = dev->parent_bus; 348178274682SJuan Quintela if (!primary_bus) { 3482150ab54aSJens Freimann error_setg(errp, "virtio_net: couldn't find primary bus"); 34835a0948d3SMarkus Armbruster return false; 34849711cd0dSJens Freimann } 34850e9a65c5SJuan Quintela qdev_set_parent_bus(dev, primary_bus, &error_abort); 3486e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 34870e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 34889711cd0dSJens Freimann if (hotplug_ctrl) { 34890e9a65c5SJuan Quintela hotplug_handler_pre_plug(hotplug_ctrl, dev, &err); 34905a0948d3SMarkus Armbruster if (err) { 34915a0948d3SMarkus Armbruster goto out; 34925a0948d3SMarkus Armbruster } 34930e9a65c5SJuan Quintela hotplug_handler_plug(hotplug_ctrl, dev, &err); 34949711cd0dSJens Freimann } 3495109c20eaSLaurent Vivier pdev->partially_hotplugged = false; 3496150ab54aSJens Freimann 3497150ab54aSJens Freimann out: 34985a0948d3SMarkus Armbruster error_propagate(errp, err); 34995a0948d3SMarkus Armbruster return !err; 35009711cd0dSJens Freimann } 35019711cd0dSJens Freimann 350207a5d816SJuan Quintela static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationState *s) 35039711cd0dSJens Freimann { 35049711cd0dSJens Freimann bool should_be_hidden; 35059711cd0dSJens Freimann Error *err = NULL; 350607a5d816SJuan Quintela DeviceState *dev = failover_find_primary_device(n); 350707a5d816SJuan Quintela 350807a5d816SJuan Quintela if (!dev) { 350907a5d816SJuan Quintela return; 351007a5d816SJuan Quintela } 35119711cd0dSJens Freimann 3512e2bde83eSJuan Quintela should_be_hidden = qatomic_read(&n->failover_primary_hidden); 35139711cd0dSJens Freimann 35144dbac1aeSMarkus Armbruster if (migration_in_setup(s) && !should_be_hidden) { 351507a5d816SJuan Quintela if (failover_unplug_primary(n, dev)) { 351607a5d816SJuan Quintela vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev); 351707a5d816SJuan Quintela qapi_event_send_unplug_primary(dev->id); 3518e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 35199711cd0dSJens Freimann } else { 35209711cd0dSJens Freimann warn_report("couldn't unplug primary device"); 35219711cd0dSJens Freimann } 35229711cd0dSJens Freimann } else if (migration_has_failed(s)) { 3523150ab54aSJens Freimann /* We already unplugged the device let's plug it back */ 352407a5d816SJuan Quintela if (!failover_replug_primary(n, dev, &err)) { 35259711cd0dSJens Freimann if (err) { 35269711cd0dSJens Freimann error_report_err(err); 35279711cd0dSJens Freimann } 35289711cd0dSJens Freimann } 35299711cd0dSJens Freimann } 35309711cd0dSJens Freimann } 35319711cd0dSJens Freimann 35329711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data) 35339711cd0dSJens Freimann { 35349711cd0dSJens Freimann MigrationState *s = data; 35359711cd0dSJens Freimann VirtIONet *n = container_of(notifier, VirtIONet, migration_state); 35369711cd0dSJens Freimann virtio_net_handle_migration_primary(n, s); 35379711cd0dSJens Freimann } 35389711cd0dSJens Freimann 3539b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener, 3540f3558b1bSKevin Wolf const QDict *device_opts, 3541f3558b1bSKevin Wolf bool from_json, 3542f3558b1bSKevin Wolf Error **errp) 35439711cd0dSJens Freimann { 35449711cd0dSJens Freimann VirtIONet *n = container_of(listener, VirtIONet, primary_listener); 35454f0303aeSJuan Quintela const char *standby_id; 35469711cd0dSJens Freimann 35474d0e59acSJens Freimann if (!device_opts) { 354889631fedSJuan Quintela return false; 35494d0e59acSJens Freimann } 3550bcfc906bSLaurent Vivier 3551bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "failover_pair_id")) { 3552bcfc906bSLaurent Vivier return false; 3553bcfc906bSLaurent Vivier } 3554bcfc906bSLaurent Vivier 3555bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "id")) { 3556bcfc906bSLaurent Vivier error_setg(errp, "Device with failover_pair_id needs to have id"); 3557bcfc906bSLaurent Vivier return false; 3558bcfc906bSLaurent Vivier } 3559bcfc906bSLaurent Vivier 3560bcfc906bSLaurent Vivier standby_id = qdict_get_str(device_opts, "failover_pair_id"); 356189631fedSJuan Quintela if (g_strcmp0(standby_id, n->netclient_name) != 0) { 356289631fedSJuan Quintela return false; 35639711cd0dSJens Freimann } 35649711cd0dSJens Freimann 35657fe7791eSLaurent Vivier /* 35667fe7791eSLaurent Vivier * The hide helper can be called several times for a given device. 35677fe7791eSLaurent Vivier * Check there is only one primary for a virtio-net device but 35687fe7791eSLaurent Vivier * don't duplicate the qdict several times if it's called for the same 35697fe7791eSLaurent Vivier * device. 35707fe7791eSLaurent Vivier */ 3571259a10dbSKevin Wolf if (n->primary_opts) { 35727fe7791eSLaurent Vivier const char *old, *new; 35737fe7791eSLaurent Vivier /* devices with failover_pair_id always have an id */ 35747fe7791eSLaurent Vivier old = qdict_get_str(n->primary_opts, "id"); 35757fe7791eSLaurent Vivier new = qdict_get_str(device_opts, "id"); 35767fe7791eSLaurent Vivier if (strcmp(old, new) != 0) { 35777fe7791eSLaurent Vivier error_setg(errp, "Cannot attach more than one primary device to " 35787fe7791eSLaurent Vivier "'%s': '%s' and '%s'", n->netclient_name, old, new); 3579259a10dbSKevin Wolf return false; 3580259a10dbSKevin Wolf } 35817fe7791eSLaurent Vivier } else { 3582f3558b1bSKevin Wolf n->primary_opts = qdict_clone_shallow(device_opts); 3583f3558b1bSKevin Wolf n->primary_opts_from_json = from_json; 35847fe7791eSLaurent Vivier } 3585259a10dbSKevin Wolf 3586e2bde83eSJuan Quintela /* failover_primary_hidden is set during feature negotiation */ 35873abad4a2SJuan Quintela return qatomic_read(&n->failover_primary_hidden); 35889711cd0dSJens Freimann } 35899711cd0dSJens Freimann 3590e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp) 359117ec5a86SKONRAD Frederic { 3592e6f746b3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3593284a32f0SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3594284a32f0SAndreas Färber NetClientState *nc; 35951773d9eeSKONRAD Frederic int i; 359617ec5a86SKONRAD Frederic 3597a93e599dSMaxime Coquelin if (n->net_conf.mtu) { 3598127833eeSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_MTU); 3599a93e599dSMaxime Coquelin } 3600a93e599dSMaxime Coquelin 36019473939eSJason Baron if (n->net_conf.duplex_str) { 36029473939eSJason Baron if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) { 36039473939eSJason Baron n->net_conf.duplex = DUPLEX_HALF; 36049473939eSJason Baron } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) { 36059473939eSJason Baron n->net_conf.duplex = DUPLEX_FULL; 36069473939eSJason Baron } else { 36079473939eSJason Baron error_setg(errp, "'duplex' must be 'half' or 'full'"); 3608843c4cfcSMarkus Armbruster return; 36099473939eSJason Baron } 36109473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 36119473939eSJason Baron } else { 36129473939eSJason Baron n->net_conf.duplex = DUPLEX_UNKNOWN; 36139473939eSJason Baron } 36149473939eSJason Baron 36159473939eSJason Baron if (n->net_conf.speed < SPEED_UNKNOWN) { 36169473939eSJason Baron error_setg(errp, "'speed' must be between 0 and INT_MAX"); 3617843c4cfcSMarkus Armbruster return; 3618843c4cfcSMarkus Armbruster } 3619843c4cfcSMarkus Armbruster if (n->net_conf.speed >= 0) { 36209473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 36219473939eSJason Baron } 36229473939eSJason Baron 36239711cd0dSJens Freimann if (n->failover) { 3624b91ad981SJuan Quintela n->primary_listener.hide_device = failover_hide_primary_device; 3625e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 36269711cd0dSJens Freimann device_listener_register(&n->primary_listener); 3627d9cda213SSteve Sistare migration_add_notifier(&n->migration_state, 3628d9cda213SSteve Sistare virtio_net_migration_state_notifier); 36299711cd0dSJens Freimann n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY); 36309711cd0dSJens Freimann } 36319711cd0dSJens Freimann 3632da3e8a23SShannon Zhao virtio_net_set_config_size(n, n->host_features); 36333857cd5cSJonah Palmer virtio_init(vdev, VIRTIO_ID_NET, n->config_size); 363417ec5a86SKONRAD Frederic 36351c0fbfa3SMichael S. Tsirkin /* 36361c0fbfa3SMichael S. Tsirkin * We set a lower limit on RX queue size to what it always was. 36371c0fbfa3SMichael S. Tsirkin * Guests that want a smaller ring can always resize it without 36381c0fbfa3SMichael S. Tsirkin * help from us (using virtio 1 and up). 36391c0fbfa3SMichael S. Tsirkin */ 36401c0fbfa3SMichael S. Tsirkin if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE || 36411c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE || 36425f997fd1SMichal Privoznik !is_power_of_2(n->net_conf.rx_queue_size)) { 36431c0fbfa3SMichael S. Tsirkin error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), " 36441c0fbfa3SMichael S. Tsirkin "must be a power of 2 between %d and %d.", 36451c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE, 36461c0fbfa3SMichael S. Tsirkin VIRTQUEUE_MAX_SIZE); 36471c0fbfa3SMichael S. Tsirkin virtio_cleanup(vdev); 36481c0fbfa3SMichael S. Tsirkin return; 36491c0fbfa3SMichael S. Tsirkin } 36501c0fbfa3SMichael S. Tsirkin 36519b02e161SWei Wang if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE || 36524271f403SLaurent Vivier n->net_conf.tx_queue_size > virtio_net_max_tx_queue_size(n) || 36539b02e161SWei Wang !is_power_of_2(n->net_conf.tx_queue_size)) { 36549b02e161SWei Wang error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), " 36559b02e161SWei Wang "must be a power of 2 between %d and %d", 36569b02e161SWei Wang n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE, 36574271f403SLaurent Vivier virtio_net_max_tx_queue_size(n)); 36589b02e161SWei Wang virtio_cleanup(vdev); 36599b02e161SWei Wang return; 36609b02e161SWei Wang } 36619b02e161SWei Wang 366222288fe5SJason Wang n->max_ncs = MAX(n->nic_conf.peers.queues, 1); 366322288fe5SJason Wang 366422288fe5SJason Wang /* 366522288fe5SJason Wang * Figure out the datapath queue pairs since the backend could 366622288fe5SJason Wang * provide control queue via peers as well. 366722288fe5SJason Wang */ 366822288fe5SJason Wang if (n->nic_conf.peers.queues) { 366922288fe5SJason Wang for (i = 0; i < n->max_ncs; i++) { 367022288fe5SJason Wang if (n->nic_conf.peers.ncs[i]->is_datapath) { 367122288fe5SJason Wang ++n->max_queue_pairs; 367222288fe5SJason Wang } 367322288fe5SJason Wang } 367422288fe5SJason Wang } 367522288fe5SJason Wang n->max_queue_pairs = MAX(n->max_queue_pairs, 1); 367622288fe5SJason Wang 3677441537f1SJason Wang if (n->max_queue_pairs * 2 + 1 > VIRTIO_QUEUE_MAX) { 367822288fe5SJason Wang error_setg(errp, "Invalid number of queue pairs (= %" PRIu32 "), " 3679631b22eaSStefan Weil "must be a positive integer less than %d.", 3680441537f1SJason Wang n->max_queue_pairs, (VIRTIO_QUEUE_MAX - 1) / 2); 36817e0e736eSJason Wang virtio_cleanup(vdev); 36827e0e736eSJason Wang return; 36837e0e736eSJason Wang } 3684b21e2380SMarkus Armbruster n->vqs = g_new0(VirtIONetQueue, n->max_queue_pairs); 3685441537f1SJason Wang n->curr_queue_pairs = 1; 36861773d9eeSKONRAD Frederic n->tx_timeout = n->net_conf.txtimer; 36876e790746SPaolo Bonzini 36881773d9eeSKONRAD Frederic if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer") 36891773d9eeSKONRAD Frederic && strcmp(n->net_conf.tx, "bh")) { 36900765691eSMarkus Armbruster warn_report("virtio-net: " 36916e790746SPaolo Bonzini "Unknown option tx=%s, valid options: \"timer\" \"bh\"", 36921773d9eeSKONRAD Frederic n->net_conf.tx); 36930765691eSMarkus Armbruster error_printf("Defaulting to \"bh\""); 36946e790746SPaolo Bonzini } 36956e790746SPaolo Bonzini 36962eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n), 36972eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size); 36989b02e161SWei Wang 3699441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3700f9d6dbf0SWen Congyang virtio_net_add_queue(n, i); 3701da51a335SJason Wang } 3702da51a335SJason Wang 370317a0ca55SKONRAD Frederic n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 37041773d9eeSKONRAD Frederic qemu_macaddr_default_if_unset(&n->nic_conf.macaddr); 37051773d9eeSKONRAD Frederic memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac)); 37066e790746SPaolo Bonzini n->status = VIRTIO_NET_S_LINK_UP; 37079d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 37089d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 3709f57fcf70SJason Wang virtio_net_announce_timer, n); 3710b2c929f0SDr. David Alan Gilbert n->announce_timer.round = 0; 37116e790746SPaolo Bonzini 37128a253ec2SKONRAD Frederic if (n->netclient_type) { 37138a253ec2SKONRAD Frederic /* 37148a253ec2SKONRAD Frederic * Happen when virtio_net_set_netclient_name has been called. 37158a253ec2SKONRAD Frederic */ 37168a253ec2SKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 3717*7d0fefdfSAkihiko Odaki n->netclient_type, n->netclient_name, 3718*7d0fefdfSAkihiko Odaki &dev->mem_reentrancy_guard, n); 37198a253ec2SKONRAD Frederic } else { 37201773d9eeSKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 3721*7d0fefdfSAkihiko Odaki object_get_typename(OBJECT(dev)), dev->id, 3722*7d0fefdfSAkihiko Odaki &dev->mem_reentrancy_guard, n); 37238a253ec2SKONRAD Frederic } 37248a253ec2SKONRAD Frederic 3725441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3726d4c62930SBin Meng n->nic->ncs[i].do_not_pad = true; 3727d4c62930SBin Meng } 3728d4c62930SBin Meng 37296e790746SPaolo Bonzini peer_test_vnet_hdr(n); 37306e790746SPaolo Bonzini if (peer_has_vnet_hdr(n)) { 3731441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3732d6085e3aSStefan Hajnoczi qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true); 37336e790746SPaolo Bonzini } 37346e790746SPaolo Bonzini n->host_hdr_len = sizeof(struct virtio_net_hdr); 37356e790746SPaolo Bonzini } else { 37366e790746SPaolo Bonzini n->host_hdr_len = 0; 37376e790746SPaolo Bonzini } 37386e790746SPaolo Bonzini 37391773d9eeSKONRAD Frederic qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a); 37406e790746SPaolo Bonzini 37416e790746SPaolo Bonzini n->vqs[0].tx_waiting = 0; 37421773d9eeSKONRAD Frederic n->tx_burst = n->net_conf.txburst; 3743e22f0603SYuri Benditovich virtio_net_set_mrg_rx_bufs(n, 0, 0, 0); 37446e790746SPaolo Bonzini n->promisc = 1; /* for compatibility */ 37456e790746SPaolo Bonzini 37466e790746SPaolo Bonzini n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 37476e790746SPaolo Bonzini 37486e790746SPaolo Bonzini n->vlans = g_malloc0(MAX_VLAN >> 3); 37496e790746SPaolo Bonzini 3750b1be4280SAmos Kong nc = qemu_get_queue(n->nic); 3751b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 3752b1be4280SAmos Kong 3753e87936eaSCindy Lu if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 3754e87936eaSCindy Lu struct virtio_net_config netcfg = {}; 3755e87936eaSCindy Lu memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN); 3756e87936eaSCindy Lu vhost_net_set_config(get_vhost_net(nc->peer), 3757f8ed3648SManos Pitsidianakis (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_FRONTEND); 3758e87936eaSCindy Lu } 37592974e916SYuri Benditovich QTAILQ_INIT(&n->rsc_chains); 3760284a32f0SAndreas Färber n->qdev = dev; 37614474e37aSYuri Benditovich 3762aac8f89dSAkihiko Odaki net_rx_pkt_init(&n->rx_pkt); 37630145c393SAndrew Melnychenko 37640145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 37650145c393SAndrew Melnychenko virtio_net_load_ebpf(n); 37660145c393SAndrew Melnychenko } 376717ec5a86SKONRAD Frederic } 376817ec5a86SKONRAD Frederic 3769b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev) 377017ec5a86SKONRAD Frederic { 3771306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3772306ec6c3SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3773441537f1SJason Wang int i, max_queue_pairs; 377417ec5a86SKONRAD Frederic 37750145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 37760145c393SAndrew Melnychenko virtio_net_unload_ebpf(n); 37770145c393SAndrew Melnychenko } 37780145c393SAndrew Melnychenko 377917ec5a86SKONRAD Frederic /* This will stop vhost backend if appropriate. */ 378017ec5a86SKONRAD Frederic virtio_net_set_status(vdev, 0); 378117ec5a86SKONRAD Frederic 37828a253ec2SKONRAD Frederic g_free(n->netclient_name); 37838a253ec2SKONRAD Frederic n->netclient_name = NULL; 37848a253ec2SKONRAD Frederic g_free(n->netclient_type); 37858a253ec2SKONRAD Frederic n->netclient_type = NULL; 37868a253ec2SKONRAD Frederic 378717ec5a86SKONRAD Frederic g_free(n->mac_table.macs); 378817ec5a86SKONRAD Frederic g_free(n->vlans); 378917ec5a86SKONRAD Frederic 37909711cd0dSJens Freimann if (n->failover) { 3791f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 379265018100SJuan Quintela device_listener_unregister(&n->primary_listener); 3793d9cda213SSteve Sistare migration_remove_notifier(&n->migration_state); 3794f3558b1bSKevin Wolf } else { 3795f3558b1bSKevin Wolf assert(n->primary_opts == NULL); 37969711cd0dSJens Freimann } 37979711cd0dSJens Freimann 3798441537f1SJason Wang max_queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3799441537f1SJason Wang for (i = 0; i < max_queue_pairs; i++) { 3800f9d6dbf0SWen Congyang virtio_net_del_queue(n, i); 380117ec5a86SKONRAD Frederic } 3802d945d9f1SYuri Benditovich /* delete also control vq */ 3803441537f1SJason Wang virtio_del_queue(vdev, max_queue_pairs * 2); 3804944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 380517ec5a86SKONRAD Frederic g_free(n->vqs); 380617ec5a86SKONRAD Frederic qemu_del_nic(n->nic); 38072974e916SYuri Benditovich virtio_net_rsc_cleanup(n); 380859079029SYuri Benditovich g_free(n->rss_data.indirections_table); 38094474e37aSYuri Benditovich net_rx_pkt_uninit(n->rx_pkt); 38106a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 381117ec5a86SKONRAD Frederic } 381217ec5a86SKONRAD Frederic 381317ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj) 381417ec5a86SKONRAD Frederic { 381517ec5a86SKONRAD Frederic VirtIONet *n = VIRTIO_NET(obj); 381617ec5a86SKONRAD Frederic 381717ec5a86SKONRAD Frederic /* 381817ec5a86SKONRAD Frederic * The default config_size is sizeof(struct virtio_net_config). 38192431f4f1SMichael Tokarev * Can be overridden with virtio_net_set_config_size. 382017ec5a86SKONRAD Frederic */ 382117ec5a86SKONRAD Frederic n->config_size = sizeof(struct virtio_net_config); 3822aa4197c3SGonglei device_add_bootindex_property(obj, &n->nic_conf.bootindex, 3823aa4197c3SGonglei "bootindex", "/ethernet-phy@0", 382440c2281cSMarkus Armbruster DEVICE(n)); 38250145c393SAndrew Melnychenko 38260145c393SAndrew Melnychenko ebpf_rss_init(&n->ebpf_rss); 382717ec5a86SKONRAD Frederic } 382817ec5a86SKONRAD Frederic 382944b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque) 38304d45dcfbSHalil Pasic { 38314d45dcfbSHalil Pasic VirtIONet *n = opaque; 38324d45dcfbSHalil Pasic 38334d45dcfbSHalil Pasic /* At this point, backend must be stopped, otherwise 38344d45dcfbSHalil Pasic * it might keep writing to memory. */ 38354d45dcfbSHalil Pasic assert(!n->vhost_started); 383644b1ff31SDr. David Alan Gilbert 383744b1ff31SDr. David Alan Gilbert return 0; 38384d45dcfbSHalil Pasic } 38394d45dcfbSHalil Pasic 38409711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque) 38419711cd0dSJens Freimann { 38429711cd0dSJens Freimann DeviceState *dev = opaque; 384321e8709bSJuan Quintela DeviceState *primary; 38449711cd0dSJens Freimann VirtIODevice *vdev = VIRTIO_DEVICE(dev); 38459711cd0dSJens Freimann VirtIONet *n = VIRTIO_NET(vdev); 38469711cd0dSJens Freimann 3847284f42a5SJens Freimann if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) { 3848284f42a5SJens Freimann return false; 3849284f42a5SJens Freimann } 385021e8709bSJuan Quintela primary = failover_find_primary_device(n); 385121e8709bSJuan Quintela return primary ? primary->pending_deleted_event : false; 38529711cd0dSJens Freimann } 38539711cd0dSJens Freimann 38549711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque) 38559711cd0dSJens Freimann { 38569711cd0dSJens Freimann DeviceState *dev = opaque; 38579711cd0dSJens Freimann VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev); 38589711cd0dSJens Freimann 38599711cd0dSJens Freimann return vdc->primary_unplug_pending(dev); 38609711cd0dSJens Freimann } 38619711cd0dSJens Freimann 3862c255488dSJonah Palmer static struct vhost_dev *virtio_net_get_vhost(VirtIODevice *vdev) 3863c255488dSJonah Palmer { 3864c255488dSJonah Palmer VirtIONet *n = VIRTIO_NET(vdev); 3865c255488dSJonah Palmer NetClientState *nc = qemu_get_queue(n->nic); 3866c255488dSJonah Palmer struct vhost_net *net = get_vhost_net(nc->peer); 3867c255488dSJonah Palmer return &net->dev; 3868c255488dSJonah Palmer } 3869c255488dSJonah Palmer 38704d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = { 38714d45dcfbSHalil Pasic .name = "virtio-net", 38724d45dcfbSHalil Pasic .minimum_version_id = VIRTIO_NET_VM_VERSION, 38734d45dcfbSHalil Pasic .version_id = VIRTIO_NET_VM_VERSION, 38744d45dcfbSHalil Pasic .fields = (VMStateField[]) { 38754d45dcfbSHalil Pasic VMSTATE_VIRTIO_DEVICE, 38764d45dcfbSHalil Pasic VMSTATE_END_OF_LIST() 38774d45dcfbSHalil Pasic }, 38784d45dcfbSHalil Pasic .pre_save = virtio_net_pre_save, 38799711cd0dSJens Freimann .dev_unplug_pending = dev_unplug_pending, 38804d45dcfbSHalil Pasic }; 3881290c2428SDr. David Alan Gilbert 388217ec5a86SKONRAD Frederic static Property virtio_net_properties[] = { 3883127833eeSJason Baron DEFINE_PROP_BIT64("csum", VirtIONet, host_features, 3884127833eeSJason Baron VIRTIO_NET_F_CSUM, true), 3885127833eeSJason Baron DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features, 388687108bb2SShannon Zhao VIRTIO_NET_F_GUEST_CSUM, true), 3887127833eeSJason Baron DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true), 3888127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features, 388987108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO4, true), 3890127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features, 389187108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO6, true), 3892127833eeSJason Baron DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features, 389387108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ECN, true), 3894127833eeSJason Baron DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features, 389587108bb2SShannon Zhao VIRTIO_NET_F_GUEST_UFO, true), 3896127833eeSJason Baron DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features, 389787108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ANNOUNCE, true), 3898127833eeSJason Baron DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features, 389987108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO4, true), 3900127833eeSJason Baron DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features, 390187108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO6, true), 3902127833eeSJason Baron DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features, 390387108bb2SShannon Zhao VIRTIO_NET_F_HOST_ECN, true), 3904127833eeSJason Baron DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features, 390587108bb2SShannon Zhao VIRTIO_NET_F_HOST_UFO, true), 3906127833eeSJason Baron DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features, 390787108bb2SShannon Zhao VIRTIO_NET_F_MRG_RXBUF, true), 3908127833eeSJason Baron DEFINE_PROP_BIT64("status", VirtIONet, host_features, 390987108bb2SShannon Zhao VIRTIO_NET_F_STATUS, true), 3910127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features, 391187108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VQ, true), 3912127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features, 391387108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX, true), 3914127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features, 391587108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VLAN, true), 3916127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features, 391787108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX_EXTRA, true), 3918127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features, 391987108bb2SShannon Zhao VIRTIO_NET_F_CTRL_MAC_ADDR, true), 3920127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features, 392187108bb2SShannon Zhao VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true), 3922127833eeSJason Baron DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false), 392359079029SYuri Benditovich DEFINE_PROP_BIT64("rss", VirtIONet, host_features, 392459079029SYuri Benditovich VIRTIO_NET_F_RSS, false), 3925e22f0603SYuri Benditovich DEFINE_PROP_BIT64("hash", VirtIONet, host_features, 3926e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT, false), 39272974e916SYuri Benditovich DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features, 39282974e916SYuri Benditovich VIRTIO_NET_F_RSC_EXT, false), 39292974e916SYuri Benditovich DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout, 39302974e916SYuri Benditovich VIRTIO_NET_RSC_DEFAULT_INTERVAL), 393117ec5a86SKONRAD Frederic DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf), 393217ec5a86SKONRAD Frederic DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer, 393317ec5a86SKONRAD Frederic TX_TIMER_INTERVAL), 393417ec5a86SKONRAD Frederic DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST), 393517ec5a86SKONRAD Frederic DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx), 39361c0fbfa3SMichael S. Tsirkin DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size, 39371c0fbfa3SMichael S. Tsirkin VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE), 39389b02e161SWei Wang DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size, 39399b02e161SWei Wang VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE), 3940a93e599dSMaxime Coquelin DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0), 394175ebec11SMaxime Coquelin DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend, 394275ebec11SMaxime Coquelin true), 39439473939eSJason Baron DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN), 39449473939eSJason Baron DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str), 39459711cd0dSJens Freimann DEFINE_PROP_BOOL("failover", VirtIONet, failover, false), 394653da8b5aSYuri Benditovich DEFINE_PROP_BIT64("guest_uso4", VirtIONet, host_features, 394753da8b5aSYuri Benditovich VIRTIO_NET_F_GUEST_USO4, true), 394853da8b5aSYuri Benditovich DEFINE_PROP_BIT64("guest_uso6", VirtIONet, host_features, 394953da8b5aSYuri Benditovich VIRTIO_NET_F_GUEST_USO6, true), 395053da8b5aSYuri Benditovich DEFINE_PROP_BIT64("host_uso", VirtIONet, host_features, 395153da8b5aSYuri Benditovich VIRTIO_NET_F_HOST_USO, true), 395217ec5a86SKONRAD Frederic DEFINE_PROP_END_OF_LIST(), 395317ec5a86SKONRAD Frederic }; 395417ec5a86SKONRAD Frederic 395517ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data) 395617ec5a86SKONRAD Frederic { 395717ec5a86SKONRAD Frederic DeviceClass *dc = DEVICE_CLASS(klass); 395817ec5a86SKONRAD Frederic VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 3959e6f746b3SAndreas Färber 39604f67d30bSMarc-André Lureau device_class_set_props(dc, virtio_net_properties); 3961290c2428SDr. David Alan Gilbert dc->vmsd = &vmstate_virtio_net; 3962125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_NETWORK, dc->categories); 3963e6f746b3SAndreas Färber vdc->realize = virtio_net_device_realize; 3964306ec6c3SAndreas Färber vdc->unrealize = virtio_net_device_unrealize; 396517ec5a86SKONRAD Frederic vdc->get_config = virtio_net_get_config; 396617ec5a86SKONRAD Frederic vdc->set_config = virtio_net_set_config; 396717ec5a86SKONRAD Frederic vdc->get_features = virtio_net_get_features; 396817ec5a86SKONRAD Frederic vdc->set_features = virtio_net_set_features; 396917ec5a86SKONRAD Frederic vdc->bad_features = virtio_net_bad_features; 397017ec5a86SKONRAD Frederic vdc->reset = virtio_net_reset; 39717dc6be52SXuan Zhuo vdc->queue_reset = virtio_net_queue_reset; 39727f863302SKangjie Xu vdc->queue_enable = virtio_net_queue_enable; 397317ec5a86SKONRAD Frederic vdc->set_status = virtio_net_set_status; 397417ec5a86SKONRAD Frederic vdc->guest_notifier_mask = virtio_net_guest_notifier_mask; 397517ec5a86SKONRAD Frederic vdc->guest_notifier_pending = virtio_net_guest_notifier_pending; 39762a083ffdSMichael S. Tsirkin vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO); 39777788c3f2SMikhail Sennikovsky vdc->post_load = virtio_net_post_load_virtio; 3978982b78c5SDr. David Alan Gilbert vdc->vmsd = &vmstate_virtio_net_device; 39799711cd0dSJens Freimann vdc->primary_unplug_pending = primary_unplug_pending; 3980c255488dSJonah Palmer vdc->get_vhost = virtio_net_get_vhost; 3981cd9b8346SViktor Prutyanov vdc->toggle_device_iotlb = vhost_toggle_device_iotlb; 398217ec5a86SKONRAD Frederic } 398317ec5a86SKONRAD Frederic 398417ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = { 398517ec5a86SKONRAD Frederic .name = TYPE_VIRTIO_NET, 398617ec5a86SKONRAD Frederic .parent = TYPE_VIRTIO_DEVICE, 398717ec5a86SKONRAD Frederic .instance_size = sizeof(VirtIONet), 398817ec5a86SKONRAD Frederic .instance_init = virtio_net_instance_init, 398917ec5a86SKONRAD Frederic .class_init = virtio_net_class_init, 399017ec5a86SKONRAD Frederic }; 399117ec5a86SKONRAD Frederic 399217ec5a86SKONRAD Frederic static void virtio_register_types(void) 399317ec5a86SKONRAD Frederic { 399417ec5a86SKONRAD Frederic type_register_static(&virtio_net_info); 399517ec5a86SKONRAD Frederic } 399617ec5a86SKONRAD Frederic 399717ec5a86SKONRAD Frederic type_init(virtio_register_types) 3998