16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Network Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 149b8bfe21SPeter Maydell #include "qemu/osdep.h" 159711cd0dSJens Freimann #include "qemu/atomic.h" 166e790746SPaolo Bonzini #include "qemu/iov.h" 17db725815SMarkus Armbruster #include "qemu/main-loop.h" 180b8fa32fSMarkus Armbruster #include "qemu/module.h" 196e790746SPaolo Bonzini #include "hw/virtio/virtio.h" 206e790746SPaolo Bonzini #include "net/net.h" 216e790746SPaolo Bonzini #include "net/checksum.h" 226e790746SPaolo Bonzini #include "net/tap.h" 236e790746SPaolo Bonzini #include "qemu/error-report.h" 246e790746SPaolo Bonzini #include "qemu/timer.h" 259711cd0dSJens Freimann #include "qemu/option.h" 269711cd0dSJens Freimann #include "qemu/option_int.h" 279711cd0dSJens Freimann #include "qemu/config-file.h" 289711cd0dSJens Freimann #include "qapi/qmp/qdict.h" 296e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h" 306e790746SPaolo Bonzini #include "net/vhost_net.h" 319d8c6a25SDr. David Alan Gilbert #include "net/announce.h" 3217ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h" 33e688df6bSMarkus Armbruster #include "qapi/error.h" 349af23989SMarkus Armbruster #include "qapi/qapi-events-net.h" 35a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h" 369711cd0dSJens Freimann #include "qapi/qapi-types-migration.h" 379711cd0dSJens Freimann #include "qapi/qapi-events-migration.h" 381399c60dSRusty Russell #include "hw/virtio/virtio-access.h" 39f8d806c9SJuan Quintela #include "migration/misc.h" 409473939eSJason Baron #include "standard-headers/linux/ethtool.h" 412f780b6aSMarkus Armbruster #include "sysemu/sysemu.h" 429d8c6a25SDr. David Alan Gilbert #include "trace.h" 439711cd0dSJens Freimann #include "monitor/qdev.h" 449711cd0dSJens Freimann #include "hw/pci/pci.h" 454474e37aSYuri Benditovich #include "net_rx_pkt.h" 46108a6481SCindy Lu #include "hw/virtio/vhost.h" 471b529d90SLaurent Vivier #include "sysemu/qtest.h" 486e790746SPaolo Bonzini 496e790746SPaolo Bonzini #define VIRTIO_NET_VM_VERSION 11 506e790746SPaolo Bonzini 516e790746SPaolo Bonzini #define MAC_TABLE_ENTRIES 64 526e790746SPaolo Bonzini #define MAX_VLAN (1 << 12) /* Per 802.1Q definition */ 536e790746SPaolo Bonzini 541c0fbfa3SMichael S. Tsirkin /* previously fixed value */ 551c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256 569b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256 579b02e161SWei Wang 58441537f1SJason Wang /* for now, only allow larger queue_pairs; with virtio-1, guest can downsize */ 591c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 609b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 611c0fbfa3SMichael S. Tsirkin 622974e916SYuri Benditovich #define VIRTIO_NET_IP4_ADDR_SIZE 8 /* ipv4 saddr + daddr */ 632974e916SYuri Benditovich 642974e916SYuri Benditovich #define VIRTIO_NET_TCP_FLAG 0x3F 652974e916SYuri Benditovich #define VIRTIO_NET_TCP_HDR_LENGTH 0xF000 662974e916SYuri Benditovich 672974e916SYuri Benditovich /* IPv4 max payload, 16 bits in the header */ 682974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header)) 692974e916SYuri Benditovich #define VIRTIO_NET_MAX_TCP_PAYLOAD 65535 702974e916SYuri Benditovich 712974e916SYuri Benditovich /* header length value in ip header without option */ 722974e916SYuri Benditovich #define VIRTIO_NET_IP4_HEADER_LENGTH 5 732974e916SYuri Benditovich 742974e916SYuri Benditovich #define VIRTIO_NET_IP6_ADDR_SIZE 32 /* ipv6 saddr + daddr */ 752974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD 762974e916SYuri Benditovich 772974e916SYuri Benditovich /* Purge coalesced packets timer interval, This value affects the performance 782974e916SYuri Benditovich a lot, and should be tuned carefully, '300000'(300us) is the recommended 792974e916SYuri Benditovich value to pass the WHQL test, '50000' can gain 2x netperf throughput with 802974e916SYuri Benditovich tso/gso/gro 'off'. */ 812974e916SYuri Benditovich #define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000 822974e916SYuri Benditovich 8359079029SYuri Benditovich #define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \ 8459079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \ 8559079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \ 8659079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \ 8759079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \ 8859079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \ 8959079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \ 9059079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \ 9159079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) 9259079029SYuri Benditovich 93ad6461adSPhilippe Mathieu-Daudé static const VirtIOFeature feature_sizes[] = { 94127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MAC, 955d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mac)}, 96127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_STATUS, 975d5b33c0SMax Reitz .end = endof(struct virtio_net_config, status)}, 98127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MQ, 995d5b33c0SMax Reitz .end = endof(struct virtio_net_config, max_virtqueue_pairs)}, 100127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MTU, 1015d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mtu)}, 1029473939eSJason Baron {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX, 1035d5b33c0SMax Reitz .end = endof(struct virtio_net_config, duplex)}, 104e22f0603SYuri Benditovich {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT), 10559079029SYuri Benditovich .end = endof(struct virtio_net_config, supported_hash_types)}, 1066e790746SPaolo Bonzini {} 1076e790746SPaolo Bonzini }; 1086e790746SPaolo Bonzini 1096e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc) 1106e790746SPaolo Bonzini { 1116e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1126e790746SPaolo Bonzini 1136e790746SPaolo Bonzini return &n->vqs[nc->queue_index]; 1146e790746SPaolo Bonzini } 1156e790746SPaolo Bonzini 1166e790746SPaolo Bonzini static int vq2q(int queue_index) 1176e790746SPaolo Bonzini { 1186e790746SPaolo Bonzini return queue_index / 2; 1196e790746SPaolo Bonzini } 1206e790746SPaolo Bonzini 1216e790746SPaolo Bonzini /* TODO 1226e790746SPaolo Bonzini * - we could suppress RX interrupt if we were so inclined. 1236e790746SPaolo Bonzini */ 1246e790746SPaolo Bonzini 1256e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config) 1266e790746SPaolo Bonzini { 12717a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1286e790746SPaolo Bonzini struct virtio_net_config netcfg; 129c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 130fb592882SCindy Lu static const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } }; 1316e790746SPaolo Bonzini 132108a6481SCindy Lu int ret = 0; 133108a6481SCindy Lu memset(&netcfg, 0 , sizeof(struct virtio_net_config)); 1341399c60dSRusty Russell virtio_stw_p(vdev, &netcfg.status, n->status); 135441537f1SJason Wang virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queue_pairs); 136a93e599dSMaxime Coquelin virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu); 1376e790746SPaolo Bonzini memcpy(netcfg.mac, n->mac, ETH_ALEN); 1389473939eSJason Baron virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed); 1399473939eSJason Baron netcfg.duplex = n->net_conf.duplex; 14059079029SYuri Benditovich netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE; 14159079029SYuri Benditovich virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length, 142e22f0603SYuri Benditovich virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ? 143e22f0603SYuri Benditovich VIRTIO_NET_RSS_MAX_TABLE_LEN : 1); 14459079029SYuri Benditovich virtio_stl_p(vdev, &netcfg.supported_hash_types, 14559079029SYuri Benditovich VIRTIO_NET_RSS_SUPPORTED_HASHES); 1466e790746SPaolo Bonzini memcpy(config, &netcfg, n->config_size); 147108a6481SCindy Lu 148c546ecf2SJason Wang /* 149c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 150c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 151c546ecf2SJason Wang */ 152c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 153108a6481SCindy Lu ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg, 154108a6481SCindy Lu n->config_size); 155108a6481SCindy Lu if (ret != -1) { 156fb592882SCindy Lu /* 157fb592882SCindy Lu * Some NIC/kernel combinations present 0 as the mac address. As 158fb592882SCindy Lu * that is not a legal address, try to proceed with the 159fb592882SCindy Lu * address from the QEMU command line in the hope that the 160fb592882SCindy Lu * address has been configured correctly elsewhere - just not 161fb592882SCindy Lu * reported by the device. 162fb592882SCindy Lu */ 163fb592882SCindy Lu if (memcmp(&netcfg.mac, &zero, sizeof(zero)) == 0) { 164fb592882SCindy Lu info_report("Zero hardware mac address detected. Ignoring."); 165fb592882SCindy Lu memcpy(netcfg.mac, n->mac, ETH_ALEN); 166fb592882SCindy Lu } 167108a6481SCindy Lu memcpy(config, &netcfg, n->config_size); 168108a6481SCindy Lu } 169108a6481SCindy Lu } 1706e790746SPaolo Bonzini } 1716e790746SPaolo Bonzini 1726e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config) 1736e790746SPaolo Bonzini { 17417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1756e790746SPaolo Bonzini struct virtio_net_config netcfg = {}; 176c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 1776e790746SPaolo Bonzini 1786e790746SPaolo Bonzini memcpy(&netcfg, config, n->config_size); 1796e790746SPaolo Bonzini 18095129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) && 18195129d6fSCornelia Huck !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) && 1826e790746SPaolo Bonzini memcmp(netcfg.mac, n->mac, ETH_ALEN)) { 1836e790746SPaolo Bonzini memcpy(n->mac, netcfg.mac, ETH_ALEN); 1846e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 1856e790746SPaolo Bonzini } 186108a6481SCindy Lu 187c546ecf2SJason Wang /* 188c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 189c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 190c546ecf2SJason Wang */ 191c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 192c546ecf2SJason Wang vhost_net_set_config(get_vhost_net(nc->peer), 193c546ecf2SJason Wang (uint8_t *)&netcfg, 0, n->config_size, 194108a6481SCindy Lu VHOST_SET_CONFIG_TYPE_MASTER); 195108a6481SCindy Lu } 1966e790746SPaolo Bonzini } 1976e790746SPaolo Bonzini 1986e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status) 1996e790746SPaolo Bonzini { 20017a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2016e790746SPaolo Bonzini return (status & VIRTIO_CONFIG_S_DRIVER_OK) && 20217a0ca55SKONRAD Frederic (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running; 2036e790746SPaolo Bonzini } 2046e790746SPaolo Bonzini 205b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net) 206b2c929f0SDr. David Alan Gilbert { 207b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(net); 208b2c929f0SDr. David Alan Gilbert trace_virtio_net_announce_notify(); 209b2c929f0SDr. David Alan Gilbert 210b2c929f0SDr. David Alan Gilbert net->status |= VIRTIO_NET_S_ANNOUNCE; 211b2c929f0SDr. David Alan Gilbert virtio_notify_config(vdev); 212b2c929f0SDr. David Alan Gilbert } 213b2c929f0SDr. David Alan Gilbert 214f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque) 215f57fcf70SJason Wang { 216f57fcf70SJason Wang VirtIONet *n = opaque; 2179d8c6a25SDr. David Alan Gilbert trace_virtio_net_announce_timer(n->announce_timer.round); 218f57fcf70SJason Wang 2199d8c6a25SDr. David Alan Gilbert n->announce_timer.round--; 220b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 221b2c929f0SDr. David Alan Gilbert } 222b2c929f0SDr. David Alan Gilbert 223b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc) 224b2c929f0SDr. David Alan Gilbert { 225b2c929f0SDr. David Alan Gilbert VirtIONet *n = qemu_get_nic_opaque(nc); 226b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 227b2c929f0SDr. David Alan Gilbert 228b2c929f0SDr. David Alan Gilbert /* 229b2c929f0SDr. David Alan Gilbert * Make sure the virtio migration announcement timer isn't running 230b2c929f0SDr. David Alan Gilbert * If it is, let it trigger announcement so that we do not cause 231b2c929f0SDr. David Alan Gilbert * confusion. 232b2c929f0SDr. David Alan Gilbert */ 233b2c929f0SDr. David Alan Gilbert if (n->announce_timer.round) { 234b2c929f0SDr. David Alan Gilbert return; 235b2c929f0SDr. David Alan Gilbert } 236b2c929f0SDr. David Alan Gilbert 237b2c929f0SDr. David Alan Gilbert if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 238b2c929f0SDr. David Alan Gilbert virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 239b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 240b2c929f0SDr. David Alan Gilbert } 241f57fcf70SJason Wang } 242f57fcf70SJason Wang 2436e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status) 2446e790746SPaolo Bonzini { 24517a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2466e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 247441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 24822288fe5SJason Wang int cvq = n->max_ncs - n->max_queue_pairs; 2496e790746SPaolo Bonzini 250ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 2516e790746SPaolo Bonzini return; 2526e790746SPaolo Bonzini } 2536e790746SPaolo Bonzini 2548c1ac475SRadim Krčmář if ((virtio_net_started(n, status) && !nc->peer->link_down) == 2558c1ac475SRadim Krčmář !!n->vhost_started) { 2566e790746SPaolo Bonzini return; 2576e790746SPaolo Bonzini } 2586e790746SPaolo Bonzini if (!n->vhost_started) { 259086abc1cSMichael S. Tsirkin int r, i; 260086abc1cSMichael S. Tsirkin 2611bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 2621bfa316cSGreg Kurz error_report("backend does not support %s vnet headers; " 2631bfa316cSGreg Kurz "falling back on userspace virtio", 2641bfa316cSGreg Kurz virtio_is_big_endian(vdev) ? "BE" : "LE"); 2651bfa316cSGreg Kurz return; 2661bfa316cSGreg Kurz } 2671bfa316cSGreg Kurz 268086abc1cSMichael S. Tsirkin /* Any packets outstanding? Purge them to avoid touching rings 269086abc1cSMichael S. Tsirkin * when vhost is running. 270086abc1cSMichael S. Tsirkin */ 271441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 272086abc1cSMichael S. Tsirkin NetClientState *qnc = qemu_get_subqueue(n->nic, i); 273086abc1cSMichael S. Tsirkin 274086abc1cSMichael S. Tsirkin /* Purge both directions: TX and RX. */ 275086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->peer->incoming_queue, qnc); 276086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->incoming_queue, qnc->peer); 277086abc1cSMichael S. Tsirkin } 278086abc1cSMichael S. Tsirkin 279a93e599dSMaxime Coquelin if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) { 280a93e599dSMaxime Coquelin r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu); 281a93e599dSMaxime Coquelin if (r < 0) { 282a93e599dSMaxime Coquelin error_report("%uBytes MTU not supported by the backend", 283a93e599dSMaxime Coquelin n->net_conf.mtu); 284a93e599dSMaxime Coquelin 285a93e599dSMaxime Coquelin return; 286a93e599dSMaxime Coquelin } 287a93e599dSMaxime Coquelin } 288a93e599dSMaxime Coquelin 2896e790746SPaolo Bonzini n->vhost_started = 1; 29022288fe5SJason Wang r = vhost_net_start(vdev, n->nic->ncs, queue_pairs, cvq); 2916e790746SPaolo Bonzini if (r < 0) { 2926e790746SPaolo Bonzini error_report("unable to start vhost net: %d: " 2936e790746SPaolo Bonzini "falling back on userspace virtio", -r); 2946e790746SPaolo Bonzini n->vhost_started = 0; 2956e790746SPaolo Bonzini } 2966e790746SPaolo Bonzini } else { 29722288fe5SJason Wang vhost_net_stop(vdev, n->nic->ncs, queue_pairs, cvq); 2986e790746SPaolo Bonzini n->vhost_started = 0; 2996e790746SPaolo Bonzini } 3006e790746SPaolo Bonzini } 3016e790746SPaolo Bonzini 3021bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev, 3031bfa316cSGreg Kurz NetClientState *peer, 3041bfa316cSGreg Kurz bool enable) 3051bfa316cSGreg Kurz { 3061bfa316cSGreg Kurz if (virtio_is_big_endian(vdev)) { 3071bfa316cSGreg Kurz return qemu_set_vnet_be(peer, enable); 3081bfa316cSGreg Kurz } else { 3091bfa316cSGreg Kurz return qemu_set_vnet_le(peer, enable); 3101bfa316cSGreg Kurz } 3111bfa316cSGreg Kurz } 3121bfa316cSGreg Kurz 3131bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs, 314441537f1SJason Wang int queue_pairs, bool enable) 3151bfa316cSGreg Kurz { 3161bfa316cSGreg Kurz int i; 3171bfa316cSGreg Kurz 318441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 3191bfa316cSGreg Kurz if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 && 3201bfa316cSGreg Kurz enable) { 3211bfa316cSGreg Kurz while (--i >= 0) { 3221bfa316cSGreg Kurz virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false); 3231bfa316cSGreg Kurz } 3241bfa316cSGreg Kurz 3251bfa316cSGreg Kurz return true; 3261bfa316cSGreg Kurz } 3271bfa316cSGreg Kurz } 3281bfa316cSGreg Kurz 3291bfa316cSGreg Kurz return false; 3301bfa316cSGreg Kurz } 3311bfa316cSGreg Kurz 3321bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status) 3331bfa316cSGreg Kurz { 3341bfa316cSGreg Kurz VirtIODevice *vdev = VIRTIO_DEVICE(n); 335441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3361bfa316cSGreg Kurz 3371bfa316cSGreg Kurz if (virtio_net_started(n, status)) { 3381bfa316cSGreg Kurz /* Before using the device, we tell the network backend about the 3391bfa316cSGreg Kurz * endianness to use when parsing vnet headers. If the backend 3401bfa316cSGreg Kurz * can't do it, we fallback onto fixing the headers in the core 3411bfa316cSGreg Kurz * virtio-net code. 3421bfa316cSGreg Kurz */ 3431bfa316cSGreg Kurz n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs, 344441537f1SJason Wang queue_pairs, true); 3451bfa316cSGreg Kurz } else if (virtio_net_started(n, vdev->status)) { 3461bfa316cSGreg Kurz /* After using the device, we need to reset the network backend to 3471bfa316cSGreg Kurz * the default (guest native endianness), otherwise the guest may 3481bfa316cSGreg Kurz * lose network connectivity if it is rebooted into a different 3491bfa316cSGreg Kurz * endianness. 3501bfa316cSGreg Kurz */ 351441537f1SJason Wang virtio_net_set_vnet_endian(vdev, n->nic->ncs, queue_pairs, false); 3521bfa316cSGreg Kurz } 3531bfa316cSGreg Kurz } 3541bfa316cSGreg Kurz 355283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq) 356283e2c2aSYuri Benditovich { 357283e2c2aSYuri Benditovich unsigned int dropped = virtqueue_drop_all(vq); 358283e2c2aSYuri Benditovich if (dropped) { 359283e2c2aSYuri Benditovich virtio_notify(vdev, vq); 360283e2c2aSYuri Benditovich } 361283e2c2aSYuri Benditovich } 362283e2c2aSYuri Benditovich 3636e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status) 3646e790746SPaolo Bonzini { 36517a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 3666e790746SPaolo Bonzini VirtIONetQueue *q; 3676e790746SPaolo Bonzini int i; 3686e790746SPaolo Bonzini uint8_t queue_status; 3696e790746SPaolo Bonzini 3701bfa316cSGreg Kurz virtio_net_vnet_endian_status(n, status); 3716e790746SPaolo Bonzini virtio_net_vhost_status(n, status); 3726e790746SPaolo Bonzini 373441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 37438705bb5SFam Zheng NetClientState *ncs = qemu_get_subqueue(n->nic, i); 37538705bb5SFam Zheng bool queue_started; 3766e790746SPaolo Bonzini q = &n->vqs[i]; 3776e790746SPaolo Bonzini 378441537f1SJason Wang if ((!n->multiqueue && i != 0) || i >= n->curr_queue_pairs) { 3796e790746SPaolo Bonzini queue_status = 0; 3806e790746SPaolo Bonzini } else { 3816e790746SPaolo Bonzini queue_status = status; 3826e790746SPaolo Bonzini } 38338705bb5SFam Zheng queue_started = 38438705bb5SFam Zheng virtio_net_started(n, queue_status) && !n->vhost_started; 38538705bb5SFam Zheng 38638705bb5SFam Zheng if (queue_started) { 38738705bb5SFam Zheng qemu_flush_queued_packets(ncs); 38838705bb5SFam Zheng } 3896e790746SPaolo Bonzini 3906e790746SPaolo Bonzini if (!q->tx_waiting) { 3916e790746SPaolo Bonzini continue; 3926e790746SPaolo Bonzini } 3936e790746SPaolo Bonzini 39438705bb5SFam Zheng if (queue_started) { 3956e790746SPaolo Bonzini if (q->tx_timer) { 396bc72ad67SAlex Bligh timer_mod(q->tx_timer, 397bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 3986e790746SPaolo Bonzini } else { 3996e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 4006e790746SPaolo Bonzini } 4016e790746SPaolo Bonzini } else { 4026e790746SPaolo Bonzini if (q->tx_timer) { 403bc72ad67SAlex Bligh timer_del(q->tx_timer); 4046e790746SPaolo Bonzini } else { 4056e790746SPaolo Bonzini qemu_bh_cancel(q->tx_bh); 4066e790746SPaolo Bonzini } 407283e2c2aSYuri Benditovich if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 && 40870e53e6eSJason Wang (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) && 40970e53e6eSJason Wang vdev->vm_running) { 410283e2c2aSYuri Benditovich /* if tx is waiting we are likely have some packets in tx queue 411283e2c2aSYuri Benditovich * and disabled notification */ 412283e2c2aSYuri Benditovich q->tx_waiting = 0; 413283e2c2aSYuri Benditovich virtio_queue_set_notification(q->tx_vq, 1); 414283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, q->tx_vq); 415283e2c2aSYuri Benditovich } 4166e790746SPaolo Bonzini } 4176e790746SPaolo Bonzini } 4186e790746SPaolo Bonzini } 4196e790746SPaolo Bonzini 4206e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc) 4216e790746SPaolo Bonzini { 4226e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 42317a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 4246e790746SPaolo Bonzini uint16_t old_status = n->status; 4256e790746SPaolo Bonzini 4266e790746SPaolo Bonzini if (nc->link_down) 4276e790746SPaolo Bonzini n->status &= ~VIRTIO_NET_S_LINK_UP; 4286e790746SPaolo Bonzini else 4296e790746SPaolo Bonzini n->status |= VIRTIO_NET_S_LINK_UP; 4306e790746SPaolo Bonzini 4316e790746SPaolo Bonzini if (n->status != old_status) 43217a0ca55SKONRAD Frederic virtio_notify_config(vdev); 4336e790746SPaolo Bonzini 43417a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 4356e790746SPaolo Bonzini } 4366e790746SPaolo Bonzini 437b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc) 438b1be4280SAmos Kong { 439b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 440b1be4280SAmos Kong 441b1be4280SAmos Kong if (nc->rxfilter_notify_enabled) { 442ddfb0baaSMarkus Armbruster char *path = object_get_canonical_path(OBJECT(n->qdev)); 44306150279SWenchao Xia qapi_event_send_nic_rx_filter_changed(!!n->netclient_name, 4443ab72385SPeter Xu n->netclient_name, path); 44596e35046SAmos Kong g_free(path); 446b1be4280SAmos Kong 447b1be4280SAmos Kong /* disable event notification to avoid events flooding */ 448b1be4280SAmos Kong nc->rxfilter_notify_enabled = 0; 449b1be4280SAmos Kong } 450b1be4280SAmos Kong } 451b1be4280SAmos Kong 452f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n) 453f7bc8ef8SAmos Kong { 45454aa3de7SEric Blake intList *list; 455f7bc8ef8SAmos Kong int i, j; 456f7bc8ef8SAmos Kong 457f7bc8ef8SAmos Kong list = NULL; 458f7bc8ef8SAmos Kong for (i = 0; i < MAX_VLAN >> 5; i++) { 459f7bc8ef8SAmos Kong for (j = 0; n->vlans[i] && j <= 0x1f; j++) { 460f7bc8ef8SAmos Kong if (n->vlans[i] & (1U << j)) { 46154aa3de7SEric Blake QAPI_LIST_PREPEND(list, (i << 5) + j); 462f7bc8ef8SAmos Kong } 463f7bc8ef8SAmos Kong } 464f7bc8ef8SAmos Kong } 465f7bc8ef8SAmos Kong 466f7bc8ef8SAmos Kong return list; 467f7bc8ef8SAmos Kong } 468f7bc8ef8SAmos Kong 469b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc) 470b1be4280SAmos Kong { 471b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 472f7bc8ef8SAmos Kong VirtIODevice *vdev = VIRTIO_DEVICE(n); 473b1be4280SAmos Kong RxFilterInfo *info; 47454aa3de7SEric Blake strList *str_list; 475f7bc8ef8SAmos Kong int i; 476b1be4280SAmos Kong 477b1be4280SAmos Kong info = g_malloc0(sizeof(*info)); 478b1be4280SAmos Kong info->name = g_strdup(nc->name); 479b1be4280SAmos Kong info->promiscuous = n->promisc; 480b1be4280SAmos Kong 481b1be4280SAmos Kong if (n->nouni) { 482b1be4280SAmos Kong info->unicast = RX_STATE_NONE; 483b1be4280SAmos Kong } else if (n->alluni) { 484b1be4280SAmos Kong info->unicast = RX_STATE_ALL; 485b1be4280SAmos Kong } else { 486b1be4280SAmos Kong info->unicast = RX_STATE_NORMAL; 487b1be4280SAmos Kong } 488b1be4280SAmos Kong 489b1be4280SAmos Kong if (n->nomulti) { 490b1be4280SAmos Kong info->multicast = RX_STATE_NONE; 491b1be4280SAmos Kong } else if (n->allmulti) { 492b1be4280SAmos Kong info->multicast = RX_STATE_ALL; 493b1be4280SAmos Kong } else { 494b1be4280SAmos Kong info->multicast = RX_STATE_NORMAL; 495b1be4280SAmos Kong } 496b1be4280SAmos Kong 497b1be4280SAmos Kong info->broadcast_allowed = n->nobcast; 498b1be4280SAmos Kong info->multicast_overflow = n->mac_table.multi_overflow; 499b1be4280SAmos Kong info->unicast_overflow = n->mac_table.uni_overflow; 500b1be4280SAmos Kong 501b0575ba4SScott Feldman info->main_mac = qemu_mac_strdup_printf(n->mac); 502b1be4280SAmos Kong 503b1be4280SAmos Kong str_list = NULL; 504b1be4280SAmos Kong for (i = 0; i < n->mac_table.first_multi; i++) { 50554aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 50654aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 507b1be4280SAmos Kong } 508b1be4280SAmos Kong info->unicast_table = str_list; 509b1be4280SAmos Kong 510b1be4280SAmos Kong str_list = NULL; 511b1be4280SAmos Kong for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 51254aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 51354aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 514b1be4280SAmos Kong } 515b1be4280SAmos Kong info->multicast_table = str_list; 516f7bc8ef8SAmos Kong info->vlan_table = get_vlan_table(n); 517b1be4280SAmos Kong 51895129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) { 519f7bc8ef8SAmos Kong info->vlan = RX_STATE_ALL; 520f7bc8ef8SAmos Kong } else if (!info->vlan_table) { 521f7bc8ef8SAmos Kong info->vlan = RX_STATE_NONE; 522f7bc8ef8SAmos Kong } else { 523f7bc8ef8SAmos Kong info->vlan = RX_STATE_NORMAL; 524b1be4280SAmos Kong } 525b1be4280SAmos Kong 526b1be4280SAmos Kong /* enable event notification after query */ 527b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 528b1be4280SAmos Kong 529b1be4280SAmos Kong return info; 530b1be4280SAmos Kong } 531b1be4280SAmos Kong 5326e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev) 5336e790746SPaolo Bonzini { 53417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 53594b52958SGreg Kurz int i; 5366e790746SPaolo Bonzini 5376e790746SPaolo Bonzini /* Reset back to compatibility mode */ 5386e790746SPaolo Bonzini n->promisc = 1; 5396e790746SPaolo Bonzini n->allmulti = 0; 5406e790746SPaolo Bonzini n->alluni = 0; 5416e790746SPaolo Bonzini n->nomulti = 0; 5426e790746SPaolo Bonzini n->nouni = 0; 5436e790746SPaolo Bonzini n->nobcast = 0; 5446e790746SPaolo Bonzini /* multiqueue is disabled by default */ 545441537f1SJason Wang n->curr_queue_pairs = 1; 5469d8c6a25SDr. David Alan Gilbert timer_del(n->announce_timer.tm); 5479d8c6a25SDr. David Alan Gilbert n->announce_timer.round = 0; 548f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 5496e790746SPaolo Bonzini 5506e790746SPaolo Bonzini /* Flush any MAC and VLAN filter table state */ 5516e790746SPaolo Bonzini n->mac_table.in_use = 0; 5526e790746SPaolo Bonzini n->mac_table.first_multi = 0; 5536e790746SPaolo Bonzini n->mac_table.multi_overflow = 0; 5546e790746SPaolo Bonzini n->mac_table.uni_overflow = 0; 5556e790746SPaolo Bonzini memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN); 5566e790746SPaolo Bonzini memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac)); 557702d66a8SMichael S. Tsirkin qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 5586e790746SPaolo Bonzini memset(n->vlans, 0, MAX_VLAN >> 3); 55994b52958SGreg Kurz 56094b52958SGreg Kurz /* Flush any async TX */ 561441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 56294b52958SGreg Kurz NetClientState *nc = qemu_get_subqueue(n->nic, i); 56394b52958SGreg Kurz 56494b52958SGreg Kurz if (nc->peer) { 56594b52958SGreg Kurz qemu_flush_or_purge_queued_packets(nc->peer, true); 56694b52958SGreg Kurz assert(!virtio_net_get_subqueue(nc)->async_tx.elem); 56794b52958SGreg Kurz } 56894b52958SGreg Kurz } 5696e790746SPaolo Bonzini } 5706e790746SPaolo Bonzini 5716e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n) 5726e790746SPaolo Bonzini { 5736e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 5746e790746SPaolo Bonzini if (!nc->peer) { 5756e790746SPaolo Bonzini return; 5766e790746SPaolo Bonzini } 5776e790746SPaolo Bonzini 578d6085e3aSStefan Hajnoczi n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer); 5796e790746SPaolo Bonzini } 5806e790746SPaolo Bonzini 5816e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n) 5826e790746SPaolo Bonzini { 5836e790746SPaolo Bonzini return n->has_vnet_hdr; 5846e790746SPaolo Bonzini } 5856e790746SPaolo Bonzini 5866e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n) 5876e790746SPaolo Bonzini { 5886e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) 5896e790746SPaolo Bonzini return 0; 5906e790746SPaolo Bonzini 591d6085e3aSStefan Hajnoczi n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer); 5926e790746SPaolo Bonzini 5936e790746SPaolo Bonzini return n->has_ufo; 5946e790746SPaolo Bonzini } 5956e790746SPaolo Bonzini 596bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs, 597e22f0603SYuri Benditovich int version_1, int hash_report) 5986e790746SPaolo Bonzini { 5996e790746SPaolo Bonzini int i; 6006e790746SPaolo Bonzini NetClientState *nc; 6016e790746SPaolo Bonzini 6026e790746SPaolo Bonzini n->mergeable_rx_bufs = mergeable_rx_bufs; 6036e790746SPaolo Bonzini 604bb9d17f8SCornelia Huck if (version_1) { 605e22f0603SYuri Benditovich n->guest_hdr_len = hash_report ? 606e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_v1_hash) : 607e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_mrg_rxbuf); 608e22f0603SYuri Benditovich n->rss_data.populate_hash = !!hash_report; 609bb9d17f8SCornelia Huck } else { 6106e790746SPaolo Bonzini n->guest_hdr_len = n->mergeable_rx_bufs ? 611bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr_mrg_rxbuf) : 612bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr); 613bb9d17f8SCornelia Huck } 6146e790746SPaolo Bonzini 615441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 6166e790746SPaolo Bonzini nc = qemu_get_subqueue(n->nic, i); 6176e790746SPaolo Bonzini 6186e790746SPaolo Bonzini if (peer_has_vnet_hdr(n) && 619d6085e3aSStefan Hajnoczi qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) { 620d6085e3aSStefan Hajnoczi qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len); 6216e790746SPaolo Bonzini n->host_hdr_len = n->guest_hdr_len; 6226e790746SPaolo Bonzini } 6236e790746SPaolo Bonzini } 6246e790746SPaolo Bonzini } 6256e790746SPaolo Bonzini 6262eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n) 6272eef278bSMichael S. Tsirkin { 6282eef278bSMichael S. Tsirkin NetClientState *peer = n->nic_conf.peers.ncs[0]; 6292eef278bSMichael S. Tsirkin 6302eef278bSMichael S. Tsirkin /* 631*0ea5778fSEugenio Pérez * Backends other than vhost-user or vhost-vdpa don't support max queue 632*0ea5778fSEugenio Pérez * size. 6332eef278bSMichael S. Tsirkin */ 6342eef278bSMichael S. Tsirkin if (!peer) { 6352eef278bSMichael S. Tsirkin return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 6362eef278bSMichael S. Tsirkin } 6372eef278bSMichael S. Tsirkin 638*0ea5778fSEugenio Pérez switch(peer->info->type) { 639*0ea5778fSEugenio Pérez case NET_CLIENT_DRIVER_VHOST_USER: 640*0ea5778fSEugenio Pérez case NET_CLIENT_DRIVER_VHOST_VDPA: 6412eef278bSMichael S. Tsirkin return VIRTQUEUE_MAX_SIZE; 642*0ea5778fSEugenio Pérez default: 643*0ea5778fSEugenio Pérez return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 644*0ea5778fSEugenio Pérez }; 6452eef278bSMichael S. Tsirkin } 6462eef278bSMichael S. Tsirkin 6476e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index) 6486e790746SPaolo Bonzini { 6496e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 6506e790746SPaolo Bonzini 6516e790746SPaolo Bonzini if (!nc->peer) { 6526e790746SPaolo Bonzini return 0; 6536e790746SPaolo Bonzini } 6546e790746SPaolo Bonzini 655f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 6567263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 1); 6577263a0adSChangchun Ouyang } 6587263a0adSChangchun Ouyang 659f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 6606e790746SPaolo Bonzini return 0; 6616e790746SPaolo Bonzini } 6626e790746SPaolo Bonzini 663441537f1SJason Wang if (n->max_queue_pairs == 1) { 6641074b879SJason Wang return 0; 6651074b879SJason Wang } 6661074b879SJason Wang 6676e790746SPaolo Bonzini return tap_enable(nc->peer); 6686e790746SPaolo Bonzini } 6696e790746SPaolo Bonzini 6706e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index) 6716e790746SPaolo Bonzini { 6726e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 6736e790746SPaolo Bonzini 6746e790746SPaolo Bonzini if (!nc->peer) { 6756e790746SPaolo Bonzini return 0; 6766e790746SPaolo Bonzini } 6776e790746SPaolo Bonzini 678f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 6797263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 0); 6807263a0adSChangchun Ouyang } 6817263a0adSChangchun Ouyang 682f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 6836e790746SPaolo Bonzini return 0; 6846e790746SPaolo Bonzini } 6856e790746SPaolo Bonzini 6866e790746SPaolo Bonzini return tap_disable(nc->peer); 6876e790746SPaolo Bonzini } 6886e790746SPaolo Bonzini 689441537f1SJason Wang static void virtio_net_set_queue_pairs(VirtIONet *n) 6906e790746SPaolo Bonzini { 6916e790746SPaolo Bonzini int i; 692ddfa83eaSJoel Stanley int r; 6936e790746SPaolo Bonzini 69468b5f314SYuri Benditovich if (n->nic->peer_deleted) { 69568b5f314SYuri Benditovich return; 69668b5f314SYuri Benditovich } 69768b5f314SYuri Benditovich 698441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 699441537f1SJason Wang if (i < n->curr_queue_pairs) { 700ddfa83eaSJoel Stanley r = peer_attach(n, i); 701ddfa83eaSJoel Stanley assert(!r); 7026e790746SPaolo Bonzini } else { 703ddfa83eaSJoel Stanley r = peer_detach(n, i); 704ddfa83eaSJoel Stanley assert(!r); 7056e790746SPaolo Bonzini } 7066e790746SPaolo Bonzini } 7076e790746SPaolo Bonzini } 7086e790746SPaolo Bonzini 709ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue); 7106e790746SPaolo Bonzini 7119d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features, 7129d5b731dSJason Wang Error **errp) 7136e790746SPaolo Bonzini { 71417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 7156e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 7166e790746SPaolo Bonzini 717da3e8a23SShannon Zhao /* Firstly sync all virtio-net possible supported features */ 718da3e8a23SShannon Zhao features |= n->host_features; 719da3e8a23SShannon Zhao 7200cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 7216e790746SPaolo Bonzini 7226e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) { 7230cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_CSUM); 7240cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4); 7250cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6); 7260cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN); 7276e790746SPaolo Bonzini 7280cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM); 7290cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4); 7300cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6); 7310cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN); 732e22f0603SYuri Benditovich 733e22f0603SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT); 7346e790746SPaolo Bonzini } 7356e790746SPaolo Bonzini 7366e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) { 7370cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO); 7380cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO); 7396e790746SPaolo Bonzini } 7406e790746SPaolo Bonzini 741ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 7426e790746SPaolo Bonzini return features; 7436e790746SPaolo Bonzini } 7442974e916SYuri Benditovich 7450145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 74659079029SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_RSS); 7470145c393SAndrew Melnychenko } 74875ebec11SMaxime Coquelin features = vhost_net_get_features(get_vhost_net(nc->peer), features); 74975ebec11SMaxime Coquelin vdev->backend_features = features; 75075ebec11SMaxime Coquelin 75175ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 75275ebec11SMaxime Coquelin (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) { 75375ebec11SMaxime Coquelin features |= (1ULL << VIRTIO_NET_F_MTU); 75475ebec11SMaxime Coquelin } 75575ebec11SMaxime Coquelin 75675ebec11SMaxime Coquelin return features; 7576e790746SPaolo Bonzini } 7586e790746SPaolo Bonzini 759019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev) 7606e790746SPaolo Bonzini { 761019a3edbSGerd Hoffmann uint64_t features = 0; 7626e790746SPaolo Bonzini 7636e790746SPaolo Bonzini /* Linux kernel 2.6.25. It understood MAC (as everyone must), 7646e790746SPaolo Bonzini * but also these: */ 7650cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 7660cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_CSUM); 7670cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4); 7680cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6); 7690cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN); 7706e790746SPaolo Bonzini 7716e790746SPaolo Bonzini return features; 7726e790746SPaolo Bonzini } 7736e790746SPaolo Bonzini 774644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n) 775644c9858SDmitry Fleytman { 776ad37bb3bSStefan Hajnoczi qemu_set_offload(qemu_get_queue(n->nic)->peer, 777644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)), 778644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)), 779644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)), 780644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)), 781644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO))); 782644c9858SDmitry Fleytman } 783644c9858SDmitry Fleytman 784644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features) 785644c9858SDmitry Fleytman { 786644c9858SDmitry Fleytman static const uint64_t guest_offloads_mask = 787644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_CSUM) | 788644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO4) | 789644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO6) | 790644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_ECN) | 791644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_UFO); 792644c9858SDmitry Fleytman 793644c9858SDmitry Fleytman return guest_offloads_mask & features; 794644c9858SDmitry Fleytman } 795644c9858SDmitry Fleytman 796644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n) 797644c9858SDmitry Fleytman { 798644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 799644c9858SDmitry Fleytman return virtio_net_guest_offloads_by_features(vdev->guest_features); 800644c9858SDmitry Fleytman } 801644c9858SDmitry Fleytman 802f5e1847bSJuan Quintela typedef struct { 803f5e1847bSJuan Quintela VirtIONet *n; 80412b2fad7SKevin Wolf DeviceState *dev; 80512b2fad7SKevin Wolf } FailoverDevice; 806f5e1847bSJuan Quintela 807f5e1847bSJuan Quintela /** 80812b2fad7SKevin Wolf * Set the failover primary device 809f5e1847bSJuan Quintela * 810f5e1847bSJuan Quintela * @opaque: FailoverId to setup 811f5e1847bSJuan Quintela * @opts: opts for device we are handling 812f5e1847bSJuan Quintela * @errp: returns an error if this function fails 813f5e1847bSJuan Quintela */ 81412b2fad7SKevin Wolf static int failover_set_primary(DeviceState *dev, void *opaque) 815f5e1847bSJuan Quintela { 81612b2fad7SKevin Wolf FailoverDevice *fdev = opaque; 81712b2fad7SKevin Wolf PCIDevice *pci_dev = (PCIDevice *) 81812b2fad7SKevin Wolf object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE); 819f5e1847bSJuan Quintela 82012b2fad7SKevin Wolf if (!pci_dev) { 82112b2fad7SKevin Wolf return 0; 82212b2fad7SKevin Wolf } 82312b2fad7SKevin Wolf 82412b2fad7SKevin Wolf if (!g_strcmp0(pci_dev->failover_pair_id, fdev->n->netclient_name)) { 82512b2fad7SKevin Wolf fdev->dev = dev; 826f5e1847bSJuan Quintela return 1; 827f5e1847bSJuan Quintela } 828f5e1847bSJuan Quintela 829f5e1847bSJuan Quintela return 0; 830f5e1847bSJuan Quintela } 831f5e1847bSJuan Quintela 832f5e1847bSJuan Quintela /** 83385d3b931SJuan Quintela * Find the primary device for this failover virtio-net 83485d3b931SJuan Quintela * 83585d3b931SJuan Quintela * @n: VirtIONet device 83685d3b931SJuan Quintela * @errp: returns an error if this function fails 83785d3b931SJuan Quintela */ 8380a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n) 8399711cd0dSJens Freimann { 84012b2fad7SKevin Wolf FailoverDevice fdev = { 84112b2fad7SKevin Wolf .n = n, 84212b2fad7SKevin Wolf }; 8439711cd0dSJens Freimann 84412b2fad7SKevin Wolf qbus_walk_children(sysbus_get_default(), failover_set_primary, NULL, 84512b2fad7SKevin Wolf NULL, NULL, &fdev); 84612b2fad7SKevin Wolf return fdev.dev; 8479711cd0dSJens Freimann } 8489711cd0dSJens Freimann 84921e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp) 85021e8709bSJuan Quintela { 85121e8709bSJuan Quintela Error *err = NULL; 85221e8709bSJuan Quintela DeviceState *dev = failover_find_primary_device(n); 85321e8709bSJuan Quintela 85421e8709bSJuan Quintela if (dev) { 85521e8709bSJuan Quintela return; 85621e8709bSJuan Quintela } 85721e8709bSJuan Quintela 858259a10dbSKevin Wolf if (!n->primary_opts) { 85997ca9c59SLaurent Vivier error_setg(errp, "Primary device not found"); 86097ca9c59SLaurent Vivier error_append_hint(errp, "Virtio-net failover will not work. Make " 86197ca9c59SLaurent Vivier "sure primary device has parameter" 86297ca9c59SLaurent Vivier " failover_pair_id=%s\n", n->netclient_name); 86321e8709bSJuan Quintela return; 86421e8709bSJuan Quintela } 865259a10dbSKevin Wolf 866f3558b1bSKevin Wolf dev = qdev_device_add_from_qdict(n->primary_opts, 867f3558b1bSKevin Wolf n->primary_opts_from_json, 868f3558b1bSKevin Wolf &err); 86921e8709bSJuan Quintela if (err) { 870f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 871259a10dbSKevin Wolf n->primary_opts = NULL; 87200e7b129SLaurent Vivier } else { 87300e7b129SLaurent Vivier object_unref(OBJECT(dev)); 87421e8709bSJuan Quintela } 87521e8709bSJuan Quintela error_propagate(errp, err); 87621e8709bSJuan Quintela } 87721e8709bSJuan Quintela 878d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features) 8796e790746SPaolo Bonzini { 88017a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 8819711cd0dSJens Freimann Error *err = NULL; 8826e790746SPaolo Bonzini int i; 8836e790746SPaolo Bonzini 88475ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 88575ebec11SMaxime Coquelin !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) { 88675ebec11SMaxime Coquelin features &= ~(1ULL << VIRTIO_NET_F_MTU); 88775ebec11SMaxime Coquelin } 88875ebec11SMaxime Coquelin 889ef546f12SCornelia Huck virtio_net_set_multiqueue(n, 89059079029SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_RSS) || 89195129d6fSCornelia Huck virtio_has_feature(features, VIRTIO_NET_F_MQ)); 8926e790746SPaolo Bonzini 893ef546f12SCornelia Huck virtio_net_set_mrg_rx_bufs(n, 89495129d6fSCornelia Huck virtio_has_feature(features, 895bb9d17f8SCornelia Huck VIRTIO_NET_F_MRG_RXBUF), 89695129d6fSCornelia Huck virtio_has_feature(features, 897e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 898e22f0603SYuri Benditovich virtio_has_feature(features, 899e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 9006e790746SPaolo Bonzini 9012974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 9022974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4); 9032974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 9042974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6); 905e22f0603SYuri Benditovich n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS); 9062974e916SYuri Benditovich 9076e790746SPaolo Bonzini if (n->has_vnet_hdr) { 908644c9858SDmitry Fleytman n->curr_guest_offloads = 909644c9858SDmitry Fleytman virtio_net_guest_offloads_by_features(features); 910644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 9116e790746SPaolo Bonzini } 9126e790746SPaolo Bonzini 913441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 9146e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, i); 9156e790746SPaolo Bonzini 916ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 9176e790746SPaolo Bonzini continue; 9186e790746SPaolo Bonzini } 919ed8b4afeSNikolay Nikolaev vhost_net_ack_features(get_vhost_net(nc->peer), features); 9206e790746SPaolo Bonzini } 9210b1eaa88SStefan Fritsch 92295129d6fSCornelia Huck if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) { 9230b1eaa88SStefan Fritsch memset(n->vlans, 0, MAX_VLAN >> 3); 9240b1eaa88SStefan Fritsch } else { 9250b1eaa88SStefan Fritsch memset(n->vlans, 0xff, MAX_VLAN >> 3); 9260b1eaa88SStefan Fritsch } 9279711cd0dSJens Freimann 9289711cd0dSJens Freimann if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) { 9299711cd0dSJens Freimann qapi_event_send_failover_negotiated(n->netclient_name); 930e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 9319711cd0dSJens Freimann failover_add_primary(n, &err); 9329711cd0dSJens Freimann if (err) { 9331b529d90SLaurent Vivier if (!qtest_enabled()) { 9349711cd0dSJens Freimann warn_report_err(err); 9351b529d90SLaurent Vivier } else { 9361b529d90SLaurent Vivier error_free(err); 9371b529d90SLaurent Vivier } 9389711cd0dSJens Freimann } 9396e790746SPaolo Bonzini } 94021e8709bSJuan Quintela } 9416e790746SPaolo Bonzini 9426e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd, 9436e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 9446e790746SPaolo Bonzini { 9456e790746SPaolo Bonzini uint8_t on; 9466e790746SPaolo Bonzini size_t s; 947b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 9486e790746SPaolo Bonzini 9496e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on)); 9506e790746SPaolo Bonzini if (s != sizeof(on)) { 9516e790746SPaolo Bonzini return VIRTIO_NET_ERR; 9526e790746SPaolo Bonzini } 9536e790746SPaolo Bonzini 9546e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) { 9556e790746SPaolo Bonzini n->promisc = on; 9566e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) { 9576e790746SPaolo Bonzini n->allmulti = on; 9586e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) { 9596e790746SPaolo Bonzini n->alluni = on; 9606e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) { 9616e790746SPaolo Bonzini n->nomulti = on; 9626e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) { 9636e790746SPaolo Bonzini n->nouni = on; 9646e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) { 9656e790746SPaolo Bonzini n->nobcast = on; 9666e790746SPaolo Bonzini } else { 9676e790746SPaolo Bonzini return VIRTIO_NET_ERR; 9686e790746SPaolo Bonzini } 9696e790746SPaolo Bonzini 970b1be4280SAmos Kong rxfilter_notify(nc); 971b1be4280SAmos Kong 9726e790746SPaolo Bonzini return VIRTIO_NET_OK; 9736e790746SPaolo Bonzini } 9746e790746SPaolo Bonzini 975644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd, 976644c9858SDmitry Fleytman struct iovec *iov, unsigned int iov_cnt) 977644c9858SDmitry Fleytman { 978644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 979644c9858SDmitry Fleytman uint64_t offloads; 980644c9858SDmitry Fleytman size_t s; 981644c9858SDmitry Fleytman 98295129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 983644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 984644c9858SDmitry Fleytman } 985644c9858SDmitry Fleytman 986644c9858SDmitry Fleytman s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads)); 987644c9858SDmitry Fleytman if (s != sizeof(offloads)) { 988644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 989644c9858SDmitry Fleytman } 990644c9858SDmitry Fleytman 991644c9858SDmitry Fleytman if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) { 992644c9858SDmitry Fleytman uint64_t supported_offloads; 993644c9858SDmitry Fleytman 994189ae6bbSJason Wang offloads = virtio_ldq_p(vdev, &offloads); 995189ae6bbSJason Wang 996644c9858SDmitry Fleytman if (!n->has_vnet_hdr) { 997644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 998644c9858SDmitry Fleytman } 999644c9858SDmitry Fleytman 10002974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 10012974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4); 10022974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 10032974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6); 10042974e916SYuri Benditovich virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT); 10052974e916SYuri Benditovich 1006644c9858SDmitry Fleytman supported_offloads = virtio_net_supported_guest_offloads(n); 1007644c9858SDmitry Fleytman if (offloads & ~supported_offloads) { 1008644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1009644c9858SDmitry Fleytman } 1010644c9858SDmitry Fleytman 1011644c9858SDmitry Fleytman n->curr_guest_offloads = offloads; 1012644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 1013644c9858SDmitry Fleytman 1014644c9858SDmitry Fleytman return VIRTIO_NET_OK; 1015644c9858SDmitry Fleytman } else { 1016644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1017644c9858SDmitry Fleytman } 1018644c9858SDmitry Fleytman } 1019644c9858SDmitry Fleytman 10206e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd, 10216e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 10226e790746SPaolo Bonzini { 10231399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 10246e790746SPaolo Bonzini struct virtio_net_ctrl_mac mac_data; 10256e790746SPaolo Bonzini size_t s; 1026b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 10276e790746SPaolo Bonzini 10286e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) { 10296e790746SPaolo Bonzini if (iov_size(iov, iov_cnt) != sizeof(n->mac)) { 10306e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10316e790746SPaolo Bonzini } 10326e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac)); 10336e790746SPaolo Bonzini assert(s == sizeof(n->mac)); 10346e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 1035b1be4280SAmos Kong rxfilter_notify(nc); 1036b1be4280SAmos Kong 10376e790746SPaolo Bonzini return VIRTIO_NET_OK; 10386e790746SPaolo Bonzini } 10396e790746SPaolo Bonzini 10406e790746SPaolo Bonzini if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) { 10416e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10426e790746SPaolo Bonzini } 10436e790746SPaolo Bonzini 1044cae2e556SAmos Kong int in_use = 0; 1045cae2e556SAmos Kong int first_multi = 0; 1046cae2e556SAmos Kong uint8_t uni_overflow = 0; 1047cae2e556SAmos Kong uint8_t multi_overflow = 0; 1048cae2e556SAmos Kong uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 10496e790746SPaolo Bonzini 10506e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 10516e790746SPaolo Bonzini sizeof(mac_data.entries)); 10521399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 10536e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1054b1be4280SAmos Kong goto error; 10556e790746SPaolo Bonzini } 10566e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 10576e790746SPaolo Bonzini 10586e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) { 1059b1be4280SAmos Kong goto error; 10606e790746SPaolo Bonzini } 10616e790746SPaolo Bonzini 10626e790746SPaolo Bonzini if (mac_data.entries <= MAC_TABLE_ENTRIES) { 1063cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, macs, 10646e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 10656e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1066b1be4280SAmos Kong goto error; 10676e790746SPaolo Bonzini } 1068cae2e556SAmos Kong in_use += mac_data.entries; 10696e790746SPaolo Bonzini } else { 1070cae2e556SAmos Kong uni_overflow = 1; 10716e790746SPaolo Bonzini } 10726e790746SPaolo Bonzini 10736e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN); 10746e790746SPaolo Bonzini 1075cae2e556SAmos Kong first_multi = in_use; 10766e790746SPaolo Bonzini 10776e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 10786e790746SPaolo Bonzini sizeof(mac_data.entries)); 10791399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 10806e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1081b1be4280SAmos Kong goto error; 10826e790746SPaolo Bonzini } 10836e790746SPaolo Bonzini 10846e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 10856e790746SPaolo Bonzini 10866e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) { 1087b1be4280SAmos Kong goto error; 10886e790746SPaolo Bonzini } 10896e790746SPaolo Bonzini 1090edc24385SMichael S. Tsirkin if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) { 1091cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN], 10926e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 10936e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1094b1be4280SAmos Kong goto error; 10956e790746SPaolo Bonzini } 1096cae2e556SAmos Kong in_use += mac_data.entries; 10976e790746SPaolo Bonzini } else { 1098cae2e556SAmos Kong multi_overflow = 1; 10996e790746SPaolo Bonzini } 11006e790746SPaolo Bonzini 1101cae2e556SAmos Kong n->mac_table.in_use = in_use; 1102cae2e556SAmos Kong n->mac_table.first_multi = first_multi; 1103cae2e556SAmos Kong n->mac_table.uni_overflow = uni_overflow; 1104cae2e556SAmos Kong n->mac_table.multi_overflow = multi_overflow; 1105cae2e556SAmos Kong memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN); 1106cae2e556SAmos Kong g_free(macs); 1107b1be4280SAmos Kong rxfilter_notify(nc); 1108b1be4280SAmos Kong 11096e790746SPaolo Bonzini return VIRTIO_NET_OK; 1110b1be4280SAmos Kong 1111b1be4280SAmos Kong error: 1112cae2e556SAmos Kong g_free(macs); 1113b1be4280SAmos Kong return VIRTIO_NET_ERR; 11146e790746SPaolo Bonzini } 11156e790746SPaolo Bonzini 11166e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd, 11176e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 11186e790746SPaolo Bonzini { 11191399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 11206e790746SPaolo Bonzini uint16_t vid; 11216e790746SPaolo Bonzini size_t s; 1122b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 11236e790746SPaolo Bonzini 11246e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid)); 11251399c60dSRusty Russell vid = virtio_lduw_p(vdev, &vid); 11266e790746SPaolo Bonzini if (s != sizeof(vid)) { 11276e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11286e790746SPaolo Bonzini } 11296e790746SPaolo Bonzini 11306e790746SPaolo Bonzini if (vid >= MAX_VLAN) 11316e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11326e790746SPaolo Bonzini 11336e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_VLAN_ADD) 11346e790746SPaolo Bonzini n->vlans[vid >> 5] |= (1U << (vid & 0x1f)); 11356e790746SPaolo Bonzini else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL) 11366e790746SPaolo Bonzini n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f)); 11376e790746SPaolo Bonzini else 11386e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11396e790746SPaolo Bonzini 1140b1be4280SAmos Kong rxfilter_notify(nc); 1141b1be4280SAmos Kong 11426e790746SPaolo Bonzini return VIRTIO_NET_OK; 11436e790746SPaolo Bonzini } 11446e790746SPaolo Bonzini 1145f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd, 1146f57fcf70SJason Wang struct iovec *iov, unsigned int iov_cnt) 1147f57fcf70SJason Wang { 11489d8c6a25SDr. David Alan Gilbert trace_virtio_net_handle_announce(n->announce_timer.round); 1149f57fcf70SJason Wang if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK && 1150f57fcf70SJason Wang n->status & VIRTIO_NET_S_ANNOUNCE) { 1151f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 11529d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 11539d8c6a25SDr. David Alan Gilbert qemu_announce_timer_step(&n->announce_timer); 1154f57fcf70SJason Wang } 1155f57fcf70SJason Wang return VIRTIO_NET_OK; 1156f57fcf70SJason Wang } else { 1157f57fcf70SJason Wang return VIRTIO_NET_ERR; 1158f57fcf70SJason Wang } 1159f57fcf70SJason Wang } 1160f57fcf70SJason Wang 11610145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n); 11620145c393SAndrew Melnychenko 116359079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n) 116459079029SYuri Benditovich { 116559079029SYuri Benditovich if (n->rss_data.enabled) { 116659079029SYuri Benditovich trace_virtio_net_rss_disable(); 116759079029SYuri Benditovich } 116859079029SYuri Benditovich n->rss_data.enabled = false; 11690145c393SAndrew Melnychenko 11700145c393SAndrew Melnychenko virtio_net_detach_epbf_rss(n); 11710145c393SAndrew Melnychenko } 11720145c393SAndrew Melnychenko 11730145c393SAndrew Melnychenko static bool virtio_net_attach_ebpf_to_backend(NICState *nic, int prog_fd) 11740145c393SAndrew Melnychenko { 11750145c393SAndrew Melnychenko NetClientState *nc = qemu_get_peer(qemu_get_queue(nic), 0); 11760145c393SAndrew Melnychenko if (nc == NULL || nc->info->set_steering_ebpf == NULL) { 11770145c393SAndrew Melnychenko return false; 11780145c393SAndrew Melnychenko } 11790145c393SAndrew Melnychenko 11800145c393SAndrew Melnychenko return nc->info->set_steering_ebpf(nc, prog_fd); 11810145c393SAndrew Melnychenko } 11820145c393SAndrew Melnychenko 11830145c393SAndrew Melnychenko static void rss_data_to_rss_config(struct VirtioNetRssData *data, 11840145c393SAndrew Melnychenko struct EBPFRSSConfig *config) 11850145c393SAndrew Melnychenko { 11860145c393SAndrew Melnychenko config->redirect = data->redirect; 11870145c393SAndrew Melnychenko config->populate_hash = data->populate_hash; 11880145c393SAndrew Melnychenko config->hash_types = data->hash_types; 11890145c393SAndrew Melnychenko config->indirections_len = data->indirections_len; 11900145c393SAndrew Melnychenko config->default_queue = data->default_queue; 11910145c393SAndrew Melnychenko } 11920145c393SAndrew Melnychenko 11930145c393SAndrew Melnychenko static bool virtio_net_attach_epbf_rss(VirtIONet *n) 11940145c393SAndrew Melnychenko { 11950145c393SAndrew Melnychenko struct EBPFRSSConfig config = {}; 11960145c393SAndrew Melnychenko 11970145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 11980145c393SAndrew Melnychenko return false; 11990145c393SAndrew Melnychenko } 12000145c393SAndrew Melnychenko 12010145c393SAndrew Melnychenko rss_data_to_rss_config(&n->rss_data, &config); 12020145c393SAndrew Melnychenko 12030145c393SAndrew Melnychenko if (!ebpf_rss_set_all(&n->ebpf_rss, &config, 12040145c393SAndrew Melnychenko n->rss_data.indirections_table, n->rss_data.key)) { 12050145c393SAndrew Melnychenko return false; 12060145c393SAndrew Melnychenko } 12070145c393SAndrew Melnychenko 12080145c393SAndrew Melnychenko if (!virtio_net_attach_ebpf_to_backend(n->nic, n->ebpf_rss.program_fd)) { 12090145c393SAndrew Melnychenko return false; 12100145c393SAndrew Melnychenko } 12110145c393SAndrew Melnychenko 12120145c393SAndrew Melnychenko return true; 12130145c393SAndrew Melnychenko } 12140145c393SAndrew Melnychenko 12150145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n) 12160145c393SAndrew Melnychenko { 12170145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 12180145c393SAndrew Melnychenko } 12190145c393SAndrew Melnychenko 12200145c393SAndrew Melnychenko static bool virtio_net_load_ebpf(VirtIONet *n) 12210145c393SAndrew Melnychenko { 12220145c393SAndrew Melnychenko if (!virtio_net_attach_ebpf_to_backend(n->nic, -1)) { 12230145c393SAndrew Melnychenko /* backend does't support steering ebpf */ 12240145c393SAndrew Melnychenko return false; 12250145c393SAndrew Melnychenko } 12260145c393SAndrew Melnychenko 12270145c393SAndrew Melnychenko return ebpf_rss_load(&n->ebpf_rss); 12280145c393SAndrew Melnychenko } 12290145c393SAndrew Melnychenko 12300145c393SAndrew Melnychenko static void virtio_net_unload_ebpf(VirtIONet *n) 12310145c393SAndrew Melnychenko { 12320145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 12330145c393SAndrew Melnychenko ebpf_rss_unload(&n->ebpf_rss); 123459079029SYuri Benditovich } 123559079029SYuri Benditovich 123659079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n, 1237e22f0603SYuri Benditovich struct iovec *iov, 1238e22f0603SYuri Benditovich unsigned int iov_cnt, 1239e22f0603SYuri Benditovich bool do_rss) 124059079029SYuri Benditovich { 124159079029SYuri Benditovich VirtIODevice *vdev = VIRTIO_DEVICE(n); 124259079029SYuri Benditovich struct virtio_net_rss_config cfg; 124359079029SYuri Benditovich size_t s, offset = 0, size_get; 1244441537f1SJason Wang uint16_t queue_pairs, i; 124559079029SYuri Benditovich struct { 124659079029SYuri Benditovich uint16_t us; 124759079029SYuri Benditovich uint8_t b; 124859079029SYuri Benditovich } QEMU_PACKED temp; 124959079029SYuri Benditovich const char *err_msg = ""; 125059079029SYuri Benditovich uint32_t err_value = 0; 125159079029SYuri Benditovich 1252e22f0603SYuri Benditovich if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) { 125359079029SYuri Benditovich err_msg = "RSS is not negotiated"; 125459079029SYuri Benditovich goto error; 125559079029SYuri Benditovich } 1256e22f0603SYuri Benditovich if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) { 1257e22f0603SYuri Benditovich err_msg = "Hash report is not negotiated"; 1258e22f0603SYuri Benditovich goto error; 1259e22f0603SYuri Benditovich } 126059079029SYuri Benditovich size_get = offsetof(struct virtio_net_rss_config, indirection_table); 126159079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get); 126259079029SYuri Benditovich if (s != size_get) { 126359079029SYuri Benditovich err_msg = "Short command buffer"; 126459079029SYuri Benditovich err_value = (uint32_t)s; 126559079029SYuri Benditovich goto error; 126659079029SYuri Benditovich } 126759079029SYuri Benditovich n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types); 126859079029SYuri Benditovich n->rss_data.indirections_len = 126959079029SYuri Benditovich virtio_lduw_p(vdev, &cfg.indirection_table_mask); 127059079029SYuri Benditovich n->rss_data.indirections_len++; 1271e22f0603SYuri Benditovich if (!do_rss) { 1272e22f0603SYuri Benditovich n->rss_data.indirections_len = 1; 1273e22f0603SYuri Benditovich } 127459079029SYuri Benditovich if (!is_power_of_2(n->rss_data.indirections_len)) { 127559079029SYuri Benditovich err_msg = "Invalid size of indirection table"; 127659079029SYuri Benditovich err_value = n->rss_data.indirections_len; 127759079029SYuri Benditovich goto error; 127859079029SYuri Benditovich } 127959079029SYuri Benditovich if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) { 128059079029SYuri Benditovich err_msg = "Too large indirection table"; 128159079029SYuri Benditovich err_value = n->rss_data.indirections_len; 128259079029SYuri Benditovich goto error; 128359079029SYuri Benditovich } 1284e22f0603SYuri Benditovich n->rss_data.default_queue = do_rss ? 1285e22f0603SYuri Benditovich virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0; 1286441537f1SJason Wang if (n->rss_data.default_queue >= n->max_queue_pairs) { 128759079029SYuri Benditovich err_msg = "Invalid default queue"; 128859079029SYuri Benditovich err_value = n->rss_data.default_queue; 128959079029SYuri Benditovich goto error; 129059079029SYuri Benditovich } 129159079029SYuri Benditovich offset += size_get; 129259079029SYuri Benditovich size_get = sizeof(uint16_t) * n->rss_data.indirections_len; 129359079029SYuri Benditovich g_free(n->rss_data.indirections_table); 129459079029SYuri Benditovich n->rss_data.indirections_table = g_malloc(size_get); 129559079029SYuri Benditovich if (!n->rss_data.indirections_table) { 129659079029SYuri Benditovich err_msg = "Can't allocate indirections table"; 129759079029SYuri Benditovich err_value = n->rss_data.indirections_len; 129859079029SYuri Benditovich goto error; 129959079029SYuri Benditovich } 130059079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, 130159079029SYuri Benditovich n->rss_data.indirections_table, size_get); 130259079029SYuri Benditovich if (s != size_get) { 130359079029SYuri Benditovich err_msg = "Short indirection table buffer"; 130459079029SYuri Benditovich err_value = (uint32_t)s; 130559079029SYuri Benditovich goto error; 130659079029SYuri Benditovich } 130759079029SYuri Benditovich for (i = 0; i < n->rss_data.indirections_len; ++i) { 130859079029SYuri Benditovich uint16_t val = n->rss_data.indirections_table[i]; 130959079029SYuri Benditovich n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val); 131059079029SYuri Benditovich } 131159079029SYuri Benditovich offset += size_get; 131259079029SYuri Benditovich size_get = sizeof(temp); 131359079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get); 131459079029SYuri Benditovich if (s != size_get) { 1315441537f1SJason Wang err_msg = "Can't get queue_pairs"; 131659079029SYuri Benditovich err_value = (uint32_t)s; 131759079029SYuri Benditovich goto error; 131859079029SYuri Benditovich } 1319441537f1SJason Wang queue_pairs = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queue_pairs; 1320441537f1SJason Wang if (queue_pairs == 0 || queue_pairs > n->max_queue_pairs) { 1321441537f1SJason Wang err_msg = "Invalid number of queue_pairs"; 1322441537f1SJason Wang err_value = queue_pairs; 132359079029SYuri Benditovich goto error; 132459079029SYuri Benditovich } 132559079029SYuri Benditovich if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) { 132659079029SYuri Benditovich err_msg = "Invalid key size"; 132759079029SYuri Benditovich err_value = temp.b; 132859079029SYuri Benditovich goto error; 132959079029SYuri Benditovich } 133059079029SYuri Benditovich if (!temp.b && n->rss_data.hash_types) { 133159079029SYuri Benditovich err_msg = "No key provided"; 133259079029SYuri Benditovich err_value = 0; 133359079029SYuri Benditovich goto error; 133459079029SYuri Benditovich } 133559079029SYuri Benditovich if (!temp.b && !n->rss_data.hash_types) { 133659079029SYuri Benditovich virtio_net_disable_rss(n); 1337441537f1SJason Wang return queue_pairs; 133859079029SYuri Benditovich } 133959079029SYuri Benditovich offset += size_get; 134059079029SYuri Benditovich size_get = temp.b; 134159079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get); 134259079029SYuri Benditovich if (s != size_get) { 134359079029SYuri Benditovich err_msg = "Can get key buffer"; 134459079029SYuri Benditovich err_value = (uint32_t)s; 134559079029SYuri Benditovich goto error; 134659079029SYuri Benditovich } 134759079029SYuri Benditovich n->rss_data.enabled = true; 13480145c393SAndrew Melnychenko 13490145c393SAndrew Melnychenko if (!n->rss_data.populate_hash) { 13500145c393SAndrew Melnychenko if (!virtio_net_attach_epbf_rss(n)) { 13510145c393SAndrew Melnychenko /* EBPF must be loaded for vhost */ 13520145c393SAndrew Melnychenko if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 13530145c393SAndrew Melnychenko warn_report("Can't load eBPF RSS for vhost"); 13540145c393SAndrew Melnychenko goto error; 13550145c393SAndrew Melnychenko } 13560145c393SAndrew Melnychenko /* fallback to software RSS */ 13570145c393SAndrew Melnychenko warn_report("Can't load eBPF RSS - fallback to software RSS"); 13580145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 13590145c393SAndrew Melnychenko } 13600145c393SAndrew Melnychenko } else { 13610145c393SAndrew Melnychenko /* use software RSS for hash populating */ 13620145c393SAndrew Melnychenko /* and detach eBPF if was loaded before */ 13630145c393SAndrew Melnychenko virtio_net_detach_epbf_rss(n); 13640145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 13650145c393SAndrew Melnychenko } 13660145c393SAndrew Melnychenko 136759079029SYuri Benditovich trace_virtio_net_rss_enable(n->rss_data.hash_types, 136859079029SYuri Benditovich n->rss_data.indirections_len, 136959079029SYuri Benditovich temp.b); 1370441537f1SJason Wang return queue_pairs; 137159079029SYuri Benditovich error: 137259079029SYuri Benditovich trace_virtio_net_rss_error(err_msg, err_value); 137359079029SYuri Benditovich virtio_net_disable_rss(n); 137459079029SYuri Benditovich return 0; 137559079029SYuri Benditovich } 137659079029SYuri Benditovich 13776e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd, 13786e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 13796e790746SPaolo Bonzini { 138017a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1381441537f1SJason Wang uint16_t queue_pairs; 13826e790746SPaolo Bonzini 138359079029SYuri Benditovich virtio_net_disable_rss(n); 1384e22f0603SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) { 1385441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, false); 1386441537f1SJason Wang return queue_pairs ? VIRTIO_NET_OK : VIRTIO_NET_ERR; 1387e22f0603SYuri Benditovich } 138859079029SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) { 1389441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, true); 139059079029SYuri Benditovich } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) { 139159079029SYuri Benditovich struct virtio_net_ctrl_mq mq; 139259079029SYuri Benditovich size_t s; 139359079029SYuri Benditovich if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) { 139459079029SYuri Benditovich return VIRTIO_NET_ERR; 139559079029SYuri Benditovich } 13966e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq)); 13976e790746SPaolo Bonzini if (s != sizeof(mq)) { 13986e790746SPaolo Bonzini return VIRTIO_NET_ERR; 13996e790746SPaolo Bonzini } 1400441537f1SJason Wang queue_pairs = virtio_lduw_p(vdev, &mq.virtqueue_pairs); 14016e790746SPaolo Bonzini 140259079029SYuri Benditovich } else { 14036e790746SPaolo Bonzini return VIRTIO_NET_ERR; 14046e790746SPaolo Bonzini } 14056e790746SPaolo Bonzini 1406441537f1SJason Wang if (queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN || 1407441537f1SJason Wang queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX || 1408441537f1SJason Wang queue_pairs > n->max_queue_pairs || 14096e790746SPaolo Bonzini !n->multiqueue) { 14106e790746SPaolo Bonzini return VIRTIO_NET_ERR; 14116e790746SPaolo Bonzini } 14126e790746SPaolo Bonzini 1413441537f1SJason Wang n->curr_queue_pairs = queue_pairs; 1414441537f1SJason Wang /* stop the backend before changing the number of queue_pairs to avoid handling a 14156e790746SPaolo Bonzini * disabled queue */ 141617a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 1417441537f1SJason Wang virtio_net_set_queue_pairs(n); 14186e790746SPaolo Bonzini 14196e790746SPaolo Bonzini return VIRTIO_NET_OK; 14206e790746SPaolo Bonzini } 1421ba7eadb5SGreg Kurz 14226e790746SPaolo Bonzini static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq) 14236e790746SPaolo Bonzini { 142417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 14256e790746SPaolo Bonzini struct virtio_net_ctrl_hdr ctrl; 14266e790746SPaolo Bonzini virtio_net_ctrl_ack status = VIRTIO_NET_ERR; 142751b19ebeSPaolo Bonzini VirtQueueElement *elem; 14286e790746SPaolo Bonzini size_t s; 1429771b6ed3SJason Wang struct iovec *iov, *iov2; 14306e790746SPaolo Bonzini unsigned int iov_cnt; 14316e790746SPaolo Bonzini 143251b19ebeSPaolo Bonzini for (;;) { 143351b19ebeSPaolo Bonzini elem = virtqueue_pop(vq, sizeof(VirtQueueElement)); 143451b19ebeSPaolo Bonzini if (!elem) { 143551b19ebeSPaolo Bonzini break; 143651b19ebeSPaolo Bonzini } 143751b19ebeSPaolo Bonzini if (iov_size(elem->in_sg, elem->in_num) < sizeof(status) || 143851b19ebeSPaolo Bonzini iov_size(elem->out_sg, elem->out_num) < sizeof(ctrl)) { 1439ba7eadb5SGreg Kurz virtio_error(vdev, "virtio-net ctrl missing headers"); 1440ba7eadb5SGreg Kurz virtqueue_detach_element(vq, elem, 0); 1441ba7eadb5SGreg Kurz g_free(elem); 1442ba7eadb5SGreg Kurz break; 14436e790746SPaolo Bonzini } 14446e790746SPaolo Bonzini 144551b19ebeSPaolo Bonzini iov_cnt = elem->out_num; 144651b19ebeSPaolo Bonzini iov2 = iov = g_memdup(elem->out_sg, sizeof(struct iovec) * elem->out_num); 14476e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl)); 14486e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, sizeof(ctrl)); 14496e790746SPaolo Bonzini if (s != sizeof(ctrl)) { 14506e790746SPaolo Bonzini status = VIRTIO_NET_ERR; 14516e790746SPaolo Bonzini } else if (ctrl.class == VIRTIO_NET_CTRL_RX) { 14526e790746SPaolo Bonzini status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt); 14536e790746SPaolo Bonzini } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) { 14546e790746SPaolo Bonzini status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt); 14556e790746SPaolo Bonzini } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) { 14566e790746SPaolo Bonzini status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt); 1457f57fcf70SJason Wang } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) { 1458f57fcf70SJason Wang status = virtio_net_handle_announce(n, ctrl.cmd, iov, iov_cnt); 14596e790746SPaolo Bonzini } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) { 14606e790746SPaolo Bonzini status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt); 1461644c9858SDmitry Fleytman } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) { 1462644c9858SDmitry Fleytman status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt); 14636e790746SPaolo Bonzini } 14646e790746SPaolo Bonzini 146551b19ebeSPaolo Bonzini s = iov_from_buf(elem->in_sg, elem->in_num, 0, &status, sizeof(status)); 14666e790746SPaolo Bonzini assert(s == sizeof(status)); 14676e790746SPaolo Bonzini 146851b19ebeSPaolo Bonzini virtqueue_push(vq, elem, sizeof(status)); 14696e790746SPaolo Bonzini virtio_notify(vdev, vq); 1470771b6ed3SJason Wang g_free(iov2); 147151b19ebeSPaolo Bonzini g_free(elem); 14726e790746SPaolo Bonzini } 14736e790746SPaolo Bonzini } 14746e790746SPaolo Bonzini 14756e790746SPaolo Bonzini /* RX */ 14766e790746SPaolo Bonzini 14776e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq) 14786e790746SPaolo Bonzini { 147917a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 14806e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(vq)); 14816e790746SPaolo Bonzini 14826e790746SPaolo Bonzini qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index)); 14836e790746SPaolo Bonzini } 14846e790746SPaolo Bonzini 1485b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc) 14866e790746SPaolo Bonzini { 14876e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 148817a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 14896e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 14906e790746SPaolo Bonzini 149117a0ca55SKONRAD Frederic if (!vdev->vm_running) { 1492b8c4b67eSPhilippe Mathieu-Daudé return false; 14936e790746SPaolo Bonzini } 14946e790746SPaolo Bonzini 1495441537f1SJason Wang if (nc->queue_index >= n->curr_queue_pairs) { 1496b8c4b67eSPhilippe Mathieu-Daudé return false; 14976e790746SPaolo Bonzini } 14986e790746SPaolo Bonzini 14996e790746SPaolo Bonzini if (!virtio_queue_ready(q->rx_vq) || 150017a0ca55SKONRAD Frederic !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 1501b8c4b67eSPhilippe Mathieu-Daudé return false; 15026e790746SPaolo Bonzini } 15036e790746SPaolo Bonzini 1504b8c4b67eSPhilippe Mathieu-Daudé return true; 15056e790746SPaolo Bonzini } 15066e790746SPaolo Bonzini 15076e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize) 15086e790746SPaolo Bonzini { 15096e790746SPaolo Bonzini VirtIONet *n = q->n; 15106e790746SPaolo Bonzini if (virtio_queue_empty(q->rx_vq) || 15116e790746SPaolo Bonzini (n->mergeable_rx_bufs && 15126e790746SPaolo Bonzini !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) { 15136e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 1); 15146e790746SPaolo Bonzini 15156e790746SPaolo Bonzini /* To avoid a race condition where the guest has made some buffers 15166e790746SPaolo Bonzini * available after the above check but before notification was 15176e790746SPaolo Bonzini * enabled, check for available buffers again. 15186e790746SPaolo Bonzini */ 15196e790746SPaolo Bonzini if (virtio_queue_empty(q->rx_vq) || 15206e790746SPaolo Bonzini (n->mergeable_rx_bufs && 15216e790746SPaolo Bonzini !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) { 15226e790746SPaolo Bonzini return 0; 15236e790746SPaolo Bonzini } 15246e790746SPaolo Bonzini } 15256e790746SPaolo Bonzini 15266e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 0); 15276e790746SPaolo Bonzini return 1; 15286e790746SPaolo Bonzini } 15296e790746SPaolo Bonzini 15301399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr) 1531032a74a1SCédric Le Goater { 15321399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->hdr_len); 15331399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->gso_size); 15341399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_start); 15351399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_offset); 1536032a74a1SCédric Le Goater } 1537032a74a1SCédric Le Goater 15386e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so 15396e790746SPaolo Bonzini * it never finds out that the packets don't have valid checksums. This 15406e790746SPaolo Bonzini * causes dhclient to get upset. Fedora's carried a patch for ages to 15416e790746SPaolo Bonzini * fix this with Xen but it hasn't appeared in an upstream release of 15426e790746SPaolo Bonzini * dhclient yet. 15436e790746SPaolo Bonzini * 15446e790746SPaolo Bonzini * To avoid breaking existing guests, we catch udp packets and add 15456e790746SPaolo Bonzini * checksums. This is terrible but it's better than hacking the guest 15466e790746SPaolo Bonzini * kernels. 15476e790746SPaolo Bonzini * 15486e790746SPaolo Bonzini * N.B. if we introduce a zero-copy API, this operation is no longer free so 15496e790746SPaolo Bonzini * we should provide a mechanism to disable it to avoid polluting the host 15506e790746SPaolo Bonzini * cache. 15516e790746SPaolo Bonzini */ 15526e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr, 15536e790746SPaolo Bonzini uint8_t *buf, size_t size) 15546e790746SPaolo Bonzini { 15556e790746SPaolo Bonzini if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */ 15566e790746SPaolo Bonzini (size > 27 && size < 1500) && /* normal sized MTU */ 15576e790746SPaolo Bonzini (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */ 15586e790746SPaolo Bonzini (buf[23] == 17) && /* ip.protocol == UDP */ 15596e790746SPaolo Bonzini (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */ 1560f5746335SBin Meng net_checksum_calculate(buf, size, CSUM_UDP); 15616e790746SPaolo Bonzini hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM; 15626e790746SPaolo Bonzini } 15636e790746SPaolo Bonzini } 15646e790746SPaolo Bonzini 15656e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt, 15666e790746SPaolo Bonzini const void *buf, size_t size) 15676e790746SPaolo Bonzini { 15686e790746SPaolo Bonzini if (n->has_vnet_hdr) { 15696e790746SPaolo Bonzini /* FIXME this cast is evil */ 15706e790746SPaolo Bonzini void *wbuf = (void *)buf; 15716e790746SPaolo Bonzini work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len, 15726e790746SPaolo Bonzini size - n->host_hdr_len); 15731bfa316cSGreg Kurz 15741bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 15751399c60dSRusty Russell virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf); 15761bfa316cSGreg Kurz } 15776e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr)); 15786e790746SPaolo Bonzini } else { 15796e790746SPaolo Bonzini struct virtio_net_hdr hdr = { 15806e790746SPaolo Bonzini .flags = 0, 15816e790746SPaolo Bonzini .gso_type = VIRTIO_NET_HDR_GSO_NONE 15826e790746SPaolo Bonzini }; 15836e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr); 15846e790746SPaolo Bonzini } 15856e790746SPaolo Bonzini } 15866e790746SPaolo Bonzini 15876e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size) 15886e790746SPaolo Bonzini { 15896e790746SPaolo Bonzini static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff}; 15906e790746SPaolo Bonzini static const uint8_t vlan[] = {0x81, 0x00}; 15916e790746SPaolo Bonzini uint8_t *ptr = (uint8_t *)buf; 15926e790746SPaolo Bonzini int i; 15936e790746SPaolo Bonzini 15946e790746SPaolo Bonzini if (n->promisc) 15956e790746SPaolo Bonzini return 1; 15966e790746SPaolo Bonzini 15976e790746SPaolo Bonzini ptr += n->host_hdr_len; 15986e790746SPaolo Bonzini 15996e790746SPaolo Bonzini if (!memcmp(&ptr[12], vlan, sizeof(vlan))) { 16007542d3e7SPeter Maydell int vid = lduw_be_p(ptr + 14) & 0xfff; 16016e790746SPaolo Bonzini if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f)))) 16026e790746SPaolo Bonzini return 0; 16036e790746SPaolo Bonzini } 16046e790746SPaolo Bonzini 16056e790746SPaolo Bonzini if (ptr[0] & 1) { // multicast 16066e790746SPaolo Bonzini if (!memcmp(ptr, bcast, sizeof(bcast))) { 16076e790746SPaolo Bonzini return !n->nobcast; 16086e790746SPaolo Bonzini } else if (n->nomulti) { 16096e790746SPaolo Bonzini return 0; 16106e790746SPaolo Bonzini } else if (n->allmulti || n->mac_table.multi_overflow) { 16116e790746SPaolo Bonzini return 1; 16126e790746SPaolo Bonzini } 16136e790746SPaolo Bonzini 16146e790746SPaolo Bonzini for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 16156e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 16166e790746SPaolo Bonzini return 1; 16176e790746SPaolo Bonzini } 16186e790746SPaolo Bonzini } 16196e790746SPaolo Bonzini } else { // unicast 16206e790746SPaolo Bonzini if (n->nouni) { 16216e790746SPaolo Bonzini return 0; 16226e790746SPaolo Bonzini } else if (n->alluni || n->mac_table.uni_overflow) { 16236e790746SPaolo Bonzini return 1; 16246e790746SPaolo Bonzini } else if (!memcmp(ptr, n->mac, ETH_ALEN)) { 16256e790746SPaolo Bonzini return 1; 16266e790746SPaolo Bonzini } 16276e790746SPaolo Bonzini 16286e790746SPaolo Bonzini for (i = 0; i < n->mac_table.first_multi; i++) { 16296e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 16306e790746SPaolo Bonzini return 1; 16316e790746SPaolo Bonzini } 16326e790746SPaolo Bonzini } 16336e790746SPaolo Bonzini } 16346e790746SPaolo Bonzini 16356e790746SPaolo Bonzini return 0; 16366e790746SPaolo Bonzini } 16376e790746SPaolo Bonzini 16384474e37aSYuri Benditovich static uint8_t virtio_net_get_hash_type(bool isip4, 16394474e37aSYuri Benditovich bool isip6, 16404474e37aSYuri Benditovich bool isudp, 16414474e37aSYuri Benditovich bool istcp, 16424474e37aSYuri Benditovich uint32_t types) 16434474e37aSYuri Benditovich { 16444474e37aSYuri Benditovich if (isip4) { 16454474e37aSYuri Benditovich if (istcp && (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4)) { 16464474e37aSYuri Benditovich return NetPktRssIpV4Tcp; 16474474e37aSYuri Benditovich } 16484474e37aSYuri Benditovich if (isudp && (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4)) { 16494474e37aSYuri Benditovich return NetPktRssIpV4Udp; 16504474e37aSYuri Benditovich } 16514474e37aSYuri Benditovich if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) { 16524474e37aSYuri Benditovich return NetPktRssIpV4; 16534474e37aSYuri Benditovich } 16544474e37aSYuri Benditovich } else if (isip6) { 16554474e37aSYuri Benditovich uint32_t mask = VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | 16564474e37aSYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv6; 16574474e37aSYuri Benditovich 16584474e37aSYuri Benditovich if (istcp && (types & mask)) { 16594474e37aSYuri Benditovich return (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) ? 16604474e37aSYuri Benditovich NetPktRssIpV6TcpEx : NetPktRssIpV6Tcp; 16614474e37aSYuri Benditovich } 16624474e37aSYuri Benditovich mask = VIRTIO_NET_RSS_HASH_TYPE_UDP_EX | VIRTIO_NET_RSS_HASH_TYPE_UDPv6; 16634474e37aSYuri Benditovich if (isudp && (types & mask)) { 16644474e37aSYuri Benditovich return (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) ? 16654474e37aSYuri Benditovich NetPktRssIpV6UdpEx : NetPktRssIpV6Udp; 16664474e37aSYuri Benditovich } 16674474e37aSYuri Benditovich mask = VIRTIO_NET_RSS_HASH_TYPE_IP_EX | VIRTIO_NET_RSS_HASH_TYPE_IPv6; 16684474e37aSYuri Benditovich if (types & mask) { 16694474e37aSYuri Benditovich return (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) ? 16704474e37aSYuri Benditovich NetPktRssIpV6Ex : NetPktRssIpV6; 16714474e37aSYuri Benditovich } 16724474e37aSYuri Benditovich } 16734474e37aSYuri Benditovich return 0xff; 16744474e37aSYuri Benditovich } 16754474e37aSYuri Benditovich 1676e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report, 1677e22f0603SYuri Benditovich uint32_t hash) 1678e22f0603SYuri Benditovich { 1679e22f0603SYuri Benditovich struct virtio_net_hdr_v1_hash *hdr = (void *)buf; 1680e22f0603SYuri Benditovich hdr->hash_value = hash; 1681e22f0603SYuri Benditovich hdr->hash_report = report; 1682e22f0603SYuri Benditovich } 1683e22f0603SYuri Benditovich 16844474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf, 168597cd965cSPaolo Bonzini size_t size) 16866e790746SPaolo Bonzini { 16876e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1688e22f0603SYuri Benditovich unsigned int index = nc->queue_index, new_index = index; 16894474e37aSYuri Benditovich struct NetRxPkt *pkt = n->rx_pkt; 16904474e37aSYuri Benditovich uint8_t net_hash_type; 16914474e37aSYuri Benditovich uint32_t hash; 16924474e37aSYuri Benditovich bool isip4, isip6, isudp, istcp; 1693e22f0603SYuri Benditovich static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = { 1694e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv4, 1695e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv4, 1696e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6, 1697e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6, 1698e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6_EX, 1699e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6_EX, 1700e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv4, 1701e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6, 1702e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6_EX 1703e22f0603SYuri Benditovich }; 17044474e37aSYuri Benditovich 17054474e37aSYuri Benditovich net_rx_pkt_set_protocols(pkt, buf + n->host_hdr_len, 17064474e37aSYuri Benditovich size - n->host_hdr_len); 17074474e37aSYuri Benditovich net_rx_pkt_get_protocols(pkt, &isip4, &isip6, &isudp, &istcp); 17084474e37aSYuri Benditovich if (isip4 && (net_rx_pkt_get_ip4_info(pkt)->fragment)) { 17094474e37aSYuri Benditovich istcp = isudp = false; 17104474e37aSYuri Benditovich } 17114474e37aSYuri Benditovich if (isip6 && (net_rx_pkt_get_ip6_info(pkt)->fragment)) { 17124474e37aSYuri Benditovich istcp = isudp = false; 17134474e37aSYuri Benditovich } 17144474e37aSYuri Benditovich net_hash_type = virtio_net_get_hash_type(isip4, isip6, isudp, istcp, 17154474e37aSYuri Benditovich n->rss_data.hash_types); 17164474e37aSYuri Benditovich if (net_hash_type > NetPktRssIpV6UdpEx) { 1717e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1718e22f0603SYuri Benditovich virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0); 1719e22f0603SYuri Benditovich } 1720e22f0603SYuri Benditovich return n->rss_data.redirect ? n->rss_data.default_queue : -1; 17214474e37aSYuri Benditovich } 17224474e37aSYuri Benditovich 17234474e37aSYuri Benditovich hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key); 1724e22f0603SYuri Benditovich 1725e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1726e22f0603SYuri Benditovich virtio_set_packet_hash(buf, reports[net_hash_type], hash); 1727e22f0603SYuri Benditovich } 1728e22f0603SYuri Benditovich 1729e22f0603SYuri Benditovich if (n->rss_data.redirect) { 17304474e37aSYuri Benditovich new_index = hash & (n->rss_data.indirections_len - 1); 17314474e37aSYuri Benditovich new_index = n->rss_data.indirections_table[new_index]; 17324474e37aSYuri Benditovich } 1733e22f0603SYuri Benditovich 1734e22f0603SYuri Benditovich return (index == new_index) ? -1 : new_index; 17354474e37aSYuri Benditovich } 17364474e37aSYuri Benditovich 17374474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf, 17384474e37aSYuri Benditovich size_t size, bool no_rss) 17394474e37aSYuri Benditovich { 17404474e37aSYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 17416e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 174217a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1743bedd7e93SJason Wang VirtQueueElement *elems[VIRTQUEUE_MAX_SIZE]; 1744bedd7e93SJason Wang size_t lens[VIRTQUEUE_MAX_SIZE]; 17456e790746SPaolo Bonzini struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE]; 17466e790746SPaolo Bonzini struct virtio_net_hdr_mrg_rxbuf mhdr; 17476e790746SPaolo Bonzini unsigned mhdr_cnt = 0; 1748bedd7e93SJason Wang size_t offset, i, guest_offset, j; 1749bedd7e93SJason Wang ssize_t err; 17506e790746SPaolo Bonzini 17516e790746SPaolo Bonzini if (!virtio_net_can_receive(nc)) { 17526e790746SPaolo Bonzini return -1; 17536e790746SPaolo Bonzini } 17546e790746SPaolo Bonzini 17550145c393SAndrew Melnychenko if (!no_rss && n->rss_data.enabled && n->rss_data.enabled_software_rss) { 17564474e37aSYuri Benditovich int index = virtio_net_process_rss(nc, buf, size); 17574474e37aSYuri Benditovich if (index >= 0) { 17584474e37aSYuri Benditovich NetClientState *nc2 = qemu_get_subqueue(n->nic, index); 17594474e37aSYuri Benditovich return virtio_net_receive_rcu(nc2, buf, size, true); 17604474e37aSYuri Benditovich } 17614474e37aSYuri Benditovich } 17624474e37aSYuri Benditovich 17636e790746SPaolo Bonzini /* hdr_len refers to the header we supply to the guest */ 17646e790746SPaolo Bonzini if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) { 17656e790746SPaolo Bonzini return 0; 17666e790746SPaolo Bonzini } 17676e790746SPaolo Bonzini 17686e790746SPaolo Bonzini if (!receive_filter(n, buf, size)) 17696e790746SPaolo Bonzini return size; 17706e790746SPaolo Bonzini 17716e790746SPaolo Bonzini offset = i = 0; 17726e790746SPaolo Bonzini 17736e790746SPaolo Bonzini while (offset < size) { 177451b19ebeSPaolo Bonzini VirtQueueElement *elem; 17756e790746SPaolo Bonzini int len, total; 177651b19ebeSPaolo Bonzini const struct iovec *sg; 17776e790746SPaolo Bonzini 17786e790746SPaolo Bonzini total = 0; 17796e790746SPaolo Bonzini 1780bedd7e93SJason Wang if (i == VIRTQUEUE_MAX_SIZE) { 1781bedd7e93SJason Wang virtio_error(vdev, "virtio-net unexpected long buffer chain"); 1782bedd7e93SJason Wang err = size; 1783bedd7e93SJason Wang goto err; 1784bedd7e93SJason Wang } 1785bedd7e93SJason Wang 178651b19ebeSPaolo Bonzini elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement)); 178751b19ebeSPaolo Bonzini if (!elem) { 1788ba10b9c0SGreg Kurz if (i) { 1789ba10b9c0SGreg Kurz virtio_error(vdev, "virtio-net unexpected empty queue: " 17906e790746SPaolo Bonzini "i %zd mergeable %d offset %zd, size %zd, " 1791019a3edbSGerd Hoffmann "guest hdr len %zd, host hdr len %zd " 1792019a3edbSGerd Hoffmann "guest features 0x%" PRIx64, 17936e790746SPaolo Bonzini i, n->mergeable_rx_bufs, offset, size, 1794019a3edbSGerd Hoffmann n->guest_hdr_len, n->host_hdr_len, 1795019a3edbSGerd Hoffmann vdev->guest_features); 1796ba10b9c0SGreg Kurz } 1797bedd7e93SJason Wang err = -1; 1798bedd7e93SJason Wang goto err; 17996e790746SPaolo Bonzini } 18006e790746SPaolo Bonzini 180151b19ebeSPaolo Bonzini if (elem->in_num < 1) { 1802ba10b9c0SGreg Kurz virtio_error(vdev, 1803ba10b9c0SGreg Kurz "virtio-net receive queue contains no in buffers"); 1804ba10b9c0SGreg Kurz virtqueue_detach_element(q->rx_vq, elem, 0); 1805ba10b9c0SGreg Kurz g_free(elem); 1806bedd7e93SJason Wang err = -1; 1807bedd7e93SJason Wang goto err; 18086e790746SPaolo Bonzini } 18096e790746SPaolo Bonzini 181051b19ebeSPaolo Bonzini sg = elem->in_sg; 18116e790746SPaolo Bonzini if (i == 0) { 18126e790746SPaolo Bonzini assert(offset == 0); 18136e790746SPaolo Bonzini if (n->mergeable_rx_bufs) { 18146e790746SPaolo Bonzini mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg), 181551b19ebeSPaolo Bonzini sg, elem->in_num, 18166e790746SPaolo Bonzini offsetof(typeof(mhdr), num_buffers), 18176e790746SPaolo Bonzini sizeof(mhdr.num_buffers)); 18186e790746SPaolo Bonzini } 18196e790746SPaolo Bonzini 182051b19ebeSPaolo Bonzini receive_header(n, sg, elem->in_num, buf, size); 1821e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1822e22f0603SYuri Benditovich offset = sizeof(mhdr); 1823e22f0603SYuri Benditovich iov_from_buf(sg, elem->in_num, offset, 1824e22f0603SYuri Benditovich buf + offset, n->host_hdr_len - sizeof(mhdr)); 1825e22f0603SYuri Benditovich } 18266e790746SPaolo Bonzini offset = n->host_hdr_len; 18276e790746SPaolo Bonzini total += n->guest_hdr_len; 18286e790746SPaolo Bonzini guest_offset = n->guest_hdr_len; 18296e790746SPaolo Bonzini } else { 18306e790746SPaolo Bonzini guest_offset = 0; 18316e790746SPaolo Bonzini } 18326e790746SPaolo Bonzini 18336e790746SPaolo Bonzini /* copy in packet. ugh */ 183451b19ebeSPaolo Bonzini len = iov_from_buf(sg, elem->in_num, guest_offset, 18356e790746SPaolo Bonzini buf + offset, size - offset); 18366e790746SPaolo Bonzini total += len; 18376e790746SPaolo Bonzini offset += len; 18386e790746SPaolo Bonzini /* If buffers can't be merged, at this point we 18396e790746SPaolo Bonzini * must have consumed the complete packet. 18406e790746SPaolo Bonzini * Otherwise, drop it. */ 18416e790746SPaolo Bonzini if (!n->mergeable_rx_bufs && offset < size) { 184227e57efeSLadi Prosek virtqueue_unpop(q->rx_vq, elem, total); 184351b19ebeSPaolo Bonzini g_free(elem); 1844bedd7e93SJason Wang err = size; 1845bedd7e93SJason Wang goto err; 18466e790746SPaolo Bonzini } 18476e790746SPaolo Bonzini 1848bedd7e93SJason Wang elems[i] = elem; 1849bedd7e93SJason Wang lens[i] = total; 1850bedd7e93SJason Wang i++; 18516e790746SPaolo Bonzini } 18526e790746SPaolo Bonzini 18536e790746SPaolo Bonzini if (mhdr_cnt) { 18541399c60dSRusty Russell virtio_stw_p(vdev, &mhdr.num_buffers, i); 18556e790746SPaolo Bonzini iov_from_buf(mhdr_sg, mhdr_cnt, 18566e790746SPaolo Bonzini 0, 18576e790746SPaolo Bonzini &mhdr.num_buffers, sizeof mhdr.num_buffers); 18586e790746SPaolo Bonzini } 18596e790746SPaolo Bonzini 1860bedd7e93SJason Wang for (j = 0; j < i; j++) { 1861bedd7e93SJason Wang /* signal other side */ 1862bedd7e93SJason Wang virtqueue_fill(q->rx_vq, elems[j], lens[j], j); 1863bedd7e93SJason Wang g_free(elems[j]); 1864bedd7e93SJason Wang } 1865bedd7e93SJason Wang 18666e790746SPaolo Bonzini virtqueue_flush(q->rx_vq, i); 186717a0ca55SKONRAD Frederic virtio_notify(vdev, q->rx_vq); 18686e790746SPaolo Bonzini 18696e790746SPaolo Bonzini return size; 1870bedd7e93SJason Wang 1871bedd7e93SJason Wang err: 1872bedd7e93SJason Wang for (j = 0; j < i; j++) { 1873bedd7e93SJason Wang g_free(elems[j]); 1874bedd7e93SJason Wang } 1875bedd7e93SJason Wang 1876bedd7e93SJason Wang return err; 18776e790746SPaolo Bonzini } 18786e790746SPaolo Bonzini 18792974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf, 188097cd965cSPaolo Bonzini size_t size) 188197cd965cSPaolo Bonzini { 1882068ddfa9SDr. David Alan Gilbert RCU_READ_LOCK_GUARD(); 188397cd965cSPaolo Bonzini 18844474e37aSYuri Benditovich return virtio_net_receive_rcu(nc, buf, size, false); 188597cd965cSPaolo Bonzini } 188697cd965cSPaolo Bonzini 18872974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain, 18882974e916SYuri Benditovich const uint8_t *buf, 18892974e916SYuri Benditovich VirtioNetRscUnit *unit) 18902974e916SYuri Benditovich { 18912974e916SYuri Benditovich uint16_t ip_hdrlen; 18922974e916SYuri Benditovich struct ip_header *ip; 18932974e916SYuri Benditovich 18942974e916SYuri Benditovich ip = (struct ip_header *)(buf + chain->n->guest_hdr_len 18952974e916SYuri Benditovich + sizeof(struct eth_header)); 18962974e916SYuri Benditovich unit->ip = (void *)ip; 18972974e916SYuri Benditovich ip_hdrlen = (ip->ip_ver_len & 0xF) << 2; 18982974e916SYuri Benditovich unit->ip_plen = &ip->ip_len; 18992974e916SYuri Benditovich unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen); 19002974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 19012974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen; 19022974e916SYuri Benditovich } 19032974e916SYuri Benditovich 19042974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain, 19052974e916SYuri Benditovich const uint8_t *buf, 19062974e916SYuri Benditovich VirtioNetRscUnit *unit) 19072974e916SYuri Benditovich { 19082974e916SYuri Benditovich struct ip6_header *ip6; 19092974e916SYuri Benditovich 19102974e916SYuri Benditovich ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len 19112974e916SYuri Benditovich + sizeof(struct eth_header)); 19122974e916SYuri Benditovich unit->ip = ip6; 19132974e916SYuri Benditovich unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 191478ee6bd0SPhilippe Mathieu-Daudé unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) 19152974e916SYuri Benditovich + sizeof(struct ip6_header)); 19162974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 19172974e916SYuri Benditovich 19182974e916SYuri Benditovich /* There is a difference between payload lenght in ipv4 and v6, 19192974e916SYuri Benditovich ip header is excluded in ipv6 */ 19202974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen; 19212974e916SYuri Benditovich } 19222974e916SYuri Benditovich 19232974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain, 19242974e916SYuri Benditovich VirtioNetRscSeg *seg) 19252974e916SYuri Benditovich { 19262974e916SYuri Benditovich int ret; 1927dd3d85e8SYuri Benditovich struct virtio_net_hdr_v1 *h; 19282974e916SYuri Benditovich 1929dd3d85e8SYuri Benditovich h = (struct virtio_net_hdr_v1 *)seg->buf; 19302974e916SYuri Benditovich h->flags = 0; 19312974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_NONE; 19322974e916SYuri Benditovich 19332974e916SYuri Benditovich if (seg->is_coalesced) { 1934dd3d85e8SYuri Benditovich h->rsc.segments = seg->packets; 1935dd3d85e8SYuri Benditovich h->rsc.dup_acks = seg->dup_ack; 19362974e916SYuri Benditovich h->flags = VIRTIO_NET_HDR_F_RSC_INFO; 19372974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 19382974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 19392974e916SYuri Benditovich } else { 19402974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 19412974e916SYuri Benditovich } 19422974e916SYuri Benditovich } 19432974e916SYuri Benditovich 19442974e916SYuri Benditovich ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size); 19452974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 19462974e916SYuri Benditovich g_free(seg->buf); 19472974e916SYuri Benditovich g_free(seg); 19482974e916SYuri Benditovich 19492974e916SYuri Benditovich return ret; 19502974e916SYuri Benditovich } 19512974e916SYuri Benditovich 19522974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq) 19532974e916SYuri Benditovich { 19542974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn; 19552974e916SYuri Benditovich VirtioNetRscChain *chain = (VirtioNetRscChain *)opq; 19562974e916SYuri Benditovich 19572974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) { 19582974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 19592974e916SYuri Benditovich chain->stat.purge_failed++; 19602974e916SYuri Benditovich continue; 19612974e916SYuri Benditovich } 19622974e916SYuri Benditovich } 19632974e916SYuri Benditovich 19642974e916SYuri Benditovich chain->stat.timer++; 19652974e916SYuri Benditovich if (!QTAILQ_EMPTY(&chain->buffers)) { 19662974e916SYuri Benditovich timer_mod(chain->drain_timer, 19672974e916SYuri Benditovich qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout); 19682974e916SYuri Benditovich } 19692974e916SYuri Benditovich } 19702974e916SYuri Benditovich 19712974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n) 19722974e916SYuri Benditovich { 19732974e916SYuri Benditovich VirtioNetRscChain *chain, *rn_chain; 19742974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn_seg; 19752974e916SYuri Benditovich 19762974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) { 19772974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) { 19782974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 19792974e916SYuri Benditovich g_free(seg->buf); 19802974e916SYuri Benditovich g_free(seg); 19812974e916SYuri Benditovich } 19822974e916SYuri Benditovich 19832974e916SYuri Benditovich timer_free(chain->drain_timer); 19842974e916SYuri Benditovich QTAILQ_REMOVE(&n->rsc_chains, chain, next); 19852974e916SYuri Benditovich g_free(chain); 19862974e916SYuri Benditovich } 19872974e916SYuri Benditovich } 19882974e916SYuri Benditovich 19892974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain, 19902974e916SYuri Benditovich NetClientState *nc, 19912974e916SYuri Benditovich const uint8_t *buf, size_t size) 19922974e916SYuri Benditovich { 19932974e916SYuri Benditovich uint16_t hdr_len; 19942974e916SYuri Benditovich VirtioNetRscSeg *seg; 19952974e916SYuri Benditovich 19962974e916SYuri Benditovich hdr_len = chain->n->guest_hdr_len; 19972974e916SYuri Benditovich seg = g_malloc(sizeof(VirtioNetRscSeg)); 19982974e916SYuri Benditovich seg->buf = g_malloc(hdr_len + sizeof(struct eth_header) 19992974e916SYuri Benditovich + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD); 20002974e916SYuri Benditovich memcpy(seg->buf, buf, size); 20012974e916SYuri Benditovich seg->size = size; 20022974e916SYuri Benditovich seg->packets = 1; 20032974e916SYuri Benditovich seg->dup_ack = 0; 20042974e916SYuri Benditovich seg->is_coalesced = 0; 20052974e916SYuri Benditovich seg->nc = nc; 20062974e916SYuri Benditovich 20072974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&chain->buffers, seg, next); 20082974e916SYuri Benditovich chain->stat.cache++; 20092974e916SYuri Benditovich 20102974e916SYuri Benditovich switch (chain->proto) { 20112974e916SYuri Benditovich case ETH_P_IP: 20122974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit); 20132974e916SYuri Benditovich break; 20142974e916SYuri Benditovich case ETH_P_IPV6: 20152974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit); 20162974e916SYuri Benditovich break; 20172974e916SYuri Benditovich default: 20182974e916SYuri Benditovich g_assert_not_reached(); 20192974e916SYuri Benditovich } 20202974e916SYuri Benditovich } 20212974e916SYuri Benditovich 20222974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain, 20232974e916SYuri Benditovich VirtioNetRscSeg *seg, 20242974e916SYuri Benditovich const uint8_t *buf, 20252974e916SYuri Benditovich struct tcp_header *n_tcp, 20262974e916SYuri Benditovich struct tcp_header *o_tcp) 20272974e916SYuri Benditovich { 20282974e916SYuri Benditovich uint32_t nack, oack; 20292974e916SYuri Benditovich uint16_t nwin, owin; 20302974e916SYuri Benditovich 20312974e916SYuri Benditovich nack = htonl(n_tcp->th_ack); 20322974e916SYuri Benditovich nwin = htons(n_tcp->th_win); 20332974e916SYuri Benditovich oack = htonl(o_tcp->th_ack); 20342974e916SYuri Benditovich owin = htons(o_tcp->th_win); 20352974e916SYuri Benditovich 20362974e916SYuri Benditovich if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) { 20372974e916SYuri Benditovich chain->stat.ack_out_of_win++; 20382974e916SYuri Benditovich return RSC_FINAL; 20392974e916SYuri Benditovich } else if (nack == oack) { 20402974e916SYuri Benditovich /* duplicated ack or window probe */ 20412974e916SYuri Benditovich if (nwin == owin) { 20422974e916SYuri Benditovich /* duplicated ack, add dup ack count due to whql test up to 1 */ 20432974e916SYuri Benditovich chain->stat.dup_ack++; 20442974e916SYuri Benditovich return RSC_FINAL; 20452974e916SYuri Benditovich } else { 20462974e916SYuri Benditovich /* Coalesce window update */ 20472974e916SYuri Benditovich o_tcp->th_win = n_tcp->th_win; 20482974e916SYuri Benditovich chain->stat.win_update++; 20492974e916SYuri Benditovich return RSC_COALESCE; 20502974e916SYuri Benditovich } 20512974e916SYuri Benditovich } else { 20522974e916SYuri Benditovich /* pure ack, go to 'C', finalize*/ 20532974e916SYuri Benditovich chain->stat.pure_ack++; 20542974e916SYuri Benditovich return RSC_FINAL; 20552974e916SYuri Benditovich } 20562974e916SYuri Benditovich } 20572974e916SYuri Benditovich 20582974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain, 20592974e916SYuri Benditovich VirtioNetRscSeg *seg, 20602974e916SYuri Benditovich const uint8_t *buf, 20612974e916SYuri Benditovich VirtioNetRscUnit *n_unit) 20622974e916SYuri Benditovich { 20632974e916SYuri Benditovich void *data; 20642974e916SYuri Benditovich uint16_t o_ip_len; 20652974e916SYuri Benditovich uint32_t nseq, oseq; 20662974e916SYuri Benditovich VirtioNetRscUnit *o_unit; 20672974e916SYuri Benditovich 20682974e916SYuri Benditovich o_unit = &seg->unit; 20692974e916SYuri Benditovich o_ip_len = htons(*o_unit->ip_plen); 20702974e916SYuri Benditovich nseq = htonl(n_unit->tcp->th_seq); 20712974e916SYuri Benditovich oseq = htonl(o_unit->tcp->th_seq); 20722974e916SYuri Benditovich 20732974e916SYuri Benditovich /* out of order or retransmitted. */ 20742974e916SYuri Benditovich if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) { 20752974e916SYuri Benditovich chain->stat.data_out_of_win++; 20762974e916SYuri Benditovich return RSC_FINAL; 20772974e916SYuri Benditovich } 20782974e916SYuri Benditovich 20792974e916SYuri Benditovich data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen; 20802974e916SYuri Benditovich if (nseq == oseq) { 20812974e916SYuri Benditovich if ((o_unit->payload == 0) && n_unit->payload) { 20822974e916SYuri Benditovich /* From no payload to payload, normal case, not a dup ack or etc */ 20832974e916SYuri Benditovich chain->stat.data_after_pure_ack++; 20842974e916SYuri Benditovich goto coalesce; 20852974e916SYuri Benditovich } else { 20862974e916SYuri Benditovich return virtio_net_rsc_handle_ack(chain, seg, buf, 20872974e916SYuri Benditovich n_unit->tcp, o_unit->tcp); 20882974e916SYuri Benditovich } 20892974e916SYuri Benditovich } else if ((nseq - oseq) != o_unit->payload) { 20902974e916SYuri Benditovich /* Not a consistent packet, out of order */ 20912974e916SYuri Benditovich chain->stat.data_out_of_order++; 20922974e916SYuri Benditovich return RSC_FINAL; 20932974e916SYuri Benditovich } else { 20942974e916SYuri Benditovich coalesce: 20952974e916SYuri Benditovich if ((o_ip_len + n_unit->payload) > chain->max_payload) { 20962974e916SYuri Benditovich chain->stat.over_size++; 20972974e916SYuri Benditovich return RSC_FINAL; 20982974e916SYuri Benditovich } 20992974e916SYuri Benditovich 21002974e916SYuri Benditovich /* Here comes the right data, the payload length in v4/v6 is different, 21012974e916SYuri Benditovich so use the field value to update and record the new data len */ 21022974e916SYuri Benditovich o_unit->payload += n_unit->payload; /* update new data len */ 21032974e916SYuri Benditovich 21042974e916SYuri Benditovich /* update field in ip header */ 21052974e916SYuri Benditovich *o_unit->ip_plen = htons(o_ip_len + n_unit->payload); 21062974e916SYuri Benditovich 21072974e916SYuri Benditovich /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced 21082974e916SYuri Benditovich for windows guest, while this may change the behavior for linux 21092974e916SYuri Benditovich guest (only if it uses RSC feature). */ 21102974e916SYuri Benditovich o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags; 21112974e916SYuri Benditovich 21122974e916SYuri Benditovich o_unit->tcp->th_ack = n_unit->tcp->th_ack; 21132974e916SYuri Benditovich o_unit->tcp->th_win = n_unit->tcp->th_win; 21142974e916SYuri Benditovich 21152974e916SYuri Benditovich memmove(seg->buf + seg->size, data, n_unit->payload); 21162974e916SYuri Benditovich seg->size += n_unit->payload; 21172974e916SYuri Benditovich seg->packets++; 21182974e916SYuri Benditovich chain->stat.coalesced++; 21192974e916SYuri Benditovich return RSC_COALESCE; 21202974e916SYuri Benditovich } 21212974e916SYuri Benditovich } 21222974e916SYuri Benditovich 21232974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain, 21242974e916SYuri Benditovich VirtioNetRscSeg *seg, 21252974e916SYuri Benditovich const uint8_t *buf, size_t size, 21262974e916SYuri Benditovich VirtioNetRscUnit *unit) 21272974e916SYuri Benditovich { 21282974e916SYuri Benditovich struct ip_header *ip1, *ip2; 21292974e916SYuri Benditovich 21302974e916SYuri Benditovich ip1 = (struct ip_header *)(unit->ip); 21312974e916SYuri Benditovich ip2 = (struct ip_header *)(seg->unit.ip); 21322974e916SYuri Benditovich if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst) 21332974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 21342974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 21352974e916SYuri Benditovich chain->stat.no_match++; 21362974e916SYuri Benditovich return RSC_NO_MATCH; 21372974e916SYuri Benditovich } 21382974e916SYuri Benditovich 21392974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 21402974e916SYuri Benditovich } 21412974e916SYuri Benditovich 21422974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain, 21432974e916SYuri Benditovich VirtioNetRscSeg *seg, 21442974e916SYuri Benditovich const uint8_t *buf, size_t size, 21452974e916SYuri Benditovich VirtioNetRscUnit *unit) 21462974e916SYuri Benditovich { 21472974e916SYuri Benditovich struct ip6_header *ip1, *ip2; 21482974e916SYuri Benditovich 21492974e916SYuri Benditovich ip1 = (struct ip6_header *)(unit->ip); 21502974e916SYuri Benditovich ip2 = (struct ip6_header *)(seg->unit.ip); 21512974e916SYuri Benditovich if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address)) 21522974e916SYuri Benditovich || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address)) 21532974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 21542974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 21552974e916SYuri Benditovich chain->stat.no_match++; 21562974e916SYuri Benditovich return RSC_NO_MATCH; 21572974e916SYuri Benditovich } 21582974e916SYuri Benditovich 21592974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 21602974e916SYuri Benditovich } 21612974e916SYuri Benditovich 21622974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain 21632974e916SYuri Benditovich * to prevent out of order */ 21642974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain, 21652974e916SYuri Benditovich struct tcp_header *tcp) 21662974e916SYuri Benditovich { 21672974e916SYuri Benditovich uint16_t tcp_hdr; 21682974e916SYuri Benditovich uint16_t tcp_flag; 21692974e916SYuri Benditovich 21702974e916SYuri Benditovich tcp_flag = htons(tcp->th_offset_flags); 21712974e916SYuri Benditovich tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10; 21722974e916SYuri Benditovich tcp_flag &= VIRTIO_NET_TCP_FLAG; 21732974e916SYuri Benditovich if (tcp_flag & TH_SYN) { 21742974e916SYuri Benditovich chain->stat.tcp_syn++; 21752974e916SYuri Benditovich return RSC_BYPASS; 21762974e916SYuri Benditovich } 21772974e916SYuri Benditovich 21782974e916SYuri Benditovich if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) { 21792974e916SYuri Benditovich chain->stat.tcp_ctrl_drain++; 21802974e916SYuri Benditovich return RSC_FINAL; 21812974e916SYuri Benditovich } 21822974e916SYuri Benditovich 21832974e916SYuri Benditovich if (tcp_hdr > sizeof(struct tcp_header)) { 21842974e916SYuri Benditovich chain->stat.tcp_all_opt++; 21852974e916SYuri Benditovich return RSC_FINAL; 21862974e916SYuri Benditovich } 21872974e916SYuri Benditovich 21882974e916SYuri Benditovich return RSC_CANDIDATE; 21892974e916SYuri Benditovich } 21902974e916SYuri Benditovich 21912974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain, 21922974e916SYuri Benditovich NetClientState *nc, 21932974e916SYuri Benditovich const uint8_t *buf, size_t size, 21942974e916SYuri Benditovich VirtioNetRscUnit *unit) 21952974e916SYuri Benditovich { 21962974e916SYuri Benditovich int ret; 21972974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 21982974e916SYuri Benditovich 21992974e916SYuri Benditovich if (QTAILQ_EMPTY(&chain->buffers)) { 22002974e916SYuri Benditovich chain->stat.empty_cache++; 22012974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 22022974e916SYuri Benditovich timer_mod(chain->drain_timer, 22032974e916SYuri Benditovich qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout); 22042974e916SYuri Benditovich return size; 22052974e916SYuri Benditovich } 22062974e916SYuri Benditovich 22072974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 22082974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 22092974e916SYuri Benditovich ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit); 22102974e916SYuri Benditovich } else { 22112974e916SYuri Benditovich ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit); 22122974e916SYuri Benditovich } 22132974e916SYuri Benditovich 22142974e916SYuri Benditovich if (ret == RSC_FINAL) { 22152974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 22162974e916SYuri Benditovich /* Send failed */ 22172974e916SYuri Benditovich chain->stat.final_failed++; 22182974e916SYuri Benditovich return 0; 22192974e916SYuri Benditovich } 22202974e916SYuri Benditovich 22212974e916SYuri Benditovich /* Send current packet */ 22222974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 22232974e916SYuri Benditovich } else if (ret == RSC_NO_MATCH) { 22242974e916SYuri Benditovich continue; 22252974e916SYuri Benditovich } else { 22262974e916SYuri Benditovich /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */ 22272974e916SYuri Benditovich seg->is_coalesced = 1; 22282974e916SYuri Benditovich return size; 22292974e916SYuri Benditovich } 22302974e916SYuri Benditovich } 22312974e916SYuri Benditovich 22322974e916SYuri Benditovich chain->stat.no_match_cache++; 22332974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 22342974e916SYuri Benditovich return size; 22352974e916SYuri Benditovich } 22362974e916SYuri Benditovich 22372974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */ 22382974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain, 22392974e916SYuri Benditovich NetClientState *nc, 22402974e916SYuri Benditovich const uint8_t *buf, size_t size, 22412974e916SYuri Benditovich uint16_t ip_start, uint16_t ip_size, 22422974e916SYuri Benditovich uint16_t tcp_port) 22432974e916SYuri Benditovich { 22442974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 22452974e916SYuri Benditovich uint32_t ppair1, ppair2; 22462974e916SYuri Benditovich 22472974e916SYuri Benditovich ppair1 = *(uint32_t *)(buf + tcp_port); 22482974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 22492974e916SYuri Benditovich ppair2 = *(uint32_t *)(seg->buf + tcp_port); 22502974e916SYuri Benditovich if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size) 22512974e916SYuri Benditovich || (ppair1 != ppair2)) { 22522974e916SYuri Benditovich continue; 22532974e916SYuri Benditovich } 22542974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 22552974e916SYuri Benditovich chain->stat.drain_failed++; 22562974e916SYuri Benditovich } 22572974e916SYuri Benditovich 22582974e916SYuri Benditovich break; 22592974e916SYuri Benditovich } 22602974e916SYuri Benditovich 22612974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 22622974e916SYuri Benditovich } 22632974e916SYuri Benditovich 22642974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain, 22652974e916SYuri Benditovich struct ip_header *ip, 22662974e916SYuri Benditovich const uint8_t *buf, size_t size) 22672974e916SYuri Benditovich { 22682974e916SYuri Benditovich uint16_t ip_len; 22692974e916SYuri Benditovich 22702974e916SYuri Benditovich /* Not an ipv4 packet */ 22712974e916SYuri Benditovich if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) { 22722974e916SYuri Benditovich chain->stat.ip_option++; 22732974e916SYuri Benditovich return RSC_BYPASS; 22742974e916SYuri Benditovich } 22752974e916SYuri Benditovich 22762974e916SYuri Benditovich /* Don't handle packets with ip option */ 22772974e916SYuri Benditovich if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) { 22782974e916SYuri Benditovich chain->stat.ip_option++; 22792974e916SYuri Benditovich return RSC_BYPASS; 22802974e916SYuri Benditovich } 22812974e916SYuri Benditovich 22822974e916SYuri Benditovich if (ip->ip_p != IPPROTO_TCP) { 22832974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 22842974e916SYuri Benditovich return RSC_BYPASS; 22852974e916SYuri Benditovich } 22862974e916SYuri Benditovich 22872974e916SYuri Benditovich /* Don't handle packets with ip fragment */ 22882974e916SYuri Benditovich if (!(htons(ip->ip_off) & IP_DF)) { 22892974e916SYuri Benditovich chain->stat.ip_frag++; 22902974e916SYuri Benditovich return RSC_BYPASS; 22912974e916SYuri Benditovich } 22922974e916SYuri Benditovich 22932974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 22942974e916SYuri Benditovich if (IPTOS_ECN(ip->ip_tos)) { 22952974e916SYuri Benditovich chain->stat.ip_ecn++; 22962974e916SYuri Benditovich return RSC_BYPASS; 22972974e916SYuri Benditovich } 22982974e916SYuri Benditovich 22992974e916SYuri Benditovich ip_len = htons(ip->ip_len); 23002974e916SYuri Benditovich if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header)) 23012974e916SYuri Benditovich || ip_len > (size - chain->n->guest_hdr_len - 23022974e916SYuri Benditovich sizeof(struct eth_header))) { 23032974e916SYuri Benditovich chain->stat.ip_hacked++; 23042974e916SYuri Benditovich return RSC_BYPASS; 23052974e916SYuri Benditovich } 23062974e916SYuri Benditovich 23072974e916SYuri Benditovich return RSC_CANDIDATE; 23082974e916SYuri Benditovich } 23092974e916SYuri Benditovich 23102974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain, 23112974e916SYuri Benditovich NetClientState *nc, 23122974e916SYuri Benditovich const uint8_t *buf, size_t size) 23132974e916SYuri Benditovich { 23142974e916SYuri Benditovich int32_t ret; 23152974e916SYuri Benditovich uint16_t hdr_len; 23162974e916SYuri Benditovich VirtioNetRscUnit unit; 23172974e916SYuri Benditovich 23182974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 23192974e916SYuri Benditovich 23202974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header) 23212974e916SYuri Benditovich + sizeof(struct tcp_header))) { 23222974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 23232974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23242974e916SYuri Benditovich } 23252974e916SYuri Benditovich 23262974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, buf, &unit); 23272974e916SYuri Benditovich if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size) 23282974e916SYuri Benditovich != RSC_CANDIDATE) { 23292974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23302974e916SYuri Benditovich } 23312974e916SYuri Benditovich 23322974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 23332974e916SYuri Benditovich if (ret == RSC_BYPASS) { 23342974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23352974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 23362974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 23372974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 12), 23382974e916SYuri Benditovich VIRTIO_NET_IP4_ADDR_SIZE, 23392974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)); 23402974e916SYuri Benditovich } 23412974e916SYuri Benditovich 23422974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 23432974e916SYuri Benditovich } 23442974e916SYuri Benditovich 23452974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain, 23462974e916SYuri Benditovich struct ip6_header *ip6, 23472974e916SYuri Benditovich const uint8_t *buf, size_t size) 23482974e916SYuri Benditovich { 23492974e916SYuri Benditovich uint16_t ip_len; 23502974e916SYuri Benditovich 23512974e916SYuri Benditovich if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4) 23522974e916SYuri Benditovich != IP_HEADER_VERSION_6) { 23532974e916SYuri Benditovich return RSC_BYPASS; 23542974e916SYuri Benditovich } 23552974e916SYuri Benditovich 23562974e916SYuri Benditovich /* Both option and protocol is checked in this */ 23572974e916SYuri Benditovich if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) { 23582974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 23592974e916SYuri Benditovich return RSC_BYPASS; 23602974e916SYuri Benditovich } 23612974e916SYuri Benditovich 23622974e916SYuri Benditovich ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 23632974e916SYuri Benditovich if (ip_len < sizeof(struct tcp_header) || 23642974e916SYuri Benditovich ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header) 23652974e916SYuri Benditovich - sizeof(struct ip6_header))) { 23662974e916SYuri Benditovich chain->stat.ip_hacked++; 23672974e916SYuri Benditovich return RSC_BYPASS; 23682974e916SYuri Benditovich } 23692974e916SYuri Benditovich 23702974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 23712974e916SYuri Benditovich if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) { 23722974e916SYuri Benditovich chain->stat.ip_ecn++; 23732974e916SYuri Benditovich return RSC_BYPASS; 23742974e916SYuri Benditovich } 23752974e916SYuri Benditovich 23762974e916SYuri Benditovich return RSC_CANDIDATE; 23772974e916SYuri Benditovich } 23782974e916SYuri Benditovich 23792974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc, 23802974e916SYuri Benditovich const uint8_t *buf, size_t size) 23812974e916SYuri Benditovich { 23822974e916SYuri Benditovich int32_t ret; 23832974e916SYuri Benditovich uint16_t hdr_len; 23842974e916SYuri Benditovich VirtioNetRscChain *chain; 23852974e916SYuri Benditovich VirtioNetRscUnit unit; 23862974e916SYuri Benditovich 23872974e916SYuri Benditovich chain = (VirtioNetRscChain *)opq; 23882974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 23892974e916SYuri Benditovich 23902974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header) 23912974e916SYuri Benditovich + sizeof(tcp_header))) { 23922974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23932974e916SYuri Benditovich } 23942974e916SYuri Benditovich 23952974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, buf, &unit); 23962974e916SYuri Benditovich if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain, 23972974e916SYuri Benditovich unit.ip, buf, size)) { 23982974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23992974e916SYuri Benditovich } 24002974e916SYuri Benditovich 24012974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 24022974e916SYuri Benditovich if (ret == RSC_BYPASS) { 24032974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24042974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 24052974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 24062974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 8), 24072974e916SYuri Benditovich VIRTIO_NET_IP6_ADDR_SIZE, 24082974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) 24092974e916SYuri Benditovich + sizeof(struct ip6_header)); 24102974e916SYuri Benditovich } 24112974e916SYuri Benditovich 24122974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 24132974e916SYuri Benditovich } 24142974e916SYuri Benditovich 24152974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n, 24162974e916SYuri Benditovich NetClientState *nc, 24172974e916SYuri Benditovich uint16_t proto) 24182974e916SYuri Benditovich { 24192974e916SYuri Benditovich VirtioNetRscChain *chain; 24202974e916SYuri Benditovich 24212974e916SYuri Benditovich if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) { 24222974e916SYuri Benditovich return NULL; 24232974e916SYuri Benditovich } 24242974e916SYuri Benditovich 24252974e916SYuri Benditovich QTAILQ_FOREACH(chain, &n->rsc_chains, next) { 24262974e916SYuri Benditovich if (chain->proto == proto) { 24272974e916SYuri Benditovich return chain; 24282974e916SYuri Benditovich } 24292974e916SYuri Benditovich } 24302974e916SYuri Benditovich 24312974e916SYuri Benditovich chain = g_malloc(sizeof(*chain)); 24322974e916SYuri Benditovich chain->n = n; 24332974e916SYuri Benditovich chain->proto = proto; 24342974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP) { 24352974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD; 24362974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 24372974e916SYuri Benditovich } else { 24382974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD; 24392974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 24402974e916SYuri Benditovich } 24412974e916SYuri Benditovich chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST, 24422974e916SYuri Benditovich virtio_net_rsc_purge, chain); 24432974e916SYuri Benditovich memset(&chain->stat, 0, sizeof(chain->stat)); 24442974e916SYuri Benditovich 24452974e916SYuri Benditovich QTAILQ_INIT(&chain->buffers); 24462974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next); 24472974e916SYuri Benditovich 24482974e916SYuri Benditovich return chain; 24492974e916SYuri Benditovich } 24502974e916SYuri Benditovich 24512974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc, 24522974e916SYuri Benditovich const uint8_t *buf, 24532974e916SYuri Benditovich size_t size) 24542974e916SYuri Benditovich { 24552974e916SYuri Benditovich uint16_t proto; 24562974e916SYuri Benditovich VirtioNetRscChain *chain; 24572974e916SYuri Benditovich struct eth_header *eth; 24582974e916SYuri Benditovich VirtIONet *n; 24592974e916SYuri Benditovich 24602974e916SYuri Benditovich n = qemu_get_nic_opaque(nc); 24612974e916SYuri Benditovich if (size < (n->host_hdr_len + sizeof(struct eth_header))) { 24622974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24632974e916SYuri Benditovich } 24642974e916SYuri Benditovich 24652974e916SYuri Benditovich eth = (struct eth_header *)(buf + n->guest_hdr_len); 24662974e916SYuri Benditovich proto = htons(eth->h_proto); 24672974e916SYuri Benditovich 24682974e916SYuri Benditovich chain = virtio_net_rsc_lookup_chain(n, nc, proto); 24692974e916SYuri Benditovich if (chain) { 24702974e916SYuri Benditovich chain->stat.received++; 24712974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) { 24722974e916SYuri Benditovich return virtio_net_rsc_receive4(chain, nc, buf, size); 24732974e916SYuri Benditovich } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) { 24742974e916SYuri Benditovich return virtio_net_rsc_receive6(chain, nc, buf, size); 24752974e916SYuri Benditovich } 24762974e916SYuri Benditovich } 24772974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24782974e916SYuri Benditovich } 24792974e916SYuri Benditovich 24802974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, 24812974e916SYuri Benditovich size_t size) 24822974e916SYuri Benditovich { 24832974e916SYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 24842974e916SYuri Benditovich if ((n->rsc4_enabled || n->rsc6_enabled)) { 24852974e916SYuri Benditovich return virtio_net_rsc_receive(nc, buf, size); 24862974e916SYuri Benditovich } else { 24872974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24882974e916SYuri Benditovich } 24892974e916SYuri Benditovich } 24902974e916SYuri Benditovich 24916e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q); 24926e790746SPaolo Bonzini 24936e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len) 24946e790746SPaolo Bonzini { 24956e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 24966e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 249717a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 24986e790746SPaolo Bonzini 249951b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, q->async_tx.elem, 0); 250017a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 25016e790746SPaolo Bonzini 250251b19ebeSPaolo Bonzini g_free(q->async_tx.elem); 250351b19ebeSPaolo Bonzini q->async_tx.elem = NULL; 25046e790746SPaolo Bonzini 25056e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 25066e790746SPaolo Bonzini virtio_net_flush_tx(q); 25076e790746SPaolo Bonzini } 25086e790746SPaolo Bonzini 25096e790746SPaolo Bonzini /* TX */ 25106e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q) 25116e790746SPaolo Bonzini { 25126e790746SPaolo Bonzini VirtIONet *n = q->n; 251317a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 251451b19ebeSPaolo Bonzini VirtQueueElement *elem; 25156e790746SPaolo Bonzini int32_t num_packets = 0; 25166e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(q->tx_vq)); 251717a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 25186e790746SPaolo Bonzini return num_packets; 25196e790746SPaolo Bonzini } 25206e790746SPaolo Bonzini 252151b19ebeSPaolo Bonzini if (q->async_tx.elem) { 25226e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 25236e790746SPaolo Bonzini return num_packets; 25246e790746SPaolo Bonzini } 25256e790746SPaolo Bonzini 252651b19ebeSPaolo Bonzini for (;;) { 2527bd89dd98SJason Wang ssize_t ret; 252851b19ebeSPaolo Bonzini unsigned int out_num; 252951b19ebeSPaolo Bonzini struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg; 2530feb93f36SJason Wang struct virtio_net_hdr_mrg_rxbuf mhdr; 25316e790746SPaolo Bonzini 253251b19ebeSPaolo Bonzini elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement)); 253351b19ebeSPaolo Bonzini if (!elem) { 253451b19ebeSPaolo Bonzini break; 253551b19ebeSPaolo Bonzini } 253651b19ebeSPaolo Bonzini 253751b19ebeSPaolo Bonzini out_num = elem->out_num; 253851b19ebeSPaolo Bonzini out_sg = elem->out_sg; 25396e790746SPaolo Bonzini if (out_num < 1) { 2540fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header not in first element"); 2541fa5e56c2SGreg Kurz virtqueue_detach_element(q->tx_vq, elem, 0); 2542fa5e56c2SGreg Kurz g_free(elem); 2543fa5e56c2SGreg Kurz return -EINVAL; 25446e790746SPaolo Bonzini } 25456e790746SPaolo Bonzini 2546032a74a1SCédric Le Goater if (n->has_vnet_hdr) { 2547feb93f36SJason Wang if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) < 2548feb93f36SJason Wang n->guest_hdr_len) { 2549fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header incorrect"); 2550fa5e56c2SGreg Kurz virtqueue_detach_element(q->tx_vq, elem, 0); 2551fa5e56c2SGreg Kurz g_free(elem); 2552fa5e56c2SGreg Kurz return -EINVAL; 2553032a74a1SCédric Le Goater } 25541bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 2555feb93f36SJason Wang virtio_net_hdr_swap(vdev, (void *) &mhdr); 2556feb93f36SJason Wang sg2[0].iov_base = &mhdr; 2557feb93f36SJason Wang sg2[0].iov_len = n->guest_hdr_len; 2558feb93f36SJason Wang out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1, 2559feb93f36SJason Wang out_sg, out_num, 2560feb93f36SJason Wang n->guest_hdr_len, -1); 2561feb93f36SJason Wang if (out_num == VIRTQUEUE_MAX_SIZE) { 2562feb93f36SJason Wang goto drop; 2563032a74a1SCédric Le Goater } 2564feb93f36SJason Wang out_num += 1; 2565feb93f36SJason Wang out_sg = sg2; 2566feb93f36SJason Wang } 2567feb93f36SJason Wang } 25686e790746SPaolo Bonzini /* 25696e790746SPaolo Bonzini * If host wants to see the guest header as is, we can 25706e790746SPaolo Bonzini * pass it on unchanged. Otherwise, copy just the parts 25716e790746SPaolo Bonzini * that host is interested in. 25726e790746SPaolo Bonzini */ 25736e790746SPaolo Bonzini assert(n->host_hdr_len <= n->guest_hdr_len); 25746e790746SPaolo Bonzini if (n->host_hdr_len != n->guest_hdr_len) { 25756e790746SPaolo Bonzini unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg), 25766e790746SPaolo Bonzini out_sg, out_num, 25776e790746SPaolo Bonzini 0, n->host_hdr_len); 25786e790746SPaolo Bonzini sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num, 25796e790746SPaolo Bonzini out_sg, out_num, 25806e790746SPaolo Bonzini n->guest_hdr_len, -1); 25816e790746SPaolo Bonzini out_num = sg_num; 25826e790746SPaolo Bonzini out_sg = sg; 25836e790746SPaolo Bonzini } 25846e790746SPaolo Bonzini 25856e790746SPaolo Bonzini ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index), 25866e790746SPaolo Bonzini out_sg, out_num, virtio_net_tx_complete); 25876e790746SPaolo Bonzini if (ret == 0) { 25886e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 25896e790746SPaolo Bonzini q->async_tx.elem = elem; 25906e790746SPaolo Bonzini return -EBUSY; 25916e790746SPaolo Bonzini } 25926e790746SPaolo Bonzini 2593feb93f36SJason Wang drop: 259451b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, elem, 0); 259517a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 259651b19ebeSPaolo Bonzini g_free(elem); 25976e790746SPaolo Bonzini 25986e790746SPaolo Bonzini if (++num_packets >= n->tx_burst) { 25996e790746SPaolo Bonzini break; 26006e790746SPaolo Bonzini } 26016e790746SPaolo Bonzini } 26026e790746SPaolo Bonzini return num_packets; 26036e790746SPaolo Bonzini } 26046e790746SPaolo Bonzini 26056e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq) 26066e790746SPaolo Bonzini { 260717a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 26086e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 26096e790746SPaolo Bonzini 2610283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2611283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2612283e2c2aSYuri Benditovich return; 2613283e2c2aSYuri Benditovich } 2614283e2c2aSYuri Benditovich 26156e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 261617a0ca55SKONRAD Frederic if (!vdev->vm_running) { 26176e790746SPaolo Bonzini q->tx_waiting = 1; 26186e790746SPaolo Bonzini return; 26196e790746SPaolo Bonzini } 26206e790746SPaolo Bonzini 26216e790746SPaolo Bonzini if (q->tx_waiting) { 26226e790746SPaolo Bonzini virtio_queue_set_notification(vq, 1); 2623bc72ad67SAlex Bligh timer_del(q->tx_timer); 26246e790746SPaolo Bonzini q->tx_waiting = 0; 2625fa5e56c2SGreg Kurz if (virtio_net_flush_tx(q) == -EINVAL) { 2626fa5e56c2SGreg Kurz return; 2627fa5e56c2SGreg Kurz } 26286e790746SPaolo Bonzini } else { 2629bc72ad67SAlex Bligh timer_mod(q->tx_timer, 2630bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 26316e790746SPaolo Bonzini q->tx_waiting = 1; 26326e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 26336e790746SPaolo Bonzini } 26346e790746SPaolo Bonzini } 26356e790746SPaolo Bonzini 26366e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq) 26376e790746SPaolo Bonzini { 263817a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 26396e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 26406e790746SPaolo Bonzini 2641283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2642283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2643283e2c2aSYuri Benditovich return; 2644283e2c2aSYuri Benditovich } 2645283e2c2aSYuri Benditovich 26466e790746SPaolo Bonzini if (unlikely(q->tx_waiting)) { 26476e790746SPaolo Bonzini return; 26486e790746SPaolo Bonzini } 26496e790746SPaolo Bonzini q->tx_waiting = 1; 26506e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 265117a0ca55SKONRAD Frederic if (!vdev->vm_running) { 26526e790746SPaolo Bonzini return; 26536e790746SPaolo Bonzini } 26546e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 26556e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 26566e790746SPaolo Bonzini } 26576e790746SPaolo Bonzini 26586e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque) 26596e790746SPaolo Bonzini { 26606e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 26616e790746SPaolo Bonzini VirtIONet *n = q->n; 266217a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2663e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2664e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2665e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2666e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2667e8bcf842SMichael S. Tsirkin return; 2668e8bcf842SMichael S. Tsirkin } 26696e790746SPaolo Bonzini 26706e790746SPaolo Bonzini q->tx_waiting = 0; 26716e790746SPaolo Bonzini 26726e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 267317a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 26746e790746SPaolo Bonzini return; 267517a0ca55SKONRAD Frederic } 26766e790746SPaolo Bonzini 26776e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 26786e790746SPaolo Bonzini virtio_net_flush_tx(q); 26796e790746SPaolo Bonzini } 26806e790746SPaolo Bonzini 26816e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque) 26826e790746SPaolo Bonzini { 26836e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 26846e790746SPaolo Bonzini VirtIONet *n = q->n; 268517a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 26866e790746SPaolo Bonzini int32_t ret; 26876e790746SPaolo Bonzini 2688e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2689e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2690e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2691e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2692e8bcf842SMichael S. Tsirkin return; 2693e8bcf842SMichael S. Tsirkin } 26946e790746SPaolo Bonzini 26956e790746SPaolo Bonzini q->tx_waiting = 0; 26966e790746SPaolo Bonzini 26976e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 269817a0ca55SKONRAD Frederic if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) { 26996e790746SPaolo Bonzini return; 270017a0ca55SKONRAD Frederic } 27016e790746SPaolo Bonzini 27026e790746SPaolo Bonzini ret = virtio_net_flush_tx(q); 2703fa5e56c2SGreg Kurz if (ret == -EBUSY || ret == -EINVAL) { 2704fa5e56c2SGreg Kurz return; /* Notification re-enable handled by tx_complete or device 2705fa5e56c2SGreg Kurz * broken */ 27066e790746SPaolo Bonzini } 27076e790746SPaolo Bonzini 27086e790746SPaolo Bonzini /* If we flush a full burst of packets, assume there are 27096e790746SPaolo Bonzini * more coming and immediately reschedule */ 27106e790746SPaolo Bonzini if (ret >= n->tx_burst) { 27116e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 27126e790746SPaolo Bonzini q->tx_waiting = 1; 27136e790746SPaolo Bonzini return; 27146e790746SPaolo Bonzini } 27156e790746SPaolo Bonzini 27166e790746SPaolo Bonzini /* If less than a full burst, re-enable notification and flush 27176e790746SPaolo Bonzini * anything that may have come in while we weren't looking. If 27186e790746SPaolo Bonzini * we find something, assume the guest is still active and reschedule */ 27196e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 2720fa5e56c2SGreg Kurz ret = virtio_net_flush_tx(q); 2721fa5e56c2SGreg Kurz if (ret == -EINVAL) { 2722fa5e56c2SGreg Kurz return; 2723fa5e56c2SGreg Kurz } else if (ret > 0) { 27246e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 27256e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 27266e790746SPaolo Bonzini q->tx_waiting = 1; 27276e790746SPaolo Bonzini } 27286e790746SPaolo Bonzini } 27296e790746SPaolo Bonzini 2730f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index) 2731f9d6dbf0SWen Congyang { 2732f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2733f9d6dbf0SWen Congyang 27341c0fbfa3SMichael S. Tsirkin n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size, 27351c0fbfa3SMichael S. Tsirkin virtio_net_handle_rx); 27369b02e161SWei Wang 2737f9d6dbf0SWen Congyang if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) { 2738f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 27399b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 27409b02e161SWei Wang virtio_net_handle_tx_timer); 2741f9d6dbf0SWen Congyang n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, 2742f9d6dbf0SWen Congyang virtio_net_tx_timer, 2743f9d6dbf0SWen Congyang &n->vqs[index]); 2744f9d6dbf0SWen Congyang } else { 2745f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 27469b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 27479b02e161SWei Wang virtio_net_handle_tx_bh); 2748f9d6dbf0SWen Congyang n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]); 2749f9d6dbf0SWen Congyang } 2750f9d6dbf0SWen Congyang 2751f9d6dbf0SWen Congyang n->vqs[index].tx_waiting = 0; 2752f9d6dbf0SWen Congyang n->vqs[index].n = n; 2753f9d6dbf0SWen Congyang } 2754f9d6dbf0SWen Congyang 2755f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index) 2756f9d6dbf0SWen Congyang { 2757f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2758f9d6dbf0SWen Congyang VirtIONetQueue *q = &n->vqs[index]; 2759f9d6dbf0SWen Congyang NetClientState *nc = qemu_get_subqueue(n->nic, index); 2760f9d6dbf0SWen Congyang 2761f9d6dbf0SWen Congyang qemu_purge_queued_packets(nc); 2762f9d6dbf0SWen Congyang 2763f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2); 2764f9d6dbf0SWen Congyang if (q->tx_timer) { 2765f9d6dbf0SWen Congyang timer_free(q->tx_timer); 2766f989c30cSYunjian Wang q->tx_timer = NULL; 2767f9d6dbf0SWen Congyang } else { 2768f9d6dbf0SWen Congyang qemu_bh_delete(q->tx_bh); 2769f989c30cSYunjian Wang q->tx_bh = NULL; 2770f9d6dbf0SWen Congyang } 2771f989c30cSYunjian Wang q->tx_waiting = 0; 2772f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2 + 1); 2773f9d6dbf0SWen Congyang } 2774f9d6dbf0SWen Congyang 2775441537f1SJason Wang static void virtio_net_change_num_queue_pairs(VirtIONet *n, int new_max_queue_pairs) 2776f9d6dbf0SWen Congyang { 2777f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2778f9d6dbf0SWen Congyang int old_num_queues = virtio_get_num_queues(vdev); 2779441537f1SJason Wang int new_num_queues = new_max_queue_pairs * 2 + 1; 2780f9d6dbf0SWen Congyang int i; 2781f9d6dbf0SWen Congyang 2782f9d6dbf0SWen Congyang assert(old_num_queues >= 3); 2783f9d6dbf0SWen Congyang assert(old_num_queues % 2 == 1); 2784f9d6dbf0SWen Congyang 2785f9d6dbf0SWen Congyang if (old_num_queues == new_num_queues) { 2786f9d6dbf0SWen Congyang return; 2787f9d6dbf0SWen Congyang } 2788f9d6dbf0SWen Congyang 2789f9d6dbf0SWen Congyang /* 2790f9d6dbf0SWen Congyang * We always need to remove and add ctrl vq if 2791f9d6dbf0SWen Congyang * old_num_queues != new_num_queues. Remove ctrl_vq first, 279220f86a75SYuval Shaia * and then we only enter one of the following two loops. 2793f9d6dbf0SWen Congyang */ 2794f9d6dbf0SWen Congyang virtio_del_queue(vdev, old_num_queues - 1); 2795f9d6dbf0SWen Congyang 2796f9d6dbf0SWen Congyang for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) { 2797f9d6dbf0SWen Congyang /* new_num_queues < old_num_queues */ 2798f9d6dbf0SWen Congyang virtio_net_del_queue(n, i / 2); 2799f9d6dbf0SWen Congyang } 2800f9d6dbf0SWen Congyang 2801f9d6dbf0SWen Congyang for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) { 2802f9d6dbf0SWen Congyang /* new_num_queues > old_num_queues */ 2803f9d6dbf0SWen Congyang virtio_net_add_queue(n, i / 2); 2804f9d6dbf0SWen Congyang } 2805f9d6dbf0SWen Congyang 2806f9d6dbf0SWen Congyang /* add ctrl_vq last */ 2807f9d6dbf0SWen Congyang n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 2808f9d6dbf0SWen Congyang } 2809f9d6dbf0SWen Congyang 2810ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue) 28116e790746SPaolo Bonzini { 2812441537f1SJason Wang int max = multiqueue ? n->max_queue_pairs : 1; 2813f9d6dbf0SWen Congyang 28146e790746SPaolo Bonzini n->multiqueue = multiqueue; 2815441537f1SJason Wang virtio_net_change_num_queue_pairs(n, max); 28166e790746SPaolo Bonzini 2817441537f1SJason Wang virtio_net_set_queue_pairs(n); 28186e790746SPaolo Bonzini } 28196e790746SPaolo Bonzini 2820982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id) 2821037dab2fSGreg Kurz { 2822982b78c5SDr. David Alan Gilbert VirtIONet *n = opaque; 2823982b78c5SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 2824037dab2fSGreg Kurz int i, link_down; 2825037dab2fSGreg Kurz 28269d8c6a25SDr. David Alan Gilbert trace_virtio_net_post_load_device(); 2827982b78c5SDr. David Alan Gilbert virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs, 282895129d6fSCornelia Huck virtio_vdev_has_feature(vdev, 2829e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 2830e22f0603SYuri Benditovich virtio_vdev_has_feature(vdev, 2831e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 28326e790746SPaolo Bonzini 28336e790746SPaolo Bonzini /* MAC_TABLE_ENTRIES may be different from the saved image */ 2834982b78c5SDr. David Alan Gilbert if (n->mac_table.in_use > MAC_TABLE_ENTRIES) { 28356e790746SPaolo Bonzini n->mac_table.in_use = 0; 28366e790746SPaolo Bonzini } 28376e790746SPaolo Bonzini 2838982b78c5SDr. David Alan Gilbert if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 28396c666823SMichael S. Tsirkin n->curr_guest_offloads = virtio_net_supported_guest_offloads(n); 28406c666823SMichael S. Tsirkin } 28416c666823SMichael S. Tsirkin 28427788c3f2SMikhail Sennikovsky /* 28437788c3f2SMikhail Sennikovsky * curr_guest_offloads will be later overwritten by the 28447788c3f2SMikhail Sennikovsky * virtio_set_features_nocheck call done from the virtio_load. 28457788c3f2SMikhail Sennikovsky * Here we make sure it is preserved and restored accordingly 28467788c3f2SMikhail Sennikovsky * in the virtio_net_post_load_virtio callback. 28477788c3f2SMikhail Sennikovsky */ 28487788c3f2SMikhail Sennikovsky n->saved_guest_offloads = n->curr_guest_offloads; 28496c666823SMichael S. Tsirkin 2850441537f1SJason Wang virtio_net_set_queue_pairs(n); 28516e790746SPaolo Bonzini 28526e790746SPaolo Bonzini /* Find the first multicast entry in the saved MAC filter */ 28536e790746SPaolo Bonzini for (i = 0; i < n->mac_table.in_use; i++) { 28546e790746SPaolo Bonzini if (n->mac_table.macs[i * ETH_ALEN] & 1) { 28556e790746SPaolo Bonzini break; 28566e790746SPaolo Bonzini } 28576e790746SPaolo Bonzini } 28586e790746SPaolo Bonzini n->mac_table.first_multi = i; 28596e790746SPaolo Bonzini 28606e790746SPaolo Bonzini /* nc.link_down can't be migrated, so infer link_down according 28616e790746SPaolo Bonzini * to link status bit in n->status */ 28626e790746SPaolo Bonzini link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0; 2863441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 28646e790746SPaolo Bonzini qemu_get_subqueue(n->nic, i)->link_down = link_down; 28656e790746SPaolo Bonzini } 28666e790746SPaolo Bonzini 28676c666823SMichael S. Tsirkin if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 28686c666823SMichael S. Tsirkin virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 28699d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 28709d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 28719d8c6a25SDr. David Alan Gilbert virtio_net_announce_timer, n); 28729d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 28739d8c6a25SDr. David Alan Gilbert timer_mod(n->announce_timer.tm, 28749d8c6a25SDr. David Alan Gilbert qemu_clock_get_ms(n->announce_timer.type)); 28759d8c6a25SDr. David Alan Gilbert } else { 2876944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 28779d8c6a25SDr. David Alan Gilbert } 28786c666823SMichael S. Tsirkin } 28796c666823SMichael S. Tsirkin 2880e41b7114SYuri Benditovich if (n->rss_data.enabled) { 28810145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = n->rss_data.populate_hash; 28820145c393SAndrew Melnychenko if (!n->rss_data.populate_hash) { 28830145c393SAndrew Melnychenko if (!virtio_net_attach_epbf_rss(n)) { 28840145c393SAndrew Melnychenko if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 28850145c393SAndrew Melnychenko warn_report("Can't post-load eBPF RSS for vhost"); 28860145c393SAndrew Melnychenko } else { 28870145c393SAndrew Melnychenko warn_report("Can't post-load eBPF RSS - " 28880145c393SAndrew Melnychenko "fallback to software RSS"); 28890145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 28900145c393SAndrew Melnychenko } 28910145c393SAndrew Melnychenko } 28920145c393SAndrew Melnychenko } 28930145c393SAndrew Melnychenko 2894e41b7114SYuri Benditovich trace_virtio_net_rss_enable(n->rss_data.hash_types, 2895e41b7114SYuri Benditovich n->rss_data.indirections_len, 2896e41b7114SYuri Benditovich sizeof(n->rss_data.key)); 2897e41b7114SYuri Benditovich } else { 2898e41b7114SYuri Benditovich trace_virtio_net_rss_disable(); 2899e41b7114SYuri Benditovich } 29006e790746SPaolo Bonzini return 0; 29016e790746SPaolo Bonzini } 29026e790746SPaolo Bonzini 29037788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev) 29047788c3f2SMikhail Sennikovsky { 29057788c3f2SMikhail Sennikovsky VirtIONet *n = VIRTIO_NET(vdev); 29067788c3f2SMikhail Sennikovsky /* 29077788c3f2SMikhail Sennikovsky * The actual needed state is now in saved_guest_offloads, 29087788c3f2SMikhail Sennikovsky * see virtio_net_post_load_device for detail. 29097788c3f2SMikhail Sennikovsky * Restore it back and apply the desired offloads. 29107788c3f2SMikhail Sennikovsky */ 29117788c3f2SMikhail Sennikovsky n->curr_guest_offloads = n->saved_guest_offloads; 29127788c3f2SMikhail Sennikovsky if (peer_has_vnet_hdr(n)) { 29137788c3f2SMikhail Sennikovsky virtio_net_apply_guest_offloads(n); 29147788c3f2SMikhail Sennikovsky } 29157788c3f2SMikhail Sennikovsky 29167788c3f2SMikhail Sennikovsky return 0; 29177788c3f2SMikhail Sennikovsky } 29187788c3f2SMikhail Sennikovsky 2919982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */ 2920982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = { 2921982b78c5SDr. David Alan Gilbert .name = "virtio-net-queue-tx_waiting", 2922982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 2923982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(tx_waiting, VirtIONetQueue), 2924982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 2925982b78c5SDr. David Alan Gilbert }, 2926982b78c5SDr. David Alan Gilbert }; 2927982b78c5SDr. David Alan Gilbert 2928441537f1SJason Wang static bool max_queue_pairs_gt_1(void *opaque, int version_id) 2929982b78c5SDr. David Alan Gilbert { 2930441537f1SJason Wang return VIRTIO_NET(opaque)->max_queue_pairs > 1; 2931982b78c5SDr. David Alan Gilbert } 2932982b78c5SDr. David Alan Gilbert 2933982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id) 2934982b78c5SDr. David Alan Gilbert { 2935982b78c5SDr. David Alan Gilbert return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque), 2936982b78c5SDr. David Alan Gilbert VIRTIO_NET_F_CTRL_GUEST_OFFLOADS); 2937982b78c5SDr. David Alan Gilbert } 2938982b78c5SDr. David Alan Gilbert 2939982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id) 2940982b78c5SDr. David Alan Gilbert { 2941982b78c5SDr. David Alan Gilbert return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES; 2942982b78c5SDr. David Alan Gilbert } 2943982b78c5SDr. David Alan Gilbert 2944982b78c5SDr. David Alan Gilbert static bool mac_table_doesnt_fit(void *opaque, int version_id) 2945982b78c5SDr. David Alan Gilbert { 2946982b78c5SDr. David Alan Gilbert return !mac_table_fits(opaque, version_id); 2947982b78c5SDr. David Alan Gilbert } 2948982b78c5SDr. David Alan Gilbert 2949982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods 2950982b78c5SDr. David Alan Gilbert * although only some fields are used by each. 2951982b78c5SDr. David Alan Gilbert */ 2952982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp { 2953982b78c5SDr. David Alan Gilbert VirtIONet *parent; 2954982b78c5SDr. David Alan Gilbert VirtIONetQueue *vqs_1; 2955441537f1SJason Wang uint16_t curr_queue_pairs_1; 2956982b78c5SDr. David Alan Gilbert uint8_t has_ufo; 2957982b78c5SDr. David Alan Gilbert uint32_t has_vnet_hdr; 2958982b78c5SDr. David Alan Gilbert }; 2959982b78c5SDr. David Alan Gilbert 2960982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than 2961441537f1SJason Wang * the 1st entry in the queue_pairs and only if there's more than one 2962982b78c5SDr. David Alan Gilbert * entry. We use the tmp mechanism to calculate a temporary 2963982b78c5SDr. David Alan Gilbert * pointer and count and also validate the count. 2964982b78c5SDr. David Alan Gilbert */ 2965982b78c5SDr. David Alan Gilbert 296644b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque) 2967982b78c5SDr. David Alan Gilbert { 2968982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 2969982b78c5SDr. David Alan Gilbert 2970982b78c5SDr. David Alan Gilbert tmp->vqs_1 = tmp->parent->vqs + 1; 2971441537f1SJason Wang tmp->curr_queue_pairs_1 = tmp->parent->curr_queue_pairs - 1; 2972441537f1SJason Wang if (tmp->parent->curr_queue_pairs == 0) { 2973441537f1SJason Wang tmp->curr_queue_pairs_1 = 0; 2974982b78c5SDr. David Alan Gilbert } 297544b1ff31SDr. David Alan Gilbert 297644b1ff31SDr. David Alan Gilbert return 0; 2977982b78c5SDr. David Alan Gilbert } 2978982b78c5SDr. David Alan Gilbert 2979982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque) 2980982b78c5SDr. David Alan Gilbert { 2981982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 2982982b78c5SDr. David Alan Gilbert 2983982b78c5SDr. David Alan Gilbert /* Reuse the pointer setup from save */ 2984982b78c5SDr. David Alan Gilbert virtio_net_tx_waiting_pre_save(opaque); 2985982b78c5SDr. David Alan Gilbert 2986441537f1SJason Wang if (tmp->parent->curr_queue_pairs > tmp->parent->max_queue_pairs) { 2987441537f1SJason Wang error_report("virtio-net: curr_queue_pairs %x > max_queue_pairs %x", 2988441537f1SJason Wang tmp->parent->curr_queue_pairs, tmp->parent->max_queue_pairs); 2989982b78c5SDr. David Alan Gilbert 2990982b78c5SDr. David Alan Gilbert return -EINVAL; 2991982b78c5SDr. David Alan Gilbert } 2992982b78c5SDr. David Alan Gilbert 2993982b78c5SDr. David Alan Gilbert return 0; /* all good */ 2994982b78c5SDr. David Alan Gilbert } 2995982b78c5SDr. David Alan Gilbert 2996982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = { 2997982b78c5SDr. David Alan Gilbert .name = "virtio-net-tx_waiting", 2998982b78c5SDr. David Alan Gilbert .pre_load = virtio_net_tx_waiting_pre_load, 2999982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_tx_waiting_pre_save, 3000982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3001982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp, 3002441537f1SJason Wang curr_queue_pairs_1, 3003982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3004982b78c5SDr. David Alan Gilbert struct VirtIONetQueue), 3005982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3006982b78c5SDr. David Alan Gilbert }, 3007982b78c5SDr. David Alan Gilbert }; 3008982b78c5SDr. David Alan Gilbert 3009982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the 3010982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3011982b78c5SDr. David Alan Gilbert */ 3012982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id) 3013982b78c5SDr. David Alan Gilbert { 3014982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3015982b78c5SDr. David Alan Gilbert 3016982b78c5SDr. David Alan Gilbert if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) { 3017982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires TUN_F_UFO support"); 3018982b78c5SDr. David Alan Gilbert return -EINVAL; 3019982b78c5SDr. David Alan Gilbert } 3020982b78c5SDr. David Alan Gilbert 3021982b78c5SDr. David Alan Gilbert return 0; 3022982b78c5SDr. David Alan Gilbert } 3023982b78c5SDr. David Alan Gilbert 302444b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque) 3025982b78c5SDr. David Alan Gilbert { 3026982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3027982b78c5SDr. David Alan Gilbert 3028982b78c5SDr. David Alan Gilbert tmp->has_ufo = tmp->parent->has_ufo; 302944b1ff31SDr. David Alan Gilbert 303044b1ff31SDr. David Alan Gilbert return 0; 3031982b78c5SDr. David Alan Gilbert } 3032982b78c5SDr. David Alan Gilbert 3033982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = { 3034982b78c5SDr. David Alan Gilbert .name = "virtio-net-ufo", 3035982b78c5SDr. David Alan Gilbert .post_load = virtio_net_ufo_post_load, 3036982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_ufo_pre_save, 3037982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3038982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp), 3039982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3040982b78c5SDr. David Alan Gilbert }, 3041982b78c5SDr. David Alan Gilbert }; 3042982b78c5SDr. David Alan Gilbert 3043982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the 3044982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3045982b78c5SDr. David Alan Gilbert */ 3046982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id) 3047982b78c5SDr. David Alan Gilbert { 3048982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3049982b78c5SDr. David Alan Gilbert 3050982b78c5SDr. David Alan Gilbert if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) { 3051982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires vnet_hdr=on"); 3052982b78c5SDr. David Alan Gilbert return -EINVAL; 3053982b78c5SDr. David Alan Gilbert } 3054982b78c5SDr. David Alan Gilbert 3055982b78c5SDr. David Alan Gilbert return 0; 3056982b78c5SDr. David Alan Gilbert } 3057982b78c5SDr. David Alan Gilbert 305844b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque) 3059982b78c5SDr. David Alan Gilbert { 3060982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3061982b78c5SDr. David Alan Gilbert 3062982b78c5SDr. David Alan Gilbert tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr; 306344b1ff31SDr. David Alan Gilbert 306444b1ff31SDr. David Alan Gilbert return 0; 3065982b78c5SDr. David Alan Gilbert } 3066982b78c5SDr. David Alan Gilbert 3067982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = { 3068982b78c5SDr. David Alan Gilbert .name = "virtio-net-vnet", 3069982b78c5SDr. David Alan Gilbert .post_load = virtio_net_vnet_post_load, 3070982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_vnet_pre_save, 3071982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3072982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp), 3073982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3074982b78c5SDr. David Alan Gilbert }, 3075982b78c5SDr. David Alan Gilbert }; 3076982b78c5SDr. David Alan Gilbert 3077e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque) 3078e41b7114SYuri Benditovich { 3079e41b7114SYuri Benditovich return VIRTIO_NET(opaque)->rss_data.enabled; 3080e41b7114SYuri Benditovich } 3081e41b7114SYuri Benditovich 3082e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = { 3083e41b7114SYuri Benditovich .name = "virtio-net-device/rss", 3084e41b7114SYuri Benditovich .version_id = 1, 3085e41b7114SYuri Benditovich .minimum_version_id = 1, 3086e41b7114SYuri Benditovich .needed = virtio_net_rss_needed, 3087e41b7114SYuri Benditovich .fields = (VMStateField[]) { 3088e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.enabled, VirtIONet), 3089e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.redirect, VirtIONet), 3090e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.populate_hash, VirtIONet), 3091e41b7114SYuri Benditovich VMSTATE_UINT32(rss_data.hash_types, VirtIONet), 3092e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.indirections_len, VirtIONet), 3093e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.default_queue, VirtIONet), 3094e41b7114SYuri Benditovich VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet, 3095e41b7114SYuri Benditovich VIRTIO_NET_RSS_MAX_KEY_SIZE), 3096e41b7114SYuri Benditovich VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet, 3097e41b7114SYuri Benditovich rss_data.indirections_len, 0, 3098e41b7114SYuri Benditovich vmstate_info_uint16, uint16_t), 3099e41b7114SYuri Benditovich VMSTATE_END_OF_LIST() 3100e41b7114SYuri Benditovich }, 3101e41b7114SYuri Benditovich }; 3102e41b7114SYuri Benditovich 3103982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = { 3104982b78c5SDr. David Alan Gilbert .name = "virtio-net-device", 3105982b78c5SDr. David Alan Gilbert .version_id = VIRTIO_NET_VM_VERSION, 3106982b78c5SDr. David Alan Gilbert .minimum_version_id = VIRTIO_NET_VM_VERSION, 3107982b78c5SDr. David Alan Gilbert .post_load = virtio_net_post_load_device, 3108982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3109982b78c5SDr. David Alan Gilbert VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN), 3110982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_POINTER(vqs, VirtIONet, 3111982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3112982b78c5SDr. David Alan Gilbert VirtIONetQueue), 3113982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet), 3114982b78c5SDr. David Alan Gilbert VMSTATE_UINT16(status, VirtIONet), 3115982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(promisc, VirtIONet), 3116982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(allmulti, VirtIONet), 3117982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mac_table.in_use, VirtIONet), 3118982b78c5SDr. David Alan Gilbert 3119982b78c5SDr. David Alan Gilbert /* Guarded pair: If it fits we load it, else we throw it away 3120982b78c5SDr. David Alan Gilbert * - can happen if source has a larger MAC table.; post-load 3121982b78c5SDr. David Alan Gilbert * sets flags in this case. 3122982b78c5SDr. David Alan Gilbert */ 3123982b78c5SDr. David Alan Gilbert VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet, 3124982b78c5SDr. David Alan Gilbert 0, mac_table_fits, mac_table.in_use, 3125982b78c5SDr. David Alan Gilbert ETH_ALEN), 3126982b78c5SDr. David Alan Gilbert VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0, 3127982b78c5SDr. David Alan Gilbert mac_table.in_use, ETH_ALEN), 3128982b78c5SDr. David Alan Gilbert 3129982b78c5SDr. David Alan Gilbert /* Note: This is an array of uint32's that's always been saved as a 3130982b78c5SDr. David Alan Gilbert * buffer; hold onto your endiannesses; it's actually used as a bitmap 3131982b78c5SDr. David Alan Gilbert * but based on the uint. 3132982b78c5SDr. David Alan Gilbert */ 3133982b78c5SDr. David Alan Gilbert VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3), 3134982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3135982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_vnet), 3136982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet), 3137982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet), 3138982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(alluni, VirtIONet), 3139982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nomulti, VirtIONet), 3140982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nouni, VirtIONet), 3141982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nobcast, VirtIONet), 3142982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3143982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_ufo), 3144441537f1SJason Wang VMSTATE_SINGLE_TEST(max_queue_pairs, VirtIONet, max_queue_pairs_gt_1, 0, 3145982b78c5SDr. David Alan Gilbert vmstate_info_uint16_equal, uint16_t), 3146441537f1SJason Wang VMSTATE_UINT16_TEST(curr_queue_pairs, VirtIONet, max_queue_pairs_gt_1), 3147982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3148982b78c5SDr. David Alan Gilbert vmstate_virtio_net_tx_waiting), 3149982b78c5SDr. David Alan Gilbert VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet, 3150982b78c5SDr. David Alan Gilbert has_ctrl_guest_offloads), 3151982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3152982b78c5SDr. David Alan Gilbert }, 3153e41b7114SYuri Benditovich .subsections = (const VMStateDescription * []) { 3154e41b7114SYuri Benditovich &vmstate_virtio_net_rss, 3155e41b7114SYuri Benditovich NULL 3156e41b7114SYuri Benditovich } 3157982b78c5SDr. David Alan Gilbert }; 3158982b78c5SDr. David Alan Gilbert 31596e790746SPaolo Bonzini static NetClientInfo net_virtio_info = { 3160f394b2e2SEric Blake .type = NET_CLIENT_DRIVER_NIC, 31616e790746SPaolo Bonzini .size = sizeof(NICState), 31626e790746SPaolo Bonzini .can_receive = virtio_net_can_receive, 31636e790746SPaolo Bonzini .receive = virtio_net_receive, 31646e790746SPaolo Bonzini .link_status_changed = virtio_net_set_link_status, 3165b1be4280SAmos Kong .query_rx_filter = virtio_net_query_rxfilter, 3166b2c929f0SDr. David Alan Gilbert .announce = virtio_net_announce, 31676e790746SPaolo Bonzini }; 31686e790746SPaolo Bonzini 31696e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx) 31706e790746SPaolo Bonzini { 317117a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 31726e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx)); 31736e790746SPaolo Bonzini assert(n->vhost_started); 3174ed8b4afeSNikolay Nikolaev return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx); 31756e790746SPaolo Bonzini } 31766e790746SPaolo Bonzini 31776e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx, 31786e790746SPaolo Bonzini bool mask) 31796e790746SPaolo Bonzini { 318017a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 31816e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx)); 31826e790746SPaolo Bonzini assert(n->vhost_started); 3183a882b571SMichael S. Tsirkin vhost_net_virtqueue_mask(get_vhost_net(nc->peer), 3184a882b571SMichael S. Tsirkin vdev, idx, mask); 31856e790746SPaolo Bonzini } 31866e790746SPaolo Bonzini 3187019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features) 31886e790746SPaolo Bonzini { 31890cd09c3aSCornelia Huck virtio_add_feature(&host_features, VIRTIO_NET_F_MAC); 3190a93e599dSMaxime Coquelin 3191ba550851SStefano Garzarella n->config_size = virtio_feature_get_config_size(feature_sizes, 3192ba550851SStefano Garzarella host_features); 319317ec5a86SKONRAD Frederic } 31946e790746SPaolo Bonzini 31958a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name, 31968a253ec2SKONRAD Frederic const char *type) 31978a253ec2SKONRAD Frederic { 31988a253ec2SKONRAD Frederic /* 31998a253ec2SKONRAD Frederic * The name can be NULL, the netclient name will be type.x. 32008a253ec2SKONRAD Frederic */ 32018a253ec2SKONRAD Frederic assert(type != NULL); 32028a253ec2SKONRAD Frederic 32038a253ec2SKONRAD Frederic g_free(n->netclient_name); 32048a253ec2SKONRAD Frederic g_free(n->netclient_type); 32058a253ec2SKONRAD Frederic n->netclient_name = g_strdup(name); 32068a253ec2SKONRAD Frederic n->netclient_type = g_strdup(type); 32078a253ec2SKONRAD Frederic } 32088a253ec2SKONRAD Frederic 32090e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev) 32109711cd0dSJens Freimann { 32119711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 32129711cd0dSJens Freimann PCIDevice *pci_dev; 32139711cd0dSJens Freimann Error *err = NULL; 32149711cd0dSJens Freimann 32150e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 32169711cd0dSJens Freimann if (hotplug_ctrl) { 32170e9a65c5SJuan Quintela pci_dev = PCI_DEVICE(dev); 32189711cd0dSJens Freimann pci_dev->partially_hotplugged = true; 32190e9a65c5SJuan Quintela hotplug_handler_unplug_request(hotplug_ctrl, dev, &err); 32209711cd0dSJens Freimann if (err) { 32219711cd0dSJens Freimann error_report_err(err); 32229711cd0dSJens Freimann return false; 32239711cd0dSJens Freimann } 32249711cd0dSJens Freimann } else { 32259711cd0dSJens Freimann return false; 32269711cd0dSJens Freimann } 32279711cd0dSJens Freimann return true; 32289711cd0dSJens Freimann } 32299711cd0dSJens Freimann 32300e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev, 32310e9a65c5SJuan Quintela Error **errp) 32329711cd0dSJens Freimann { 32335a0948d3SMarkus Armbruster Error *err = NULL; 32349711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 32350e9a65c5SJuan Quintela PCIDevice *pdev = PCI_DEVICE(dev); 323678274682SJuan Quintela BusState *primary_bus; 32379711cd0dSJens Freimann 32389711cd0dSJens Freimann if (!pdev->partially_hotplugged) { 32399711cd0dSJens Freimann return true; 32409711cd0dSJens Freimann } 32410e9a65c5SJuan Quintela primary_bus = dev->parent_bus; 324278274682SJuan Quintela if (!primary_bus) { 3243150ab54aSJens Freimann error_setg(errp, "virtio_net: couldn't find primary bus"); 32445a0948d3SMarkus Armbruster return false; 32459711cd0dSJens Freimann } 32460e9a65c5SJuan Quintela qdev_set_parent_bus(dev, primary_bus, &error_abort); 3247e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 32480e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 32499711cd0dSJens Freimann if (hotplug_ctrl) { 32500e9a65c5SJuan Quintela hotplug_handler_pre_plug(hotplug_ctrl, dev, &err); 32515a0948d3SMarkus Armbruster if (err) { 32525a0948d3SMarkus Armbruster goto out; 32535a0948d3SMarkus Armbruster } 32540e9a65c5SJuan Quintela hotplug_handler_plug(hotplug_ctrl, dev, &err); 32559711cd0dSJens Freimann } 3256109c20eaSLaurent Vivier pdev->partially_hotplugged = false; 3257150ab54aSJens Freimann 3258150ab54aSJens Freimann out: 32595a0948d3SMarkus Armbruster error_propagate(errp, err); 32605a0948d3SMarkus Armbruster return !err; 32619711cd0dSJens Freimann } 32629711cd0dSJens Freimann 326307a5d816SJuan Quintela static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationState *s) 32649711cd0dSJens Freimann { 32659711cd0dSJens Freimann bool should_be_hidden; 32669711cd0dSJens Freimann Error *err = NULL; 326707a5d816SJuan Quintela DeviceState *dev = failover_find_primary_device(n); 326807a5d816SJuan Quintela 326907a5d816SJuan Quintela if (!dev) { 327007a5d816SJuan Quintela return; 327107a5d816SJuan Quintela } 32729711cd0dSJens Freimann 3273e2bde83eSJuan Quintela should_be_hidden = qatomic_read(&n->failover_primary_hidden); 32749711cd0dSJens Freimann 32754dbac1aeSMarkus Armbruster if (migration_in_setup(s) && !should_be_hidden) { 327607a5d816SJuan Quintela if (failover_unplug_primary(n, dev)) { 327707a5d816SJuan Quintela vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev); 327807a5d816SJuan Quintela qapi_event_send_unplug_primary(dev->id); 3279e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 32809711cd0dSJens Freimann } else { 32819711cd0dSJens Freimann warn_report("couldn't unplug primary device"); 32829711cd0dSJens Freimann } 32839711cd0dSJens Freimann } else if (migration_has_failed(s)) { 3284150ab54aSJens Freimann /* We already unplugged the device let's plug it back */ 328507a5d816SJuan Quintela if (!failover_replug_primary(n, dev, &err)) { 32869711cd0dSJens Freimann if (err) { 32879711cd0dSJens Freimann error_report_err(err); 32889711cd0dSJens Freimann } 32899711cd0dSJens Freimann } 32909711cd0dSJens Freimann } 32919711cd0dSJens Freimann } 32929711cd0dSJens Freimann 32939711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data) 32949711cd0dSJens Freimann { 32959711cd0dSJens Freimann MigrationState *s = data; 32969711cd0dSJens Freimann VirtIONet *n = container_of(notifier, VirtIONet, migration_state); 32979711cd0dSJens Freimann virtio_net_handle_migration_primary(n, s); 32989711cd0dSJens Freimann } 32999711cd0dSJens Freimann 3300b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener, 3301f3558b1bSKevin Wolf const QDict *device_opts, 3302f3558b1bSKevin Wolf bool from_json, 3303f3558b1bSKevin Wolf Error **errp) 33049711cd0dSJens Freimann { 33059711cd0dSJens Freimann VirtIONet *n = container_of(listener, VirtIONet, primary_listener); 33064f0303aeSJuan Quintela const char *standby_id; 33079711cd0dSJens Freimann 33084d0e59acSJens Freimann if (!device_opts) { 330989631fedSJuan Quintela return false; 33104d0e59acSJens Freimann } 3311bcfc906bSLaurent Vivier 3312bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "failover_pair_id")) { 3313bcfc906bSLaurent Vivier return false; 3314bcfc906bSLaurent Vivier } 3315bcfc906bSLaurent Vivier 3316bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "id")) { 3317bcfc906bSLaurent Vivier error_setg(errp, "Device with failover_pair_id needs to have id"); 3318bcfc906bSLaurent Vivier return false; 3319bcfc906bSLaurent Vivier } 3320bcfc906bSLaurent Vivier 3321bcfc906bSLaurent Vivier standby_id = qdict_get_str(device_opts, "failover_pair_id"); 332289631fedSJuan Quintela if (g_strcmp0(standby_id, n->netclient_name) != 0) { 332389631fedSJuan Quintela return false; 33249711cd0dSJens Freimann } 33259711cd0dSJens Freimann 33267fe7791eSLaurent Vivier /* 33277fe7791eSLaurent Vivier * The hide helper can be called several times for a given device. 33287fe7791eSLaurent Vivier * Check there is only one primary for a virtio-net device but 33297fe7791eSLaurent Vivier * don't duplicate the qdict several times if it's called for the same 33307fe7791eSLaurent Vivier * device. 33317fe7791eSLaurent Vivier */ 3332259a10dbSKevin Wolf if (n->primary_opts) { 33337fe7791eSLaurent Vivier const char *old, *new; 33347fe7791eSLaurent Vivier /* devices with failover_pair_id always have an id */ 33357fe7791eSLaurent Vivier old = qdict_get_str(n->primary_opts, "id"); 33367fe7791eSLaurent Vivier new = qdict_get_str(device_opts, "id"); 33377fe7791eSLaurent Vivier if (strcmp(old, new) != 0) { 33387fe7791eSLaurent Vivier error_setg(errp, "Cannot attach more than one primary device to " 33397fe7791eSLaurent Vivier "'%s': '%s' and '%s'", n->netclient_name, old, new); 3340259a10dbSKevin Wolf return false; 3341259a10dbSKevin Wolf } 33427fe7791eSLaurent Vivier } else { 3343f3558b1bSKevin Wolf n->primary_opts = qdict_clone_shallow(device_opts); 3344f3558b1bSKevin Wolf n->primary_opts_from_json = from_json; 33457fe7791eSLaurent Vivier } 3346259a10dbSKevin Wolf 3347e2bde83eSJuan Quintela /* failover_primary_hidden is set during feature negotiation */ 33483abad4a2SJuan Quintela return qatomic_read(&n->failover_primary_hidden); 33499711cd0dSJens Freimann } 33509711cd0dSJens Freimann 3351e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp) 335217ec5a86SKONRAD Frederic { 3353e6f746b3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3354284a32f0SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3355284a32f0SAndreas Färber NetClientState *nc; 33561773d9eeSKONRAD Frederic int i; 335717ec5a86SKONRAD Frederic 3358a93e599dSMaxime Coquelin if (n->net_conf.mtu) { 3359127833eeSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_MTU); 3360a93e599dSMaxime Coquelin } 3361a93e599dSMaxime Coquelin 33629473939eSJason Baron if (n->net_conf.duplex_str) { 33639473939eSJason Baron if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) { 33649473939eSJason Baron n->net_conf.duplex = DUPLEX_HALF; 33659473939eSJason Baron } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) { 33669473939eSJason Baron n->net_conf.duplex = DUPLEX_FULL; 33679473939eSJason Baron } else { 33689473939eSJason Baron error_setg(errp, "'duplex' must be 'half' or 'full'"); 3369843c4cfcSMarkus Armbruster return; 33709473939eSJason Baron } 33719473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 33729473939eSJason Baron } else { 33739473939eSJason Baron n->net_conf.duplex = DUPLEX_UNKNOWN; 33749473939eSJason Baron } 33759473939eSJason Baron 33769473939eSJason Baron if (n->net_conf.speed < SPEED_UNKNOWN) { 33779473939eSJason Baron error_setg(errp, "'speed' must be between 0 and INT_MAX"); 3378843c4cfcSMarkus Armbruster return; 3379843c4cfcSMarkus Armbruster } 3380843c4cfcSMarkus Armbruster if (n->net_conf.speed >= 0) { 33819473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 33829473939eSJason Baron } 33839473939eSJason Baron 33849711cd0dSJens Freimann if (n->failover) { 3385b91ad981SJuan Quintela n->primary_listener.hide_device = failover_hide_primary_device; 3386e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 33879711cd0dSJens Freimann device_listener_register(&n->primary_listener); 33889711cd0dSJens Freimann n->migration_state.notify = virtio_net_migration_state_notifier; 33899711cd0dSJens Freimann add_migration_state_change_notifier(&n->migration_state); 33909711cd0dSJens Freimann n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY); 33919711cd0dSJens Freimann } 33929711cd0dSJens Freimann 3393da3e8a23SShannon Zhao virtio_net_set_config_size(n, n->host_features); 3394284a32f0SAndreas Färber virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size); 339517ec5a86SKONRAD Frederic 33961c0fbfa3SMichael S. Tsirkin /* 33971c0fbfa3SMichael S. Tsirkin * We set a lower limit on RX queue size to what it always was. 33981c0fbfa3SMichael S. Tsirkin * Guests that want a smaller ring can always resize it without 33991c0fbfa3SMichael S. Tsirkin * help from us (using virtio 1 and up). 34001c0fbfa3SMichael S. Tsirkin */ 34011c0fbfa3SMichael S. Tsirkin if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE || 34021c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE || 34035f997fd1SMichal Privoznik !is_power_of_2(n->net_conf.rx_queue_size)) { 34041c0fbfa3SMichael S. Tsirkin error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), " 34051c0fbfa3SMichael S. Tsirkin "must be a power of 2 between %d and %d.", 34061c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE, 34071c0fbfa3SMichael S. Tsirkin VIRTQUEUE_MAX_SIZE); 34081c0fbfa3SMichael S. Tsirkin virtio_cleanup(vdev); 34091c0fbfa3SMichael S. Tsirkin return; 34101c0fbfa3SMichael S. Tsirkin } 34111c0fbfa3SMichael S. Tsirkin 34129b02e161SWei Wang if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE || 34139b02e161SWei Wang n->net_conf.tx_queue_size > VIRTQUEUE_MAX_SIZE || 34149b02e161SWei Wang !is_power_of_2(n->net_conf.tx_queue_size)) { 34159b02e161SWei Wang error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), " 34169b02e161SWei Wang "must be a power of 2 between %d and %d", 34179b02e161SWei Wang n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE, 34189b02e161SWei Wang VIRTQUEUE_MAX_SIZE); 34199b02e161SWei Wang virtio_cleanup(vdev); 34209b02e161SWei Wang return; 34219b02e161SWei Wang } 34229b02e161SWei Wang 342322288fe5SJason Wang n->max_ncs = MAX(n->nic_conf.peers.queues, 1); 342422288fe5SJason Wang 342522288fe5SJason Wang /* 342622288fe5SJason Wang * Figure out the datapath queue pairs since the backend could 342722288fe5SJason Wang * provide control queue via peers as well. 342822288fe5SJason Wang */ 342922288fe5SJason Wang if (n->nic_conf.peers.queues) { 343022288fe5SJason Wang for (i = 0; i < n->max_ncs; i++) { 343122288fe5SJason Wang if (n->nic_conf.peers.ncs[i]->is_datapath) { 343222288fe5SJason Wang ++n->max_queue_pairs; 343322288fe5SJason Wang } 343422288fe5SJason Wang } 343522288fe5SJason Wang } 343622288fe5SJason Wang n->max_queue_pairs = MAX(n->max_queue_pairs, 1); 343722288fe5SJason Wang 3438441537f1SJason Wang if (n->max_queue_pairs * 2 + 1 > VIRTIO_QUEUE_MAX) { 343922288fe5SJason Wang error_setg(errp, "Invalid number of queue pairs (= %" PRIu32 "), " 3440631b22eaSStefan Weil "must be a positive integer less than %d.", 3441441537f1SJason Wang n->max_queue_pairs, (VIRTIO_QUEUE_MAX - 1) / 2); 34427e0e736eSJason Wang virtio_cleanup(vdev); 34437e0e736eSJason Wang return; 34447e0e736eSJason Wang } 3445441537f1SJason Wang n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queue_pairs); 3446441537f1SJason Wang n->curr_queue_pairs = 1; 34471773d9eeSKONRAD Frederic n->tx_timeout = n->net_conf.txtimer; 34486e790746SPaolo Bonzini 34491773d9eeSKONRAD Frederic if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer") 34501773d9eeSKONRAD Frederic && strcmp(n->net_conf.tx, "bh")) { 34510765691eSMarkus Armbruster warn_report("virtio-net: " 34526e790746SPaolo Bonzini "Unknown option tx=%s, valid options: \"timer\" \"bh\"", 34531773d9eeSKONRAD Frederic n->net_conf.tx); 34540765691eSMarkus Armbruster error_printf("Defaulting to \"bh\""); 34556e790746SPaolo Bonzini } 34566e790746SPaolo Bonzini 34572eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n), 34582eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size); 34599b02e161SWei Wang 3460441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3461f9d6dbf0SWen Congyang virtio_net_add_queue(n, i); 3462da51a335SJason Wang } 3463da51a335SJason Wang 346417a0ca55SKONRAD Frederic n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 34651773d9eeSKONRAD Frederic qemu_macaddr_default_if_unset(&n->nic_conf.macaddr); 34661773d9eeSKONRAD Frederic memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac)); 34676e790746SPaolo Bonzini n->status = VIRTIO_NET_S_LINK_UP; 34689d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 34699d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 3470f57fcf70SJason Wang virtio_net_announce_timer, n); 3471b2c929f0SDr. David Alan Gilbert n->announce_timer.round = 0; 34726e790746SPaolo Bonzini 34738a253ec2SKONRAD Frederic if (n->netclient_type) { 34748a253ec2SKONRAD Frederic /* 34758a253ec2SKONRAD Frederic * Happen when virtio_net_set_netclient_name has been called. 34768a253ec2SKONRAD Frederic */ 34778a253ec2SKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 34788a253ec2SKONRAD Frederic n->netclient_type, n->netclient_name, n); 34798a253ec2SKONRAD Frederic } else { 34801773d9eeSKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 3481284a32f0SAndreas Färber object_get_typename(OBJECT(dev)), dev->id, n); 34828a253ec2SKONRAD Frederic } 34838a253ec2SKONRAD Frederic 3484441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3485d4c62930SBin Meng n->nic->ncs[i].do_not_pad = true; 3486d4c62930SBin Meng } 3487d4c62930SBin Meng 34886e790746SPaolo Bonzini peer_test_vnet_hdr(n); 34896e790746SPaolo Bonzini if (peer_has_vnet_hdr(n)) { 3490441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3491d6085e3aSStefan Hajnoczi qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true); 34926e790746SPaolo Bonzini } 34936e790746SPaolo Bonzini n->host_hdr_len = sizeof(struct virtio_net_hdr); 34946e790746SPaolo Bonzini } else { 34956e790746SPaolo Bonzini n->host_hdr_len = 0; 34966e790746SPaolo Bonzini } 34976e790746SPaolo Bonzini 34981773d9eeSKONRAD Frederic qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a); 34996e790746SPaolo Bonzini 35006e790746SPaolo Bonzini n->vqs[0].tx_waiting = 0; 35011773d9eeSKONRAD Frederic n->tx_burst = n->net_conf.txburst; 3502e22f0603SYuri Benditovich virtio_net_set_mrg_rx_bufs(n, 0, 0, 0); 35036e790746SPaolo Bonzini n->promisc = 1; /* for compatibility */ 35046e790746SPaolo Bonzini 35056e790746SPaolo Bonzini n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 35066e790746SPaolo Bonzini 35076e790746SPaolo Bonzini n->vlans = g_malloc0(MAX_VLAN >> 3); 35086e790746SPaolo Bonzini 3509b1be4280SAmos Kong nc = qemu_get_queue(n->nic); 3510b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 3511b1be4280SAmos Kong 3512e87936eaSCindy Lu if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 3513e87936eaSCindy Lu struct virtio_net_config netcfg = {}; 3514e87936eaSCindy Lu memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN); 3515e87936eaSCindy Lu vhost_net_set_config(get_vhost_net(nc->peer), 3516e87936eaSCindy Lu (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_MASTER); 3517e87936eaSCindy Lu } 35182974e916SYuri Benditovich QTAILQ_INIT(&n->rsc_chains); 3519284a32f0SAndreas Färber n->qdev = dev; 35204474e37aSYuri Benditovich 35214474e37aSYuri Benditovich net_rx_pkt_init(&n->rx_pkt, false); 35220145c393SAndrew Melnychenko 35230145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 35240145c393SAndrew Melnychenko virtio_net_load_ebpf(n); 35250145c393SAndrew Melnychenko } 352617ec5a86SKONRAD Frederic } 352717ec5a86SKONRAD Frederic 3528b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev) 352917ec5a86SKONRAD Frederic { 3530306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3531306ec6c3SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3532441537f1SJason Wang int i, max_queue_pairs; 353317ec5a86SKONRAD Frederic 35340145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 35350145c393SAndrew Melnychenko virtio_net_unload_ebpf(n); 35360145c393SAndrew Melnychenko } 35370145c393SAndrew Melnychenko 353817ec5a86SKONRAD Frederic /* This will stop vhost backend if appropriate. */ 353917ec5a86SKONRAD Frederic virtio_net_set_status(vdev, 0); 354017ec5a86SKONRAD Frederic 35418a253ec2SKONRAD Frederic g_free(n->netclient_name); 35428a253ec2SKONRAD Frederic n->netclient_name = NULL; 35438a253ec2SKONRAD Frederic g_free(n->netclient_type); 35448a253ec2SKONRAD Frederic n->netclient_type = NULL; 35458a253ec2SKONRAD Frederic 354617ec5a86SKONRAD Frederic g_free(n->mac_table.macs); 354717ec5a86SKONRAD Frederic g_free(n->vlans); 354817ec5a86SKONRAD Frederic 35499711cd0dSJens Freimann if (n->failover) { 3550f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 355165018100SJuan Quintela device_listener_unregister(&n->primary_listener); 35521e157667SLaurent Vivier remove_migration_state_change_notifier(&n->migration_state); 3553f3558b1bSKevin Wolf } else { 3554f3558b1bSKevin Wolf assert(n->primary_opts == NULL); 35559711cd0dSJens Freimann } 35569711cd0dSJens Freimann 3557441537f1SJason Wang max_queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3558441537f1SJason Wang for (i = 0; i < max_queue_pairs; i++) { 3559f9d6dbf0SWen Congyang virtio_net_del_queue(n, i); 356017ec5a86SKONRAD Frederic } 3561d945d9f1SYuri Benditovich /* delete also control vq */ 3562441537f1SJason Wang virtio_del_queue(vdev, max_queue_pairs * 2); 3563944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 356417ec5a86SKONRAD Frederic g_free(n->vqs); 356517ec5a86SKONRAD Frederic qemu_del_nic(n->nic); 35662974e916SYuri Benditovich virtio_net_rsc_cleanup(n); 356759079029SYuri Benditovich g_free(n->rss_data.indirections_table); 35684474e37aSYuri Benditovich net_rx_pkt_uninit(n->rx_pkt); 35696a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 357017ec5a86SKONRAD Frederic } 357117ec5a86SKONRAD Frederic 357217ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj) 357317ec5a86SKONRAD Frederic { 357417ec5a86SKONRAD Frederic VirtIONet *n = VIRTIO_NET(obj); 357517ec5a86SKONRAD Frederic 357617ec5a86SKONRAD Frederic /* 357717ec5a86SKONRAD Frederic * The default config_size is sizeof(struct virtio_net_config). 357817ec5a86SKONRAD Frederic * Can be overriden with virtio_net_set_config_size. 357917ec5a86SKONRAD Frederic */ 358017ec5a86SKONRAD Frederic n->config_size = sizeof(struct virtio_net_config); 3581aa4197c3SGonglei device_add_bootindex_property(obj, &n->nic_conf.bootindex, 3582aa4197c3SGonglei "bootindex", "/ethernet-phy@0", 358340c2281cSMarkus Armbruster DEVICE(n)); 35840145c393SAndrew Melnychenko 35850145c393SAndrew Melnychenko ebpf_rss_init(&n->ebpf_rss); 358617ec5a86SKONRAD Frederic } 358717ec5a86SKONRAD Frederic 358844b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque) 35894d45dcfbSHalil Pasic { 35904d45dcfbSHalil Pasic VirtIONet *n = opaque; 35914d45dcfbSHalil Pasic 35924d45dcfbSHalil Pasic /* At this point, backend must be stopped, otherwise 35934d45dcfbSHalil Pasic * it might keep writing to memory. */ 35944d45dcfbSHalil Pasic assert(!n->vhost_started); 359544b1ff31SDr. David Alan Gilbert 359644b1ff31SDr. David Alan Gilbert return 0; 35974d45dcfbSHalil Pasic } 35984d45dcfbSHalil Pasic 35999711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque) 36009711cd0dSJens Freimann { 36019711cd0dSJens Freimann DeviceState *dev = opaque; 360221e8709bSJuan Quintela DeviceState *primary; 36039711cd0dSJens Freimann VirtIODevice *vdev = VIRTIO_DEVICE(dev); 36049711cd0dSJens Freimann VirtIONet *n = VIRTIO_NET(vdev); 36059711cd0dSJens Freimann 3606284f42a5SJens Freimann if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) { 3607284f42a5SJens Freimann return false; 3608284f42a5SJens Freimann } 360921e8709bSJuan Quintela primary = failover_find_primary_device(n); 361021e8709bSJuan Quintela return primary ? primary->pending_deleted_event : false; 36119711cd0dSJens Freimann } 36129711cd0dSJens Freimann 36139711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque) 36149711cd0dSJens Freimann { 36159711cd0dSJens Freimann DeviceState *dev = opaque; 36169711cd0dSJens Freimann VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev); 36179711cd0dSJens Freimann 36189711cd0dSJens Freimann return vdc->primary_unplug_pending(dev); 36199711cd0dSJens Freimann } 36209711cd0dSJens Freimann 36214d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = { 36224d45dcfbSHalil Pasic .name = "virtio-net", 36234d45dcfbSHalil Pasic .minimum_version_id = VIRTIO_NET_VM_VERSION, 36244d45dcfbSHalil Pasic .version_id = VIRTIO_NET_VM_VERSION, 36254d45dcfbSHalil Pasic .fields = (VMStateField[]) { 36264d45dcfbSHalil Pasic VMSTATE_VIRTIO_DEVICE, 36274d45dcfbSHalil Pasic VMSTATE_END_OF_LIST() 36284d45dcfbSHalil Pasic }, 36294d45dcfbSHalil Pasic .pre_save = virtio_net_pre_save, 36309711cd0dSJens Freimann .dev_unplug_pending = dev_unplug_pending, 36314d45dcfbSHalil Pasic }; 3632290c2428SDr. David Alan Gilbert 363317ec5a86SKONRAD Frederic static Property virtio_net_properties[] = { 3634127833eeSJason Baron DEFINE_PROP_BIT64("csum", VirtIONet, host_features, 3635127833eeSJason Baron VIRTIO_NET_F_CSUM, true), 3636127833eeSJason Baron DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features, 363787108bb2SShannon Zhao VIRTIO_NET_F_GUEST_CSUM, true), 3638127833eeSJason Baron DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true), 3639127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features, 364087108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO4, true), 3641127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features, 364287108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO6, true), 3643127833eeSJason Baron DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features, 364487108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ECN, true), 3645127833eeSJason Baron DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features, 364687108bb2SShannon Zhao VIRTIO_NET_F_GUEST_UFO, true), 3647127833eeSJason Baron DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features, 364887108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ANNOUNCE, true), 3649127833eeSJason Baron DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features, 365087108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO4, true), 3651127833eeSJason Baron DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features, 365287108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO6, true), 3653127833eeSJason Baron DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features, 365487108bb2SShannon Zhao VIRTIO_NET_F_HOST_ECN, true), 3655127833eeSJason Baron DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features, 365687108bb2SShannon Zhao VIRTIO_NET_F_HOST_UFO, true), 3657127833eeSJason Baron DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features, 365887108bb2SShannon Zhao VIRTIO_NET_F_MRG_RXBUF, true), 3659127833eeSJason Baron DEFINE_PROP_BIT64("status", VirtIONet, host_features, 366087108bb2SShannon Zhao VIRTIO_NET_F_STATUS, true), 3661127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features, 366287108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VQ, true), 3663127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features, 366487108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX, true), 3665127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features, 366687108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VLAN, true), 3667127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features, 366887108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX_EXTRA, true), 3669127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features, 367087108bb2SShannon Zhao VIRTIO_NET_F_CTRL_MAC_ADDR, true), 3671127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features, 367287108bb2SShannon Zhao VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true), 3673127833eeSJason Baron DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false), 367459079029SYuri Benditovich DEFINE_PROP_BIT64("rss", VirtIONet, host_features, 367559079029SYuri Benditovich VIRTIO_NET_F_RSS, false), 3676e22f0603SYuri Benditovich DEFINE_PROP_BIT64("hash", VirtIONet, host_features, 3677e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT, false), 36782974e916SYuri Benditovich DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features, 36792974e916SYuri Benditovich VIRTIO_NET_F_RSC_EXT, false), 36802974e916SYuri Benditovich DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout, 36812974e916SYuri Benditovich VIRTIO_NET_RSC_DEFAULT_INTERVAL), 368217ec5a86SKONRAD Frederic DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf), 368317ec5a86SKONRAD Frederic DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer, 368417ec5a86SKONRAD Frederic TX_TIMER_INTERVAL), 368517ec5a86SKONRAD Frederic DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST), 368617ec5a86SKONRAD Frederic DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx), 36871c0fbfa3SMichael S. Tsirkin DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size, 36881c0fbfa3SMichael S. Tsirkin VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE), 36899b02e161SWei Wang DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size, 36909b02e161SWei Wang VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE), 3691a93e599dSMaxime Coquelin DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0), 369275ebec11SMaxime Coquelin DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend, 369375ebec11SMaxime Coquelin true), 36949473939eSJason Baron DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN), 36959473939eSJason Baron DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str), 36969711cd0dSJens Freimann DEFINE_PROP_BOOL("failover", VirtIONet, failover, false), 369717ec5a86SKONRAD Frederic DEFINE_PROP_END_OF_LIST(), 369817ec5a86SKONRAD Frederic }; 369917ec5a86SKONRAD Frederic 370017ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data) 370117ec5a86SKONRAD Frederic { 370217ec5a86SKONRAD Frederic DeviceClass *dc = DEVICE_CLASS(klass); 370317ec5a86SKONRAD Frederic VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 3704e6f746b3SAndreas Färber 37054f67d30bSMarc-André Lureau device_class_set_props(dc, virtio_net_properties); 3706290c2428SDr. David Alan Gilbert dc->vmsd = &vmstate_virtio_net; 3707125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_NETWORK, dc->categories); 3708e6f746b3SAndreas Färber vdc->realize = virtio_net_device_realize; 3709306ec6c3SAndreas Färber vdc->unrealize = virtio_net_device_unrealize; 371017ec5a86SKONRAD Frederic vdc->get_config = virtio_net_get_config; 371117ec5a86SKONRAD Frederic vdc->set_config = virtio_net_set_config; 371217ec5a86SKONRAD Frederic vdc->get_features = virtio_net_get_features; 371317ec5a86SKONRAD Frederic vdc->set_features = virtio_net_set_features; 371417ec5a86SKONRAD Frederic vdc->bad_features = virtio_net_bad_features; 371517ec5a86SKONRAD Frederic vdc->reset = virtio_net_reset; 371617ec5a86SKONRAD Frederic vdc->set_status = virtio_net_set_status; 371717ec5a86SKONRAD Frederic vdc->guest_notifier_mask = virtio_net_guest_notifier_mask; 371817ec5a86SKONRAD Frederic vdc->guest_notifier_pending = virtio_net_guest_notifier_pending; 37192a083ffdSMichael S. Tsirkin vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO); 37207788c3f2SMikhail Sennikovsky vdc->post_load = virtio_net_post_load_virtio; 3721982b78c5SDr. David Alan Gilbert vdc->vmsd = &vmstate_virtio_net_device; 37229711cd0dSJens Freimann vdc->primary_unplug_pending = primary_unplug_pending; 372317ec5a86SKONRAD Frederic } 372417ec5a86SKONRAD Frederic 372517ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = { 372617ec5a86SKONRAD Frederic .name = TYPE_VIRTIO_NET, 372717ec5a86SKONRAD Frederic .parent = TYPE_VIRTIO_DEVICE, 372817ec5a86SKONRAD Frederic .instance_size = sizeof(VirtIONet), 372917ec5a86SKONRAD Frederic .instance_init = virtio_net_instance_init, 373017ec5a86SKONRAD Frederic .class_init = virtio_net_class_init, 373117ec5a86SKONRAD Frederic }; 373217ec5a86SKONRAD Frederic 373317ec5a86SKONRAD Frederic static void virtio_register_types(void) 373417ec5a86SKONRAD Frederic { 373517ec5a86SKONRAD Frederic type_register_static(&virtio_net_info); 373617ec5a86SKONRAD Frederic } 373717ec5a86SKONRAD Frederic 373817ec5a86SKONRAD Frederic type_init(virtio_register_types) 3739