16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Network Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 149b8bfe21SPeter Maydell #include "qemu/osdep.h" 159711cd0dSJens Freimann #include "qemu/atomic.h" 166e790746SPaolo Bonzini #include "qemu/iov.h" 17db725815SMarkus Armbruster #include "qemu/main-loop.h" 180b8fa32fSMarkus Armbruster #include "qemu/module.h" 196e790746SPaolo Bonzini #include "hw/virtio/virtio.h" 206e790746SPaolo Bonzini #include "net/net.h" 216e790746SPaolo Bonzini #include "net/checksum.h" 226e790746SPaolo Bonzini #include "net/tap.h" 236e790746SPaolo Bonzini #include "qemu/error-report.h" 246e790746SPaolo Bonzini #include "qemu/timer.h" 259711cd0dSJens Freimann #include "qemu/option.h" 269711cd0dSJens Freimann #include "qemu/option_int.h" 279711cd0dSJens Freimann #include "qemu/config-file.h" 289711cd0dSJens Freimann #include "qapi/qmp/qdict.h" 296e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h" 306e790746SPaolo Bonzini #include "net/vhost_net.h" 319d8c6a25SDr. 
David Alan Gilbert #include "net/announce.h" 3217ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h" 33e688df6bSMarkus Armbruster #include "qapi/error.h" 349af23989SMarkus Armbruster #include "qapi/qapi-events-net.h" 35a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h" 369711cd0dSJens Freimann #include "qapi/qapi-types-migration.h" 379711cd0dSJens Freimann #include "qapi/qapi-events-migration.h" 381399c60dSRusty Russell #include "hw/virtio/virtio-access.h" 39f8d806c9SJuan Quintela #include "migration/misc.h" 409473939eSJason Baron #include "standard-headers/linux/ethtool.h" 412f780b6aSMarkus Armbruster #include "sysemu/sysemu.h" 429d8c6a25SDr. David Alan Gilbert #include "trace.h" 439711cd0dSJens Freimann #include "monitor/qdev.h" 449711cd0dSJens Freimann #include "hw/pci/pci.h" 454474e37aSYuri Benditovich #include "net_rx_pkt.h" 46108a6481SCindy Lu #include "hw/virtio/vhost.h" 476e790746SPaolo Bonzini 486e790746SPaolo Bonzini #define VIRTIO_NET_VM_VERSION 11 496e790746SPaolo Bonzini 506e790746SPaolo Bonzini #define MAC_TABLE_ENTRIES 64 516e790746SPaolo Bonzini #define MAX_VLAN (1 << 12) /* Per 802.1Q definition */ 526e790746SPaolo Bonzini 531c0fbfa3SMichael S. Tsirkin /* previously fixed value */ 541c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256 559b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256 569b02e161SWei Wang 57441537f1SJason Wang /* for now, only allow larger queue_pairs; with virtio-1, guest can downsize */ 581c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 599b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 601c0fbfa3SMichael S. 
Tsirkin 612974e916SYuri Benditovich #define VIRTIO_NET_IP4_ADDR_SIZE 8 /* ipv4 saddr + daddr */ 622974e916SYuri Benditovich 632974e916SYuri Benditovich #define VIRTIO_NET_TCP_FLAG 0x3F 642974e916SYuri Benditovich #define VIRTIO_NET_TCP_HDR_LENGTH 0xF000 652974e916SYuri Benditovich 662974e916SYuri Benditovich /* IPv4 max payload, 16 bits in the header */ 672974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header)) 682974e916SYuri Benditovich #define VIRTIO_NET_MAX_TCP_PAYLOAD 65535 692974e916SYuri Benditovich 702974e916SYuri Benditovich /* header length value in ip header without option */ 712974e916SYuri Benditovich #define VIRTIO_NET_IP4_HEADER_LENGTH 5 722974e916SYuri Benditovich 732974e916SYuri Benditovich #define VIRTIO_NET_IP6_ADDR_SIZE 32 /* ipv6 saddr + daddr */ 742974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD 752974e916SYuri Benditovich 762974e916SYuri Benditovich /* Purge coalesced packets timer interval, This value affects the performance 772974e916SYuri Benditovich a lot, and should be tuned carefully, '300000'(300us) is the recommended 782974e916SYuri Benditovich value to pass the WHQL test, '50000' can gain 2x netperf throughput with 792974e916SYuri Benditovich tso/gso/gro 'off'. 
*/ 802974e916SYuri Benditovich #define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000 812974e916SYuri Benditovich 8259079029SYuri Benditovich #define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \ 8359079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \ 8459079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \ 8559079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \ 8659079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \ 8759079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \ 8859079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \ 8959079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \ 9059079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) 9159079029SYuri Benditovich 92ad6461adSPhilippe Mathieu-Daudé static const VirtIOFeature feature_sizes[] = { 93127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MAC, 945d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mac)}, 95127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_STATUS, 965d5b33c0SMax Reitz .end = endof(struct virtio_net_config, status)}, 97127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MQ, 985d5b33c0SMax Reitz .end = endof(struct virtio_net_config, max_virtqueue_pairs)}, 99127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MTU, 1005d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mtu)}, 1019473939eSJason Baron {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX, 1025d5b33c0SMax Reitz .end = endof(struct virtio_net_config, duplex)}, 103e22f0603SYuri Benditovich {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT), 10459079029SYuri Benditovich .end = endof(struct virtio_net_config, supported_hash_types)}, 1056e790746SPaolo Bonzini {} 1066e790746SPaolo Bonzini }; 1076e790746SPaolo Bonzini 1086e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc) 1096e790746SPaolo Bonzini { 1106e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1116e790746SPaolo Bonzini 1126e790746SPaolo 
Bonzini return &n->vqs[nc->queue_index]; 1136e790746SPaolo Bonzini } 1146e790746SPaolo Bonzini 1156e790746SPaolo Bonzini static int vq2q(int queue_index) 1166e790746SPaolo Bonzini { 1176e790746SPaolo Bonzini return queue_index / 2; 1186e790746SPaolo Bonzini } 1196e790746SPaolo Bonzini 1206e790746SPaolo Bonzini /* TODO 1216e790746SPaolo Bonzini * - we could suppress RX interrupt if we were so inclined. 1226e790746SPaolo Bonzini */ 1236e790746SPaolo Bonzini 1246e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config) 1256e790746SPaolo Bonzini { 12617a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1276e790746SPaolo Bonzini struct virtio_net_config netcfg; 128c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 129fb592882SCindy Lu static const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } }; 1306e790746SPaolo Bonzini 131108a6481SCindy Lu int ret = 0; 132108a6481SCindy Lu memset(&netcfg, 0 , sizeof(struct virtio_net_config)); 1331399c60dSRusty Russell virtio_stw_p(vdev, &netcfg.status, n->status); 134441537f1SJason Wang virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queue_pairs); 135a93e599dSMaxime Coquelin virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu); 1366e790746SPaolo Bonzini memcpy(netcfg.mac, n->mac, ETH_ALEN); 1379473939eSJason Baron virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed); 1389473939eSJason Baron netcfg.duplex = n->net_conf.duplex; 13959079029SYuri Benditovich netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE; 14059079029SYuri Benditovich virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length, 141e22f0603SYuri Benditovich virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ? 
142e22f0603SYuri Benditovich VIRTIO_NET_RSS_MAX_TABLE_LEN : 1); 14359079029SYuri Benditovich virtio_stl_p(vdev, &netcfg.supported_hash_types, 14459079029SYuri Benditovich VIRTIO_NET_RSS_SUPPORTED_HASHES); 1456e790746SPaolo Bonzini memcpy(config, &netcfg, n->config_size); 146108a6481SCindy Lu 147c546ecf2SJason Wang /* 148c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 149c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 150c546ecf2SJason Wang */ 151c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 152108a6481SCindy Lu ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg, 153108a6481SCindy Lu n->config_size); 154108a6481SCindy Lu if (ret != -1) { 155fb592882SCindy Lu /* 156fb592882SCindy Lu * Some NIC/kernel combinations present 0 as the mac address. As 157fb592882SCindy Lu * that is not a legal address, try to proceed with the 158fb592882SCindy Lu * address from the QEMU command line in the hope that the 159fb592882SCindy Lu * address has been configured correctly elsewhere - just not 160fb592882SCindy Lu * reported by the device. 161fb592882SCindy Lu */ 162fb592882SCindy Lu if (memcmp(&netcfg.mac, &zero, sizeof(zero)) == 0) { 163fb592882SCindy Lu info_report("Zero hardware mac address detected. 
Ignoring."); 164fb592882SCindy Lu memcpy(netcfg.mac, n->mac, ETH_ALEN); 165fb592882SCindy Lu } 166108a6481SCindy Lu memcpy(config, &netcfg, n->config_size); 167108a6481SCindy Lu } 168108a6481SCindy Lu } 1696e790746SPaolo Bonzini } 1706e790746SPaolo Bonzini 1716e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config) 1726e790746SPaolo Bonzini { 17317a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1746e790746SPaolo Bonzini struct virtio_net_config netcfg = {}; 175c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 1766e790746SPaolo Bonzini 1776e790746SPaolo Bonzini memcpy(&netcfg, config, n->config_size); 1786e790746SPaolo Bonzini 17995129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) && 18095129d6fSCornelia Huck !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) && 1816e790746SPaolo Bonzini memcmp(netcfg.mac, n->mac, ETH_ALEN)) { 1826e790746SPaolo Bonzini memcpy(n->mac, netcfg.mac, ETH_ALEN); 1836e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 1846e790746SPaolo Bonzini } 185108a6481SCindy Lu 186c546ecf2SJason Wang /* 187c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 188c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 
189c546ecf2SJason Wang */ 190c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 191c546ecf2SJason Wang vhost_net_set_config(get_vhost_net(nc->peer), 192c546ecf2SJason Wang (uint8_t *)&netcfg, 0, n->config_size, 193108a6481SCindy Lu VHOST_SET_CONFIG_TYPE_MASTER); 194108a6481SCindy Lu } 1956e790746SPaolo Bonzini } 1966e790746SPaolo Bonzini 1976e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status) 1986e790746SPaolo Bonzini { 19917a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2006e790746SPaolo Bonzini return (status & VIRTIO_CONFIG_S_DRIVER_OK) && 20117a0ca55SKONRAD Frederic (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running; 2026e790746SPaolo Bonzini } 2036e790746SPaolo Bonzini 204b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net) 205b2c929f0SDr. David Alan Gilbert { 206b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(net); 207b2c929f0SDr. David Alan Gilbert trace_virtio_net_announce_notify(); 208b2c929f0SDr. David Alan Gilbert 209b2c929f0SDr. David Alan Gilbert net->status |= VIRTIO_NET_S_ANNOUNCE; 210b2c929f0SDr. David Alan Gilbert virtio_notify_config(vdev); 211b2c929f0SDr. David Alan Gilbert } 212b2c929f0SDr. David Alan Gilbert 213f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque) 214f57fcf70SJason Wang { 215f57fcf70SJason Wang VirtIONet *n = opaque; 2169d8c6a25SDr. David Alan Gilbert trace_virtio_net_announce_timer(n->announce_timer.round); 217f57fcf70SJason Wang 2189d8c6a25SDr. David Alan Gilbert n->announce_timer.round--; 219b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 220b2c929f0SDr. David Alan Gilbert } 221b2c929f0SDr. David Alan Gilbert 222b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc) 223b2c929f0SDr. David Alan Gilbert { 224b2c929f0SDr. David Alan Gilbert VirtIONet *n = qemu_get_nic_opaque(nc); 225b2c929f0SDr. 
David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 226b2c929f0SDr. David Alan Gilbert 227b2c929f0SDr. David Alan Gilbert /* 228b2c929f0SDr. David Alan Gilbert * Make sure the virtio migration announcement timer isn't running 229b2c929f0SDr. David Alan Gilbert * If it is, let it trigger announcement so that we do not cause 230b2c929f0SDr. David Alan Gilbert * confusion. 231b2c929f0SDr. David Alan Gilbert */ 232b2c929f0SDr. David Alan Gilbert if (n->announce_timer.round) { 233b2c929f0SDr. David Alan Gilbert return; 234b2c929f0SDr. David Alan Gilbert } 235b2c929f0SDr. David Alan Gilbert 236b2c929f0SDr. David Alan Gilbert if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 237b2c929f0SDr. David Alan Gilbert virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 238b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 239b2c929f0SDr. David Alan Gilbert } 240f57fcf70SJason Wang } 241f57fcf70SJason Wang 2426e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status) 2436e790746SPaolo Bonzini { 24417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2456e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 246441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 247*22288fe5SJason Wang int cvq = n->max_ncs - n->max_queue_pairs; 2486e790746SPaolo Bonzini 249ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 2506e790746SPaolo Bonzini return; 2516e790746SPaolo Bonzini } 2526e790746SPaolo Bonzini 2538c1ac475SRadim Krčmář if ((virtio_net_started(n, status) && !nc->peer->link_down) == 2548c1ac475SRadim Krčmář !!n->vhost_started) { 2556e790746SPaolo Bonzini return; 2566e790746SPaolo Bonzini } 2576e790746SPaolo Bonzini if (!n->vhost_started) { 258086abc1cSMichael S. Tsirkin int r, i; 259086abc1cSMichael S. 
Tsirkin 2601bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 2611bfa316cSGreg Kurz error_report("backend does not support %s vnet headers; " 2621bfa316cSGreg Kurz "falling back on userspace virtio", 2631bfa316cSGreg Kurz virtio_is_big_endian(vdev) ? "BE" : "LE"); 2641bfa316cSGreg Kurz return; 2651bfa316cSGreg Kurz } 2661bfa316cSGreg Kurz 267086abc1cSMichael S. Tsirkin /* Any packets outstanding? Purge them to avoid touching rings 268086abc1cSMichael S. Tsirkin * when vhost is running. 269086abc1cSMichael S. Tsirkin */ 270441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 271086abc1cSMichael S. Tsirkin NetClientState *qnc = qemu_get_subqueue(n->nic, i); 272086abc1cSMichael S. Tsirkin 273086abc1cSMichael S. Tsirkin /* Purge both directions: TX and RX. */ 274086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->peer->incoming_queue, qnc); 275086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->incoming_queue, qnc->peer); 276086abc1cSMichael S. Tsirkin } 277086abc1cSMichael S. Tsirkin 278a93e599dSMaxime Coquelin if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) { 279a93e599dSMaxime Coquelin r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu); 280a93e599dSMaxime Coquelin if (r < 0) { 281a93e599dSMaxime Coquelin error_report("%uBytes MTU not supported by the backend", 282a93e599dSMaxime Coquelin n->net_conf.mtu); 283a93e599dSMaxime Coquelin 284a93e599dSMaxime Coquelin return; 285a93e599dSMaxime Coquelin } 286a93e599dSMaxime Coquelin } 287a93e599dSMaxime Coquelin 2886e790746SPaolo Bonzini n->vhost_started = 1; 289*22288fe5SJason Wang r = vhost_net_start(vdev, n->nic->ncs, queue_pairs, cvq); 2906e790746SPaolo Bonzini if (r < 0) { 2916e790746SPaolo Bonzini error_report("unable to start vhost net: %d: " 2926e790746SPaolo Bonzini "falling back on userspace virtio", -r); 2936e790746SPaolo Bonzini n->vhost_started = 0; 2946e790746SPaolo Bonzini } 2956e790746SPaolo Bonzini } else { 296*22288fe5SJason Wang vhost_net_stop(vdev, n->nic->ncs, 
queue_pairs, cvq); 2976e790746SPaolo Bonzini n->vhost_started = 0; 2986e790746SPaolo Bonzini } 2996e790746SPaolo Bonzini } 3006e790746SPaolo Bonzini 3011bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev, 3021bfa316cSGreg Kurz NetClientState *peer, 3031bfa316cSGreg Kurz bool enable) 3041bfa316cSGreg Kurz { 3051bfa316cSGreg Kurz if (virtio_is_big_endian(vdev)) { 3061bfa316cSGreg Kurz return qemu_set_vnet_be(peer, enable); 3071bfa316cSGreg Kurz } else { 3081bfa316cSGreg Kurz return qemu_set_vnet_le(peer, enable); 3091bfa316cSGreg Kurz } 3101bfa316cSGreg Kurz } 3111bfa316cSGreg Kurz 3121bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs, 313441537f1SJason Wang int queue_pairs, bool enable) 3141bfa316cSGreg Kurz { 3151bfa316cSGreg Kurz int i; 3161bfa316cSGreg Kurz 317441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 3181bfa316cSGreg Kurz if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 && 3191bfa316cSGreg Kurz enable) { 3201bfa316cSGreg Kurz while (--i >= 0) { 3211bfa316cSGreg Kurz virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false); 3221bfa316cSGreg Kurz } 3231bfa316cSGreg Kurz 3241bfa316cSGreg Kurz return true; 3251bfa316cSGreg Kurz } 3261bfa316cSGreg Kurz } 3271bfa316cSGreg Kurz 3281bfa316cSGreg Kurz return false; 3291bfa316cSGreg Kurz } 3301bfa316cSGreg Kurz 3311bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status) 3321bfa316cSGreg Kurz { 3331bfa316cSGreg Kurz VirtIODevice *vdev = VIRTIO_DEVICE(n); 334441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3351bfa316cSGreg Kurz 3361bfa316cSGreg Kurz if (virtio_net_started(n, status)) { 3371bfa316cSGreg Kurz /* Before using the device, we tell the network backend about the 3381bfa316cSGreg Kurz * endianness to use when parsing vnet headers. 
If the backend 3391bfa316cSGreg Kurz * can't do it, we fallback onto fixing the headers in the core 3401bfa316cSGreg Kurz * virtio-net code. 3411bfa316cSGreg Kurz */ 3421bfa316cSGreg Kurz n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs, 343441537f1SJason Wang queue_pairs, true); 3441bfa316cSGreg Kurz } else if (virtio_net_started(n, vdev->status)) { 3451bfa316cSGreg Kurz /* After using the device, we need to reset the network backend to 3461bfa316cSGreg Kurz * the default (guest native endianness), otherwise the guest may 3471bfa316cSGreg Kurz * lose network connectivity if it is rebooted into a different 3481bfa316cSGreg Kurz * endianness. 3491bfa316cSGreg Kurz */ 350441537f1SJason Wang virtio_net_set_vnet_endian(vdev, n->nic->ncs, queue_pairs, false); 3511bfa316cSGreg Kurz } 3521bfa316cSGreg Kurz } 3531bfa316cSGreg Kurz 354283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq) 355283e2c2aSYuri Benditovich { 356283e2c2aSYuri Benditovich unsigned int dropped = virtqueue_drop_all(vq); 357283e2c2aSYuri Benditovich if (dropped) { 358283e2c2aSYuri Benditovich virtio_notify(vdev, vq); 359283e2c2aSYuri Benditovich } 360283e2c2aSYuri Benditovich } 361283e2c2aSYuri Benditovich 3626e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status) 3636e790746SPaolo Bonzini { 36417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 3656e790746SPaolo Bonzini VirtIONetQueue *q; 3666e790746SPaolo Bonzini int i; 3676e790746SPaolo Bonzini uint8_t queue_status; 3686e790746SPaolo Bonzini 3691bfa316cSGreg Kurz virtio_net_vnet_endian_status(n, status); 3706e790746SPaolo Bonzini virtio_net_vhost_status(n, status); 3716e790746SPaolo Bonzini 372441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 37338705bb5SFam Zheng NetClientState *ncs = qemu_get_subqueue(n->nic, i); 37438705bb5SFam Zheng bool queue_started; 3756e790746SPaolo Bonzini q = &n->vqs[i]; 3766e790746SPaolo 
Bonzini 377441537f1SJason Wang if ((!n->multiqueue && i != 0) || i >= n->curr_queue_pairs) { 3786e790746SPaolo Bonzini queue_status = 0; 3796e790746SPaolo Bonzini } else { 3806e790746SPaolo Bonzini queue_status = status; 3816e790746SPaolo Bonzini } 38238705bb5SFam Zheng queue_started = 38338705bb5SFam Zheng virtio_net_started(n, queue_status) && !n->vhost_started; 38438705bb5SFam Zheng 38538705bb5SFam Zheng if (queue_started) { 38638705bb5SFam Zheng qemu_flush_queued_packets(ncs); 38738705bb5SFam Zheng } 3886e790746SPaolo Bonzini 3896e790746SPaolo Bonzini if (!q->tx_waiting) { 3906e790746SPaolo Bonzini continue; 3916e790746SPaolo Bonzini } 3926e790746SPaolo Bonzini 39338705bb5SFam Zheng if (queue_started) { 3946e790746SPaolo Bonzini if (q->tx_timer) { 395bc72ad67SAlex Bligh timer_mod(q->tx_timer, 396bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 3976e790746SPaolo Bonzini } else { 3986e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 3996e790746SPaolo Bonzini } 4006e790746SPaolo Bonzini } else { 4016e790746SPaolo Bonzini if (q->tx_timer) { 402bc72ad67SAlex Bligh timer_del(q->tx_timer); 4036e790746SPaolo Bonzini } else { 4046e790746SPaolo Bonzini qemu_bh_cancel(q->tx_bh); 4056e790746SPaolo Bonzini } 406283e2c2aSYuri Benditovich if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 && 40770e53e6eSJason Wang (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) && 40870e53e6eSJason Wang vdev->vm_running) { 409283e2c2aSYuri Benditovich /* if tx is waiting we are likely have some packets in tx queue 410283e2c2aSYuri Benditovich * and disabled notification */ 411283e2c2aSYuri Benditovich q->tx_waiting = 0; 412283e2c2aSYuri Benditovich virtio_queue_set_notification(q->tx_vq, 1); 413283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, q->tx_vq); 414283e2c2aSYuri Benditovich } 4156e790746SPaolo Bonzini } 4166e790746SPaolo Bonzini } 4176e790746SPaolo Bonzini } 4186e790746SPaolo Bonzini 4196e790746SPaolo Bonzini static void 
virtio_net_set_link_status(NetClientState *nc) 4206e790746SPaolo Bonzini { 4216e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 42217a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 4236e790746SPaolo Bonzini uint16_t old_status = n->status; 4246e790746SPaolo Bonzini 4256e790746SPaolo Bonzini if (nc->link_down) 4266e790746SPaolo Bonzini n->status &= ~VIRTIO_NET_S_LINK_UP; 4276e790746SPaolo Bonzini else 4286e790746SPaolo Bonzini n->status |= VIRTIO_NET_S_LINK_UP; 4296e790746SPaolo Bonzini 4306e790746SPaolo Bonzini if (n->status != old_status) 43117a0ca55SKONRAD Frederic virtio_notify_config(vdev); 4326e790746SPaolo Bonzini 43317a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 4346e790746SPaolo Bonzini } 4356e790746SPaolo Bonzini 436b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc) 437b1be4280SAmos Kong { 438b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 439b1be4280SAmos Kong 440b1be4280SAmos Kong if (nc->rxfilter_notify_enabled) { 441ddfb0baaSMarkus Armbruster char *path = object_get_canonical_path(OBJECT(n->qdev)); 44206150279SWenchao Xia qapi_event_send_nic_rx_filter_changed(!!n->netclient_name, 4433ab72385SPeter Xu n->netclient_name, path); 44496e35046SAmos Kong g_free(path); 445b1be4280SAmos Kong 446b1be4280SAmos Kong /* disable event notification to avoid events flooding */ 447b1be4280SAmos Kong nc->rxfilter_notify_enabled = 0; 448b1be4280SAmos Kong } 449b1be4280SAmos Kong } 450b1be4280SAmos Kong 451f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n) 452f7bc8ef8SAmos Kong { 45354aa3de7SEric Blake intList *list; 454f7bc8ef8SAmos Kong int i, j; 455f7bc8ef8SAmos Kong 456f7bc8ef8SAmos Kong list = NULL; 457f7bc8ef8SAmos Kong for (i = 0; i < MAX_VLAN >> 5; i++) { 458f7bc8ef8SAmos Kong for (j = 0; n->vlans[i] && j <= 0x1f; j++) { 459f7bc8ef8SAmos Kong if (n->vlans[i] & (1U << j)) { 46054aa3de7SEric Blake QAPI_LIST_PREPEND(list, (i << 5) + j); 461f7bc8ef8SAmos Kong } 462f7bc8ef8SAmos 
Kong } 463f7bc8ef8SAmos Kong } 464f7bc8ef8SAmos Kong 465f7bc8ef8SAmos Kong return list; 466f7bc8ef8SAmos Kong } 467f7bc8ef8SAmos Kong 468b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc) 469b1be4280SAmos Kong { 470b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 471f7bc8ef8SAmos Kong VirtIODevice *vdev = VIRTIO_DEVICE(n); 472b1be4280SAmos Kong RxFilterInfo *info; 47354aa3de7SEric Blake strList *str_list; 474f7bc8ef8SAmos Kong int i; 475b1be4280SAmos Kong 476b1be4280SAmos Kong info = g_malloc0(sizeof(*info)); 477b1be4280SAmos Kong info->name = g_strdup(nc->name); 478b1be4280SAmos Kong info->promiscuous = n->promisc; 479b1be4280SAmos Kong 480b1be4280SAmos Kong if (n->nouni) { 481b1be4280SAmos Kong info->unicast = RX_STATE_NONE; 482b1be4280SAmos Kong } else if (n->alluni) { 483b1be4280SAmos Kong info->unicast = RX_STATE_ALL; 484b1be4280SAmos Kong } else { 485b1be4280SAmos Kong info->unicast = RX_STATE_NORMAL; 486b1be4280SAmos Kong } 487b1be4280SAmos Kong 488b1be4280SAmos Kong if (n->nomulti) { 489b1be4280SAmos Kong info->multicast = RX_STATE_NONE; 490b1be4280SAmos Kong } else if (n->allmulti) { 491b1be4280SAmos Kong info->multicast = RX_STATE_ALL; 492b1be4280SAmos Kong } else { 493b1be4280SAmos Kong info->multicast = RX_STATE_NORMAL; 494b1be4280SAmos Kong } 495b1be4280SAmos Kong 496b1be4280SAmos Kong info->broadcast_allowed = n->nobcast; 497b1be4280SAmos Kong info->multicast_overflow = n->mac_table.multi_overflow; 498b1be4280SAmos Kong info->unicast_overflow = n->mac_table.uni_overflow; 499b1be4280SAmos Kong 500b0575ba4SScott Feldman info->main_mac = qemu_mac_strdup_printf(n->mac); 501b1be4280SAmos Kong 502b1be4280SAmos Kong str_list = NULL; 503b1be4280SAmos Kong for (i = 0; i < n->mac_table.first_multi; i++) { 50454aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 50554aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 506b1be4280SAmos Kong } 507b1be4280SAmos Kong info->unicast_table = str_list; 
508b1be4280SAmos Kong 509b1be4280SAmos Kong str_list = NULL; 510b1be4280SAmos Kong for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 51154aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 51254aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 513b1be4280SAmos Kong } 514b1be4280SAmos Kong info->multicast_table = str_list; 515f7bc8ef8SAmos Kong info->vlan_table = get_vlan_table(n); 516b1be4280SAmos Kong 51795129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) { 518f7bc8ef8SAmos Kong info->vlan = RX_STATE_ALL; 519f7bc8ef8SAmos Kong } else if (!info->vlan_table) { 520f7bc8ef8SAmos Kong info->vlan = RX_STATE_NONE; 521f7bc8ef8SAmos Kong } else { 522f7bc8ef8SAmos Kong info->vlan = RX_STATE_NORMAL; 523b1be4280SAmos Kong } 524b1be4280SAmos Kong 525b1be4280SAmos Kong /* enable event notification after query */ 526b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 527b1be4280SAmos Kong 528b1be4280SAmos Kong return info; 529b1be4280SAmos Kong } 530b1be4280SAmos Kong 5316e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev) 5326e790746SPaolo Bonzini { 53317a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 53494b52958SGreg Kurz int i; 5356e790746SPaolo Bonzini 5366e790746SPaolo Bonzini /* Reset back to compatibility mode */ 5376e790746SPaolo Bonzini n->promisc = 1; 5386e790746SPaolo Bonzini n->allmulti = 0; 5396e790746SPaolo Bonzini n->alluni = 0; 5406e790746SPaolo Bonzini n->nomulti = 0; 5416e790746SPaolo Bonzini n->nouni = 0; 5426e790746SPaolo Bonzini n->nobcast = 0; 5436e790746SPaolo Bonzini /* multiqueue is disabled by default */ 544441537f1SJason Wang n->curr_queue_pairs = 1; 5459d8c6a25SDr. David Alan Gilbert timer_del(n->announce_timer.tm); 5469d8c6a25SDr. 
David Alan Gilbert n->announce_timer.round = 0; 547f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 5486e790746SPaolo Bonzini 5496e790746SPaolo Bonzini /* Flush any MAC and VLAN filter table state */ 5506e790746SPaolo Bonzini n->mac_table.in_use = 0; 5516e790746SPaolo Bonzini n->mac_table.first_multi = 0; 5526e790746SPaolo Bonzini n->mac_table.multi_overflow = 0; 5536e790746SPaolo Bonzini n->mac_table.uni_overflow = 0; 5546e790746SPaolo Bonzini memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN); 5556e790746SPaolo Bonzini memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac)); 556702d66a8SMichael S. Tsirkin qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 5576e790746SPaolo Bonzini memset(n->vlans, 0, MAX_VLAN >> 3); 55894b52958SGreg Kurz 55994b52958SGreg Kurz /* Flush any async TX */ 560441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 56194b52958SGreg Kurz NetClientState *nc = qemu_get_subqueue(n->nic, i); 56294b52958SGreg Kurz 56394b52958SGreg Kurz if (nc->peer) { 56494b52958SGreg Kurz qemu_flush_or_purge_queued_packets(nc->peer, true); 56594b52958SGreg Kurz assert(!virtio_net_get_subqueue(nc)->async_tx.elem); 56694b52958SGreg Kurz } 56794b52958SGreg Kurz } 5686e790746SPaolo Bonzini } 5696e790746SPaolo Bonzini 5706e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n) 5716e790746SPaolo Bonzini { 5726e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 5736e790746SPaolo Bonzini if (!nc->peer) { 5746e790746SPaolo Bonzini return; 5756e790746SPaolo Bonzini } 5766e790746SPaolo Bonzini 577d6085e3aSStefan Hajnoczi n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer); 5786e790746SPaolo Bonzini } 5796e790746SPaolo Bonzini 5806e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n) 5816e790746SPaolo Bonzini { 5826e790746SPaolo Bonzini return n->has_vnet_hdr; 5836e790746SPaolo Bonzini } 5846e790746SPaolo Bonzini 5856e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n) 5866e790746SPaolo Bonzini { 
5876e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) 5886e790746SPaolo Bonzini return 0; 5896e790746SPaolo Bonzini 590d6085e3aSStefan Hajnoczi n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer); 5916e790746SPaolo Bonzini 5926e790746SPaolo Bonzini return n->has_ufo; 5936e790746SPaolo Bonzini } 5946e790746SPaolo Bonzini 595bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs, 596e22f0603SYuri Benditovich int version_1, int hash_report) 5976e790746SPaolo Bonzini { 5986e790746SPaolo Bonzini int i; 5996e790746SPaolo Bonzini NetClientState *nc; 6006e790746SPaolo Bonzini 6016e790746SPaolo Bonzini n->mergeable_rx_bufs = mergeable_rx_bufs; 6026e790746SPaolo Bonzini 603bb9d17f8SCornelia Huck if (version_1) { 604e22f0603SYuri Benditovich n->guest_hdr_len = hash_report ? 605e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_v1_hash) : 606e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_mrg_rxbuf); 607e22f0603SYuri Benditovich n->rss_data.populate_hash = !!hash_report; 608bb9d17f8SCornelia Huck } else { 6096e790746SPaolo Bonzini n->guest_hdr_len = n->mergeable_rx_bufs ? 610bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr_mrg_rxbuf) : 611bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr); 612bb9d17f8SCornelia Huck } 6136e790746SPaolo Bonzini 614441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 6156e790746SPaolo Bonzini nc = qemu_get_subqueue(n->nic, i); 6166e790746SPaolo Bonzini 6176e790746SPaolo Bonzini if (peer_has_vnet_hdr(n) && 618d6085e3aSStefan Hajnoczi qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) { 619d6085e3aSStefan Hajnoczi qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len); 6206e790746SPaolo Bonzini n->host_hdr_len = n->guest_hdr_len; 6216e790746SPaolo Bonzini } 6226e790746SPaolo Bonzini } 6236e790746SPaolo Bonzini } 6246e790746SPaolo Bonzini 6252eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n) 6262eef278bSMichael S. Tsirkin { 6272eef278bSMichael S. 
Tsirkin NetClientState *peer = n->nic_conf.peers.ncs[0]; 6282eef278bSMichael S. Tsirkin 6292eef278bSMichael S. Tsirkin /* 6302eef278bSMichael S. Tsirkin * Backends other than vhost-user don't support max queue size. 6312eef278bSMichael S. Tsirkin */ 6322eef278bSMichael S. Tsirkin if (!peer) { 6332eef278bSMichael S. Tsirkin return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 6342eef278bSMichael S. Tsirkin } 6352eef278bSMichael S. Tsirkin 6362eef278bSMichael S. Tsirkin if (peer->info->type != NET_CLIENT_DRIVER_VHOST_USER) { 6372eef278bSMichael S. Tsirkin return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 6382eef278bSMichael S. Tsirkin } 6392eef278bSMichael S. Tsirkin 6402eef278bSMichael S. Tsirkin return VIRTQUEUE_MAX_SIZE; 6412eef278bSMichael S. Tsirkin } 6422eef278bSMichael S. Tsirkin 6436e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index) 6446e790746SPaolo Bonzini { 6456e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 6466e790746SPaolo Bonzini 6476e790746SPaolo Bonzini if (!nc->peer) { 6486e790746SPaolo Bonzini return 0; 6496e790746SPaolo Bonzini } 6506e790746SPaolo Bonzini 651f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 6527263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 1); 6537263a0adSChangchun Ouyang } 6547263a0adSChangchun Ouyang 655f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 6566e790746SPaolo Bonzini return 0; 6576e790746SPaolo Bonzini } 6586e790746SPaolo Bonzini 659441537f1SJason Wang if (n->max_queue_pairs == 1) { 6601074b879SJason Wang return 0; 6611074b879SJason Wang } 6621074b879SJason Wang 6636e790746SPaolo Bonzini return tap_enable(nc->peer); 6646e790746SPaolo Bonzini } 6656e790746SPaolo Bonzini 6666e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index) 6676e790746SPaolo Bonzini { 6686e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 6696e790746SPaolo Bonzini 6706e790746SPaolo Bonzini if (!nc->peer) { 
6716e790746SPaolo Bonzini return 0; 6726e790746SPaolo Bonzini } 6736e790746SPaolo Bonzini 674f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 6757263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 0); 6767263a0adSChangchun Ouyang } 6777263a0adSChangchun Ouyang 678f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 6796e790746SPaolo Bonzini return 0; 6806e790746SPaolo Bonzini } 6816e790746SPaolo Bonzini 6826e790746SPaolo Bonzini return tap_disable(nc->peer); 6836e790746SPaolo Bonzini } 6846e790746SPaolo Bonzini 685441537f1SJason Wang static void virtio_net_set_queue_pairs(VirtIONet *n) 6866e790746SPaolo Bonzini { 6876e790746SPaolo Bonzini int i; 688ddfa83eaSJoel Stanley int r; 6896e790746SPaolo Bonzini 69068b5f314SYuri Benditovich if (n->nic->peer_deleted) { 69168b5f314SYuri Benditovich return; 69268b5f314SYuri Benditovich } 69368b5f314SYuri Benditovich 694441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 695441537f1SJason Wang if (i < n->curr_queue_pairs) { 696ddfa83eaSJoel Stanley r = peer_attach(n, i); 697ddfa83eaSJoel Stanley assert(!r); 6986e790746SPaolo Bonzini } else { 699ddfa83eaSJoel Stanley r = peer_detach(n, i); 700ddfa83eaSJoel Stanley assert(!r); 7016e790746SPaolo Bonzini } 7026e790746SPaolo Bonzini } 7036e790746SPaolo Bonzini } 7046e790746SPaolo Bonzini 705ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue); 7066e790746SPaolo Bonzini 7079d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features, 7089d5b731dSJason Wang Error **errp) 7096e790746SPaolo Bonzini { 71017a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 7116e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 7126e790746SPaolo Bonzini 713da3e8a23SShannon Zhao /* Firstly sync all virtio-net possible supported features */ 714da3e8a23SShannon Zhao features |= n->host_features; 715da3e8a23SShannon Zhao 7160cd09c3aSCornelia Huck 
virtio_add_feature(&features, VIRTIO_NET_F_MAC); 7176e790746SPaolo Bonzini 7186e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) { 7190cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_CSUM); 7200cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4); 7210cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6); 7220cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN); 7236e790746SPaolo Bonzini 7240cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM); 7250cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4); 7260cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6); 7270cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN); 728e22f0603SYuri Benditovich 729e22f0603SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT); 7306e790746SPaolo Bonzini } 7316e790746SPaolo Bonzini 7326e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) { 7330cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO); 7340cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO); 7356e790746SPaolo Bonzini } 7366e790746SPaolo Bonzini 737ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 7386e790746SPaolo Bonzini return features; 7396e790746SPaolo Bonzini } 7402974e916SYuri Benditovich 7410145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 74259079029SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_RSS); 7430145c393SAndrew Melnychenko } 74475ebec11SMaxime Coquelin features = vhost_net_get_features(get_vhost_net(nc->peer), features); 74575ebec11SMaxime Coquelin vdev->backend_features = features; 74675ebec11SMaxime Coquelin 74775ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 74875ebec11SMaxime Coquelin (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) { 74975ebec11SMaxime Coquelin features |= (1ULL << 
VIRTIO_NET_F_MTU); 75075ebec11SMaxime Coquelin } 75175ebec11SMaxime Coquelin 75275ebec11SMaxime Coquelin return features; 7536e790746SPaolo Bonzini } 7546e790746SPaolo Bonzini 755019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev) 7566e790746SPaolo Bonzini { 757019a3edbSGerd Hoffmann uint64_t features = 0; 7586e790746SPaolo Bonzini 7596e790746SPaolo Bonzini /* Linux kernel 2.6.25. It understood MAC (as everyone must), 7606e790746SPaolo Bonzini * but also these: */ 7610cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 7620cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_CSUM); 7630cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4); 7640cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6); 7650cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN); 7666e790746SPaolo Bonzini 7676e790746SPaolo Bonzini return features; 7686e790746SPaolo Bonzini } 7696e790746SPaolo Bonzini 770644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n) 771644c9858SDmitry Fleytman { 772ad37bb3bSStefan Hajnoczi qemu_set_offload(qemu_get_queue(n->nic)->peer, 773644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)), 774644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)), 775644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)), 776644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)), 777644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO))); 778644c9858SDmitry Fleytman } 779644c9858SDmitry Fleytman 780644c9858SDmitry Fleytman static uint64_t virtio_net_guest_offloads_by_features(uint32_t features) 781644c9858SDmitry Fleytman { 782644c9858SDmitry Fleytman static const uint64_t guest_offloads_mask = 783644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_CSUM) | 
784644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO4) | 785644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO6) | 786644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_ECN) | 787644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_UFO); 788644c9858SDmitry Fleytman 789644c9858SDmitry Fleytman return guest_offloads_mask & features; 790644c9858SDmitry Fleytman } 791644c9858SDmitry Fleytman 792644c9858SDmitry Fleytman static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n) 793644c9858SDmitry Fleytman { 794644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 795644c9858SDmitry Fleytman return virtio_net_guest_offloads_by_features(vdev->guest_features); 796644c9858SDmitry Fleytman } 797644c9858SDmitry Fleytman 798f5e1847bSJuan Quintela typedef struct { 799f5e1847bSJuan Quintela VirtIONet *n; 80012b2fad7SKevin Wolf DeviceState *dev; 80112b2fad7SKevin Wolf } FailoverDevice; 802f5e1847bSJuan Quintela 803f5e1847bSJuan Quintela /** 80412b2fad7SKevin Wolf * Set the failover primary device 805f5e1847bSJuan Quintela * 806f5e1847bSJuan Quintela * @dev: device being examined 807f5e1847bSJuan Quintela * @opaque: FailoverDevice whose dev field is set when @dev matches 808f5e1847bSJuan Quintela * Returns 1 if @dev is a PCI device whose failover_pair_id equals the netclient_name of the virtio-net device, 0 otherwise 809f5e1847bSJuan Quintela */ 81012b2fad7SKevin Wolf static int failover_set_primary(DeviceState *dev, void *opaque) 811f5e1847bSJuan Quintela { 81212b2fad7SKevin Wolf FailoverDevice *fdev = opaque; 81312b2fad7SKevin Wolf PCIDevice *pci_dev = (PCIDevice *) 81412b2fad7SKevin Wolf object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE); 815f5e1847bSJuan Quintela 81612b2fad7SKevin Wolf if (!pci_dev) { 81712b2fad7SKevin Wolf return 0; 81812b2fad7SKevin Wolf } 81912b2fad7SKevin Wolf 82012b2fad7SKevin Wolf if (!g_strcmp0(pci_dev->failover_pair_id, fdev->n->netclient_name)) { 82112b2fad7SKevin Wolf fdev->dev = dev; 822f5e1847bSJuan Quintela return 1; 823f5e1847bSJuan Quintela } 824f5e1847bSJuan Quintela 825f5e1847bSJuan Quintela return 0; 
826f5e1847bSJuan Quintela } 827f5e1847bSJuan Quintela 828f5e1847bSJuan Quintela /** 82985d3b931SJuan Quintela * Find the primary device for this failover virtio-net 83085d3b931SJuan Quintela * 83185d3b931SJuan Quintela * @n: VirtIONet device 83285d3b931SJuan Quintela * Returns the matching primary device, or NULL if none was found 83385d3b931SJuan Quintela */ 8340a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n) 8359711cd0dSJens Freimann { 83612b2fad7SKevin Wolf FailoverDevice fdev = { 83712b2fad7SKevin Wolf .n = n, 83812b2fad7SKevin Wolf }; 8399711cd0dSJens Freimann 84012b2fad7SKevin Wolf qbus_walk_children(sysbus_get_default(), failover_set_primary, NULL, 84112b2fad7SKevin Wolf NULL, NULL, &fdev); 84212b2fad7SKevin Wolf return fdev.dev; 8439711cd0dSJens Freimann } 8449711cd0dSJens Freimann 84521e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp) 84621e8709bSJuan Quintela { 84721e8709bSJuan Quintela Error *err = NULL; 84821e8709bSJuan Quintela DeviceState *dev = failover_find_primary_device(n); 84921e8709bSJuan Quintela 85021e8709bSJuan Quintela if (dev) { 85121e8709bSJuan Quintela return; 85221e8709bSJuan Quintela } 85321e8709bSJuan Quintela 854259a10dbSKevin Wolf if (!n->primary_opts) { 85597ca9c59SLaurent Vivier error_setg(errp, "Primary device not found"); 85697ca9c59SLaurent Vivier error_append_hint(errp, "Virtio-net failover will not work. 
Make " 85797ca9c59SLaurent Vivier "sure primary device has parameter" 85897ca9c59SLaurent Vivier " failover_pair_id=%s\n", n->netclient_name); 85921e8709bSJuan Quintela return; 86021e8709bSJuan Quintela } 861259a10dbSKevin Wolf 862f3558b1bSKevin Wolf dev = qdev_device_add_from_qdict(n->primary_opts, 863f3558b1bSKevin Wolf n->primary_opts_from_json, 864f3558b1bSKevin Wolf &err); 86521e8709bSJuan Quintela if (err) { 866f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 867259a10dbSKevin Wolf n->primary_opts = NULL; 86800e7b129SLaurent Vivier } else { 86900e7b129SLaurent Vivier object_unref(OBJECT(dev)); 87021e8709bSJuan Quintela } 87121e8709bSJuan Quintela error_propagate(errp, err); 87221e8709bSJuan Quintela } 87321e8709bSJuan Quintela 874d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features) 8756e790746SPaolo Bonzini { 87617a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 8779711cd0dSJens Freimann Error *err = NULL; 8786e790746SPaolo Bonzini int i; 8796e790746SPaolo Bonzini 88075ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 88175ebec11SMaxime Coquelin !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) { 88275ebec11SMaxime Coquelin features &= ~(1ULL << VIRTIO_NET_F_MTU); 88375ebec11SMaxime Coquelin } 88475ebec11SMaxime Coquelin 885ef546f12SCornelia Huck virtio_net_set_multiqueue(n, 88659079029SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_RSS) || 88795129d6fSCornelia Huck virtio_has_feature(features, VIRTIO_NET_F_MQ)); 8886e790746SPaolo Bonzini 889ef546f12SCornelia Huck virtio_net_set_mrg_rx_bufs(n, 89095129d6fSCornelia Huck virtio_has_feature(features, 891bb9d17f8SCornelia Huck VIRTIO_NET_F_MRG_RXBUF), 89295129d6fSCornelia Huck virtio_has_feature(features, 893e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 894e22f0603SYuri Benditovich virtio_has_feature(features, 895e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 8966e790746SPaolo Bonzini 8972974e916SYuri Benditovich 
n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 8982974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4); 8992974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 9002974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6); 901e22f0603SYuri Benditovich n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS); 9022974e916SYuri Benditovich 9036e790746SPaolo Bonzini if (n->has_vnet_hdr) { 904644c9858SDmitry Fleytman n->curr_guest_offloads = 905644c9858SDmitry Fleytman virtio_net_guest_offloads_by_features(features); 906644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 9076e790746SPaolo Bonzini } 9086e790746SPaolo Bonzini 909441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 9106e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, i); 9116e790746SPaolo Bonzini 912ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 9136e790746SPaolo Bonzini continue; 9146e790746SPaolo Bonzini } 915ed8b4afeSNikolay Nikolaev vhost_net_ack_features(get_vhost_net(nc->peer), features); 9166e790746SPaolo Bonzini } 9170b1eaa88SStefan Fritsch 91895129d6fSCornelia Huck if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) { 9190b1eaa88SStefan Fritsch memset(n->vlans, 0, MAX_VLAN >> 3); 9200b1eaa88SStefan Fritsch } else { 9210b1eaa88SStefan Fritsch memset(n->vlans, 0xff, MAX_VLAN >> 3); 9220b1eaa88SStefan Fritsch } 9239711cd0dSJens Freimann 9249711cd0dSJens Freimann if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) { 9259711cd0dSJens Freimann qapi_event_send_failover_negotiated(n->netclient_name); 926e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 9279711cd0dSJens Freimann failover_add_primary(n, &err); 9289711cd0dSJens Freimann if (err) { 9299711cd0dSJens Freimann warn_report_err(err); 9309711cd0dSJens Freimann } 9316e790746SPaolo Bonzini } 93221e8709bSJuan Quintela } 9336e790746SPaolo 
Bonzini 9346e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd, 9356e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 9366e790746SPaolo Bonzini { 9376e790746SPaolo Bonzini uint8_t on; 9386e790746SPaolo Bonzini size_t s; 939b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 9406e790746SPaolo Bonzini 9416e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on)); 9426e790746SPaolo Bonzini if (s != sizeof(on)) { 9436e790746SPaolo Bonzini return VIRTIO_NET_ERR; 9446e790746SPaolo Bonzini } 9456e790746SPaolo Bonzini 9466e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) { 9476e790746SPaolo Bonzini n->promisc = on; 9486e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) { 9496e790746SPaolo Bonzini n->allmulti = on; 9506e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) { 9516e790746SPaolo Bonzini n->alluni = on; 9526e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) { 9536e790746SPaolo Bonzini n->nomulti = on; 9546e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) { 9556e790746SPaolo Bonzini n->nouni = on; 9566e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) { 9576e790746SPaolo Bonzini n->nobcast = on; 9586e790746SPaolo Bonzini } else { 9596e790746SPaolo Bonzini return VIRTIO_NET_ERR; 9606e790746SPaolo Bonzini } 9616e790746SPaolo Bonzini 962b1be4280SAmos Kong rxfilter_notify(nc); 963b1be4280SAmos Kong 9646e790746SPaolo Bonzini return VIRTIO_NET_OK; 9656e790746SPaolo Bonzini } 9666e790746SPaolo Bonzini 967644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd, 968644c9858SDmitry Fleytman struct iovec *iov, unsigned int iov_cnt) 969644c9858SDmitry Fleytman { 970644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 971644c9858SDmitry Fleytman uint64_t offloads; 972644c9858SDmitry Fleytman size_t s; 973644c9858SDmitry Fleytman 97495129d6fSCornelia Huck if 
(!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 975644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 976644c9858SDmitry Fleytman } 977644c9858SDmitry Fleytman 978644c9858SDmitry Fleytman s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads)); 979644c9858SDmitry Fleytman if (s != sizeof(offloads)) { 980644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 981644c9858SDmitry Fleytman } 982644c9858SDmitry Fleytman 983644c9858SDmitry Fleytman if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) { 984644c9858SDmitry Fleytman uint64_t supported_offloads; 985644c9858SDmitry Fleytman 986189ae6bbSJason Wang offloads = virtio_ldq_p(vdev, &offloads); 987189ae6bbSJason Wang 988644c9858SDmitry Fleytman if (!n->has_vnet_hdr) { 989644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 990644c9858SDmitry Fleytman } 991644c9858SDmitry Fleytman 9922974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 9932974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4); 9942974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 9952974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6); 9962974e916SYuri Benditovich virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT); 9972974e916SYuri Benditovich 998644c9858SDmitry Fleytman supported_offloads = virtio_net_supported_guest_offloads(n); 999644c9858SDmitry Fleytman if (offloads & ~supported_offloads) { 1000644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1001644c9858SDmitry Fleytman } 1002644c9858SDmitry Fleytman 1003644c9858SDmitry Fleytman n->curr_guest_offloads = offloads; 1004644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 1005644c9858SDmitry Fleytman 1006644c9858SDmitry Fleytman return VIRTIO_NET_OK; 1007644c9858SDmitry Fleytman } else { 1008644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1009644c9858SDmitry Fleytman } 1010644c9858SDmitry Fleytman } 1011644c9858SDmitry Fleytman 
10126e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd, 10136e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 10146e790746SPaolo Bonzini { 10151399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 10166e790746SPaolo Bonzini struct virtio_net_ctrl_mac mac_data; 10176e790746SPaolo Bonzini size_t s; 1018b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 10196e790746SPaolo Bonzini 10206e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) { 10216e790746SPaolo Bonzini if (iov_size(iov, iov_cnt) != sizeof(n->mac)) { 10226e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10236e790746SPaolo Bonzini } 10246e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac)); 10256e790746SPaolo Bonzini assert(s == sizeof(n->mac)); 10266e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 1027b1be4280SAmos Kong rxfilter_notify(nc); 1028b1be4280SAmos Kong 10296e790746SPaolo Bonzini return VIRTIO_NET_OK; 10306e790746SPaolo Bonzini } 10316e790746SPaolo Bonzini 10326e790746SPaolo Bonzini if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) { 10336e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10346e790746SPaolo Bonzini } 10356e790746SPaolo Bonzini 1036cae2e556SAmos Kong int in_use = 0; 1037cae2e556SAmos Kong int first_multi = 0; 1038cae2e556SAmos Kong uint8_t uni_overflow = 0; 1039cae2e556SAmos Kong uint8_t multi_overflow = 0; 1040cae2e556SAmos Kong uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 10416e790746SPaolo Bonzini 10426e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 10436e790746SPaolo Bonzini sizeof(mac_data.entries)); 10441399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 10456e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1046b1be4280SAmos Kong goto error; 10476e790746SPaolo Bonzini } 10486e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 10496e790746SPaolo Bonzini 10506e790746SPaolo Bonzini 
if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) { 1051b1be4280SAmos Kong goto error; 10526e790746SPaolo Bonzini } 10536e790746SPaolo Bonzini 10546e790746SPaolo Bonzini if (mac_data.entries <= MAC_TABLE_ENTRIES) { 1055cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, macs, 10566e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 10576e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1058b1be4280SAmos Kong goto error; 10596e790746SPaolo Bonzini } 1060cae2e556SAmos Kong in_use += mac_data.entries; 10616e790746SPaolo Bonzini } else { 1062cae2e556SAmos Kong uni_overflow = 1; 10636e790746SPaolo Bonzini } 10646e790746SPaolo Bonzini 10656e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN); 10666e790746SPaolo Bonzini 1067cae2e556SAmos Kong first_multi = in_use; 10686e790746SPaolo Bonzini 10696e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 10706e790746SPaolo Bonzini sizeof(mac_data.entries)); 10711399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 10726e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1073b1be4280SAmos Kong goto error; 10746e790746SPaolo Bonzini } 10756e790746SPaolo Bonzini 10766e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 10776e790746SPaolo Bonzini 10786e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) { 1079b1be4280SAmos Kong goto error; 10806e790746SPaolo Bonzini } 10816e790746SPaolo Bonzini 1082edc24385SMichael S. 
Tsirkin if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) { 1083cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN], 10846e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 10856e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1086b1be4280SAmos Kong goto error; 10876e790746SPaolo Bonzini } 1088cae2e556SAmos Kong in_use += mac_data.entries; 10896e790746SPaolo Bonzini } else { 1090cae2e556SAmos Kong multi_overflow = 1; 10916e790746SPaolo Bonzini } 10926e790746SPaolo Bonzini 1093cae2e556SAmos Kong n->mac_table.in_use = in_use; 1094cae2e556SAmos Kong n->mac_table.first_multi = first_multi; 1095cae2e556SAmos Kong n->mac_table.uni_overflow = uni_overflow; 1096cae2e556SAmos Kong n->mac_table.multi_overflow = multi_overflow; 1097cae2e556SAmos Kong memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN); 1098cae2e556SAmos Kong g_free(macs); 1099b1be4280SAmos Kong rxfilter_notify(nc); 1100b1be4280SAmos Kong 11016e790746SPaolo Bonzini return VIRTIO_NET_OK; 1102b1be4280SAmos Kong 1103b1be4280SAmos Kong error: 1104cae2e556SAmos Kong g_free(macs); 1105b1be4280SAmos Kong return VIRTIO_NET_ERR; 11066e790746SPaolo Bonzini } 11076e790746SPaolo Bonzini 11086e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd, 11096e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 11106e790746SPaolo Bonzini { 11111399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 11126e790746SPaolo Bonzini uint16_t vid; 11136e790746SPaolo Bonzini size_t s; 1114b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 11156e790746SPaolo Bonzini 11166e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid)); 11171399c60dSRusty Russell vid = virtio_lduw_p(vdev, &vid); 11186e790746SPaolo Bonzini if (s != sizeof(vid)) { 11196e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11206e790746SPaolo Bonzini } 11216e790746SPaolo Bonzini 11226e790746SPaolo Bonzini if (vid >= MAX_VLAN) 11236e790746SPaolo Bonzini 
return VIRTIO_NET_ERR; 11246e790746SPaolo Bonzini 11256e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_VLAN_ADD) 11266e790746SPaolo Bonzini n->vlans[vid >> 5] |= (1U << (vid & 0x1f)); 11276e790746SPaolo Bonzini else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL) 11286e790746SPaolo Bonzini n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f)); 11296e790746SPaolo Bonzini else 11306e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11316e790746SPaolo Bonzini 1132b1be4280SAmos Kong rxfilter_notify(nc); 1133b1be4280SAmos Kong 11346e790746SPaolo Bonzini return VIRTIO_NET_OK; 11356e790746SPaolo Bonzini } 11366e790746SPaolo Bonzini 1137f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd, 1138f57fcf70SJason Wang struct iovec *iov, unsigned int iov_cnt) 1139f57fcf70SJason Wang { 11409d8c6a25SDr. David Alan Gilbert trace_virtio_net_handle_announce(n->announce_timer.round); 1141f57fcf70SJason Wang if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK && 1142f57fcf70SJason Wang n->status & VIRTIO_NET_S_ANNOUNCE) { 1143f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 11449d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 11459d8c6a25SDr. 
David Alan Gilbert qemu_announce_timer_step(&n->announce_timer); 1146f57fcf70SJason Wang } 1147f57fcf70SJason Wang return VIRTIO_NET_OK; 1148f57fcf70SJason Wang } else { 1149f57fcf70SJason Wang return VIRTIO_NET_ERR; 1150f57fcf70SJason Wang } 1151f57fcf70SJason Wang } 1152f57fcf70SJason Wang 11530145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n); 11540145c393SAndrew Melnychenko 115559079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n) 115659079029SYuri Benditovich { 115759079029SYuri Benditovich if (n->rss_data.enabled) { 115859079029SYuri Benditovich trace_virtio_net_rss_disable(); 115959079029SYuri Benditovich } 116059079029SYuri Benditovich n->rss_data.enabled = false; 11610145c393SAndrew Melnychenko 11620145c393SAndrew Melnychenko virtio_net_detach_epbf_rss(n); 11630145c393SAndrew Melnychenko } 11640145c393SAndrew Melnychenko 11650145c393SAndrew Melnychenko static bool virtio_net_attach_ebpf_to_backend(NICState *nic, int prog_fd) 11660145c393SAndrew Melnychenko { 11670145c393SAndrew Melnychenko NetClientState *nc = qemu_get_peer(qemu_get_queue(nic), 0); 11680145c393SAndrew Melnychenko if (nc == NULL || nc->info->set_steering_ebpf == NULL) { 11690145c393SAndrew Melnychenko return false; 11700145c393SAndrew Melnychenko } 11710145c393SAndrew Melnychenko 11720145c393SAndrew Melnychenko return nc->info->set_steering_ebpf(nc, prog_fd); 11730145c393SAndrew Melnychenko } 11740145c393SAndrew Melnychenko 11750145c393SAndrew Melnychenko static void rss_data_to_rss_config(struct VirtioNetRssData *data, 11760145c393SAndrew Melnychenko struct EBPFRSSConfig *config) 11770145c393SAndrew Melnychenko { 11780145c393SAndrew Melnychenko config->redirect = data->redirect; 11790145c393SAndrew Melnychenko config->populate_hash = data->populate_hash; 11800145c393SAndrew Melnychenko config->hash_types = data->hash_types; 11810145c393SAndrew Melnychenko config->indirections_len = data->indirections_len; 11820145c393SAndrew Melnychenko 
config->default_queue = data->default_queue; 11830145c393SAndrew Melnychenko } 11840145c393SAndrew Melnychenko 11850145c393SAndrew Melnychenko static bool virtio_net_attach_epbf_rss(VirtIONet *n) 11860145c393SAndrew Melnychenko { 11870145c393SAndrew Melnychenko struct EBPFRSSConfig config = {}; 11880145c393SAndrew Melnychenko 11890145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 11900145c393SAndrew Melnychenko return false; 11910145c393SAndrew Melnychenko } 11920145c393SAndrew Melnychenko 11930145c393SAndrew Melnychenko rss_data_to_rss_config(&n->rss_data, &config); 11940145c393SAndrew Melnychenko 11950145c393SAndrew Melnychenko if (!ebpf_rss_set_all(&n->ebpf_rss, &config, 11960145c393SAndrew Melnychenko n->rss_data.indirections_table, n->rss_data.key)) { 11970145c393SAndrew Melnychenko return false; 11980145c393SAndrew Melnychenko } 11990145c393SAndrew Melnychenko 12000145c393SAndrew Melnychenko if (!virtio_net_attach_ebpf_to_backend(n->nic, n->ebpf_rss.program_fd)) { 12010145c393SAndrew Melnychenko return false; 12020145c393SAndrew Melnychenko } 12030145c393SAndrew Melnychenko 12040145c393SAndrew Melnychenko return true; 12050145c393SAndrew Melnychenko } 12060145c393SAndrew Melnychenko 12070145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n) 12080145c393SAndrew Melnychenko { 12090145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 12100145c393SAndrew Melnychenko } 12110145c393SAndrew Melnychenko 12120145c393SAndrew Melnychenko static bool virtio_net_load_ebpf(VirtIONet *n) 12130145c393SAndrew Melnychenko { 12140145c393SAndrew Melnychenko if (!virtio_net_attach_ebpf_to_backend(n->nic, -1)) { 12150145c393SAndrew Melnychenko /* backend does't support steering ebpf */ 12160145c393SAndrew Melnychenko return false; 12170145c393SAndrew Melnychenko } 12180145c393SAndrew Melnychenko 12190145c393SAndrew Melnychenko return ebpf_rss_load(&n->ebpf_rss); 12200145c393SAndrew Melnychenko } 12210145c393SAndrew 
Melnychenko 12220145c393SAndrew Melnychenko static void virtio_net_unload_ebpf(VirtIONet *n) 12230145c393SAndrew Melnychenko { 12240145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 12250145c393SAndrew Melnychenko ebpf_rss_unload(&n->ebpf_rss); 122659079029SYuri Benditovich } 122759079029SYuri Benditovich 122859079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n, 1229e22f0603SYuri Benditovich struct iovec *iov, 1230e22f0603SYuri Benditovich unsigned int iov_cnt, 1231e22f0603SYuri Benditovich bool do_rss) 123259079029SYuri Benditovich { 123359079029SYuri Benditovich VirtIODevice *vdev = VIRTIO_DEVICE(n); 123459079029SYuri Benditovich struct virtio_net_rss_config cfg; 123559079029SYuri Benditovich size_t s, offset = 0, size_get; 1236441537f1SJason Wang uint16_t queue_pairs, i; 123759079029SYuri Benditovich struct { 123859079029SYuri Benditovich uint16_t us; 123959079029SYuri Benditovich uint8_t b; 124059079029SYuri Benditovich } QEMU_PACKED temp; 124159079029SYuri Benditovich const char *err_msg = ""; 124259079029SYuri Benditovich uint32_t err_value = 0; 124359079029SYuri Benditovich 1244e22f0603SYuri Benditovich if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) { 124559079029SYuri Benditovich err_msg = "RSS is not negotiated"; 124659079029SYuri Benditovich goto error; 124759079029SYuri Benditovich } 1248e22f0603SYuri Benditovich if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) { 1249e22f0603SYuri Benditovich err_msg = "Hash report is not negotiated"; 1250e22f0603SYuri Benditovich goto error; 1251e22f0603SYuri Benditovich } 125259079029SYuri Benditovich size_get = offsetof(struct virtio_net_rss_config, indirection_table); 125359079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get); 125459079029SYuri Benditovich if (s != size_get) { 125559079029SYuri Benditovich err_msg = "Short command buffer"; 125659079029SYuri Benditovich err_value = (uint32_t)s; 
125759079029SYuri Benditovich goto error; 125859079029SYuri Benditovich } 125959079029SYuri Benditovich n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types); 126059079029SYuri Benditovich n->rss_data.indirections_len = 126159079029SYuri Benditovich virtio_lduw_p(vdev, &cfg.indirection_table_mask); 126259079029SYuri Benditovich n->rss_data.indirections_len++; 1263e22f0603SYuri Benditovich if (!do_rss) { 1264e22f0603SYuri Benditovich n->rss_data.indirections_len = 1; 1265e22f0603SYuri Benditovich } 126659079029SYuri Benditovich if (!is_power_of_2(n->rss_data.indirections_len)) { 126759079029SYuri Benditovich err_msg = "Invalid size of indirection table"; 126859079029SYuri Benditovich err_value = n->rss_data.indirections_len; 126959079029SYuri Benditovich goto error; 127059079029SYuri Benditovich } 127159079029SYuri Benditovich if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) { 127259079029SYuri Benditovich err_msg = "Too large indirection table"; 127359079029SYuri Benditovich err_value = n->rss_data.indirections_len; 127459079029SYuri Benditovich goto error; 127559079029SYuri Benditovich } 1276e22f0603SYuri Benditovich n->rss_data.default_queue = do_rss ? 
1277e22f0603SYuri Benditovich virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0; 1278441537f1SJason Wang if (n->rss_data.default_queue >= n->max_queue_pairs) { 127959079029SYuri Benditovich err_msg = "Invalid default queue"; 128059079029SYuri Benditovich err_value = n->rss_data.default_queue; 128159079029SYuri Benditovich goto error; 128259079029SYuri Benditovich } 128359079029SYuri Benditovich offset += size_get; 128459079029SYuri Benditovich size_get = sizeof(uint16_t) * n->rss_data.indirections_len; 128559079029SYuri Benditovich g_free(n->rss_data.indirections_table); 128659079029SYuri Benditovich n->rss_data.indirections_table = g_malloc(size_get); 128759079029SYuri Benditovich if (!n->rss_data.indirections_table) { 128859079029SYuri Benditovich err_msg = "Can't allocate indirections table"; 128959079029SYuri Benditovich err_value = n->rss_data.indirections_len; 129059079029SYuri Benditovich goto error; 129159079029SYuri Benditovich } 129259079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, 129359079029SYuri Benditovich n->rss_data.indirections_table, size_get); 129459079029SYuri Benditovich if (s != size_get) { 129559079029SYuri Benditovich err_msg = "Short indirection table buffer"; 129659079029SYuri Benditovich err_value = (uint32_t)s; 129759079029SYuri Benditovich goto error; 129859079029SYuri Benditovich } 129959079029SYuri Benditovich for (i = 0; i < n->rss_data.indirections_len; ++i) { 130059079029SYuri Benditovich uint16_t val = n->rss_data.indirections_table[i]; 130159079029SYuri Benditovich n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val); 130259079029SYuri Benditovich } 130359079029SYuri Benditovich offset += size_get; 130459079029SYuri Benditovich size_get = sizeof(temp); 130559079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get); 130659079029SYuri Benditovich if (s != size_get) { 1307441537f1SJason Wang err_msg = "Can't get queue_pairs"; 130859079029SYuri Benditovich err_value = (uint32_t)s; 
130959079029SYuri Benditovich goto error; 131059079029SYuri Benditovich } 1311441537f1SJason Wang queue_pairs = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queue_pairs; 1312441537f1SJason Wang if (queue_pairs == 0 || queue_pairs > n->max_queue_pairs) { 1313441537f1SJason Wang err_msg = "Invalid number of queue_pairs"; 1314441537f1SJason Wang err_value = queue_pairs; 131559079029SYuri Benditovich goto error; 131659079029SYuri Benditovich } 131759079029SYuri Benditovich if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) { 131859079029SYuri Benditovich err_msg = "Invalid key size"; 131959079029SYuri Benditovich err_value = temp.b; 132059079029SYuri Benditovich goto error; 132159079029SYuri Benditovich } 132259079029SYuri Benditovich if (!temp.b && n->rss_data.hash_types) { 132359079029SYuri Benditovich err_msg = "No key provided"; 132459079029SYuri Benditovich err_value = 0; 132559079029SYuri Benditovich goto error; 132659079029SYuri Benditovich } 132759079029SYuri Benditovich if (!temp.b && !n->rss_data.hash_types) { 132859079029SYuri Benditovich virtio_net_disable_rss(n); 1329441537f1SJason Wang return queue_pairs; 133059079029SYuri Benditovich } 133159079029SYuri Benditovich offset += size_get; 133259079029SYuri Benditovich size_get = temp.b; 133359079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get); 133459079029SYuri Benditovich if (s != size_get) { 133559079029SYuri Benditovich err_msg = "Can get key buffer"; 133659079029SYuri Benditovich err_value = (uint32_t)s; 133759079029SYuri Benditovich goto error; 133859079029SYuri Benditovich } 133959079029SYuri Benditovich n->rss_data.enabled = true; 13400145c393SAndrew Melnychenko 13410145c393SAndrew Melnychenko if (!n->rss_data.populate_hash) { 13420145c393SAndrew Melnychenko if (!virtio_net_attach_epbf_rss(n)) { 13430145c393SAndrew Melnychenko /* EBPF must be loaded for vhost */ 13440145c393SAndrew Melnychenko if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 13450145c393SAndrew 
Melnychenko warn_report("Can't load eBPF RSS for vhost"); 13460145c393SAndrew Melnychenko goto error; 13470145c393SAndrew Melnychenko } 13480145c393SAndrew Melnychenko /* fallback to software RSS */ 13490145c393SAndrew Melnychenko warn_report("Can't load eBPF RSS - fallback to software RSS"); 13500145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 13510145c393SAndrew Melnychenko } 13520145c393SAndrew Melnychenko } else { 13530145c393SAndrew Melnychenko /* use software RSS for hash populating */ 13540145c393SAndrew Melnychenko /* and detach eBPF if was loaded before */ 13550145c393SAndrew Melnychenko virtio_net_detach_epbf_rss(n); 13560145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 13570145c393SAndrew Melnychenko } 13580145c393SAndrew Melnychenko 135959079029SYuri Benditovich trace_virtio_net_rss_enable(n->rss_data.hash_types, 136059079029SYuri Benditovich n->rss_data.indirections_len, 136159079029SYuri Benditovich temp.b); 1362441537f1SJason Wang return queue_pairs; 136359079029SYuri Benditovich error: 136459079029SYuri Benditovich trace_virtio_net_rss_error(err_msg, err_value); 136559079029SYuri Benditovich virtio_net_disable_rss(n); 136659079029SYuri Benditovich return 0; 136759079029SYuri Benditovich } 136859079029SYuri Benditovich 13696e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd, 13706e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 13716e790746SPaolo Bonzini { 137217a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1373441537f1SJason Wang uint16_t queue_pairs; 13746e790746SPaolo Bonzini 137559079029SYuri Benditovich virtio_net_disable_rss(n); 1376e22f0603SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) { 1377441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, false); 1378441537f1SJason Wang return queue_pairs ? 
VIRTIO_NET_OK : VIRTIO_NET_ERR; 1379e22f0603SYuri Benditovich } 138059079029SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) { 1381441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, true); 138259079029SYuri Benditovich } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) { 138359079029SYuri Benditovich struct virtio_net_ctrl_mq mq; 138459079029SYuri Benditovich size_t s; 138559079029SYuri Benditovich if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) { 138659079029SYuri Benditovich return VIRTIO_NET_ERR; 138759079029SYuri Benditovich } 13886e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq)); 13896e790746SPaolo Bonzini if (s != sizeof(mq)) { 13906e790746SPaolo Bonzini return VIRTIO_NET_ERR; 13916e790746SPaolo Bonzini } 1392441537f1SJason Wang queue_pairs = virtio_lduw_p(vdev, &mq.virtqueue_pairs); 13936e790746SPaolo Bonzini 139459079029SYuri Benditovich } else { 13956e790746SPaolo Bonzini return VIRTIO_NET_ERR; 13966e790746SPaolo Bonzini } 13976e790746SPaolo Bonzini 1398441537f1SJason Wang if (queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN || 1399441537f1SJason Wang queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX || 1400441537f1SJason Wang queue_pairs > n->max_queue_pairs || 14016e790746SPaolo Bonzini !n->multiqueue) { 14026e790746SPaolo Bonzini return VIRTIO_NET_ERR; 14036e790746SPaolo Bonzini } 14046e790746SPaolo Bonzini 1405441537f1SJason Wang n->curr_queue_pairs = queue_pairs; 1406441537f1SJason Wang /* stop the backend before changing the number of queue_pairs to avoid handling a 14076e790746SPaolo Bonzini * disabled queue */ 140817a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 1409441537f1SJason Wang virtio_net_set_queue_pairs(n); 14106e790746SPaolo Bonzini 14116e790746SPaolo Bonzini return VIRTIO_NET_OK; 14126e790746SPaolo Bonzini } 1413ba7eadb5SGreg Kurz 14146e790746SPaolo Bonzini static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq) 14156e790746SPaolo Bonzini { 
141617a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 14176e790746SPaolo Bonzini struct virtio_net_ctrl_hdr ctrl; 14186e790746SPaolo Bonzini virtio_net_ctrl_ack status = VIRTIO_NET_ERR; 141951b19ebeSPaolo Bonzini VirtQueueElement *elem; 14206e790746SPaolo Bonzini size_t s; 1421771b6ed3SJason Wang struct iovec *iov, *iov2; 14226e790746SPaolo Bonzini unsigned int iov_cnt; 14236e790746SPaolo Bonzini 142451b19ebeSPaolo Bonzini for (;;) { 142551b19ebeSPaolo Bonzini elem = virtqueue_pop(vq, sizeof(VirtQueueElement)); 142651b19ebeSPaolo Bonzini if (!elem) { 142751b19ebeSPaolo Bonzini break; 142851b19ebeSPaolo Bonzini } 142951b19ebeSPaolo Bonzini if (iov_size(elem->in_sg, elem->in_num) < sizeof(status) || 143051b19ebeSPaolo Bonzini iov_size(elem->out_sg, elem->out_num) < sizeof(ctrl)) { 1431ba7eadb5SGreg Kurz virtio_error(vdev, "virtio-net ctrl missing headers"); 1432ba7eadb5SGreg Kurz virtqueue_detach_element(vq, elem, 0); 1433ba7eadb5SGreg Kurz g_free(elem); 1434ba7eadb5SGreg Kurz break; 14356e790746SPaolo Bonzini } 14366e790746SPaolo Bonzini 143751b19ebeSPaolo Bonzini iov_cnt = elem->out_num; 143851b19ebeSPaolo Bonzini iov2 = iov = g_memdup(elem->out_sg, sizeof(struct iovec) * elem->out_num); 14396e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl)); 14406e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, sizeof(ctrl)); 14416e790746SPaolo Bonzini if (s != sizeof(ctrl)) { 14426e790746SPaolo Bonzini status = VIRTIO_NET_ERR; 14436e790746SPaolo Bonzini } else if (ctrl.class == VIRTIO_NET_CTRL_RX) { 14446e790746SPaolo Bonzini status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt); 14456e790746SPaolo Bonzini } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) { 14466e790746SPaolo Bonzini status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt); 14476e790746SPaolo Bonzini } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) { 14486e790746SPaolo Bonzini status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt); 1449f57fcf70SJason Wang } 
else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) { 1450f57fcf70SJason Wang status = virtio_net_handle_announce(n, ctrl.cmd, iov, iov_cnt); 14516e790746SPaolo Bonzini } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) { 14526e790746SPaolo Bonzini status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt); 1453644c9858SDmitry Fleytman } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) { 1454644c9858SDmitry Fleytman status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt); 14556e790746SPaolo Bonzini } 14566e790746SPaolo Bonzini 145751b19ebeSPaolo Bonzini s = iov_from_buf(elem->in_sg, elem->in_num, 0, &status, sizeof(status)); 14586e790746SPaolo Bonzini assert(s == sizeof(status)); 14596e790746SPaolo Bonzini 146051b19ebeSPaolo Bonzini virtqueue_push(vq, elem, sizeof(status)); 14616e790746SPaolo Bonzini virtio_notify(vdev, vq); 1462771b6ed3SJason Wang g_free(iov2); 146351b19ebeSPaolo Bonzini g_free(elem); 14646e790746SPaolo Bonzini } 14656e790746SPaolo Bonzini } 14666e790746SPaolo Bonzini 14676e790746SPaolo Bonzini /* RX */ 14686e790746SPaolo Bonzini 14696e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq) 14706e790746SPaolo Bonzini { 147117a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 14726e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(vq)); 14736e790746SPaolo Bonzini 14746e790746SPaolo Bonzini qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index)); 14756e790746SPaolo Bonzini } 14766e790746SPaolo Bonzini 1477b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc) 14786e790746SPaolo Bonzini { 14796e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 148017a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 14816e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 14826e790746SPaolo Bonzini 148317a0ca55SKONRAD Frederic if (!vdev->vm_running) { 1484b8c4b67eSPhilippe Mathieu-Daudé return false; 14856e790746SPaolo Bonzini } 
14866e790746SPaolo Bonzini 1487441537f1SJason Wang if (nc->queue_index >= n->curr_queue_pairs) { 1488b8c4b67eSPhilippe Mathieu-Daudé return false; 14896e790746SPaolo Bonzini } 14906e790746SPaolo Bonzini 14916e790746SPaolo Bonzini if (!virtio_queue_ready(q->rx_vq) || 149217a0ca55SKONRAD Frederic !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 1493b8c4b67eSPhilippe Mathieu-Daudé return false; 14946e790746SPaolo Bonzini } 14956e790746SPaolo Bonzini 1496b8c4b67eSPhilippe Mathieu-Daudé return true; 14976e790746SPaolo Bonzini } 14986e790746SPaolo Bonzini 14996e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize) 15006e790746SPaolo Bonzini { 15016e790746SPaolo Bonzini VirtIONet *n = q->n; 15026e790746SPaolo Bonzini if (virtio_queue_empty(q->rx_vq) || 15036e790746SPaolo Bonzini (n->mergeable_rx_bufs && 15046e790746SPaolo Bonzini !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) { 15056e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 1); 15066e790746SPaolo Bonzini 15076e790746SPaolo Bonzini /* To avoid a race condition where the guest has made some buffers 15086e790746SPaolo Bonzini * available after the above check but before notification was 15096e790746SPaolo Bonzini * enabled, check for available buffers again. 
15106e790746SPaolo Bonzini */ 15116e790746SPaolo Bonzini if (virtio_queue_empty(q->rx_vq) || 15126e790746SPaolo Bonzini (n->mergeable_rx_bufs && 15136e790746SPaolo Bonzini !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) { 15146e790746SPaolo Bonzini return 0; 15156e790746SPaolo Bonzini } 15166e790746SPaolo Bonzini } 15176e790746SPaolo Bonzini 15186e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 0); 15196e790746SPaolo Bonzini return 1; 15206e790746SPaolo Bonzini } 15216e790746SPaolo Bonzini 15221399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr) 1523032a74a1SCédric Le Goater { 15241399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->hdr_len); 15251399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->gso_size); 15261399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_start); 15271399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_offset); 1528032a74a1SCédric Le Goater } 1529032a74a1SCédric Le Goater 15306e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so 15316e790746SPaolo Bonzini * it never finds out that the packets don't have valid checksums. This 15326e790746SPaolo Bonzini * causes dhclient to get upset. Fedora's carried a patch for ages to 15336e790746SPaolo Bonzini * fix this with Xen but it hasn't appeared in an upstream release of 15346e790746SPaolo Bonzini * dhclient yet. 15356e790746SPaolo Bonzini * 15366e790746SPaolo Bonzini * To avoid breaking existing guests, we catch udp packets and add 15376e790746SPaolo Bonzini * checksums. This is terrible but it's better than hacking the guest 15386e790746SPaolo Bonzini * kernels. 15396e790746SPaolo Bonzini * 15406e790746SPaolo Bonzini * N.B. if we introduce a zero-copy API, this operation is no longer free so 15416e790746SPaolo Bonzini * we should provide a mechanism to disable it to avoid polluting the host 15426e790746SPaolo Bonzini * cache. 
15436e790746SPaolo Bonzini */ 15446e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr, 15456e790746SPaolo Bonzini uint8_t *buf, size_t size) 15466e790746SPaolo Bonzini { 15476e790746SPaolo Bonzini if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */ 15486e790746SPaolo Bonzini (size > 27 && size < 1500) && /* normal sized MTU */ 15496e790746SPaolo Bonzini (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */ 15506e790746SPaolo Bonzini (buf[23] == 17) && /* ip.protocol == UDP */ 15516e790746SPaolo Bonzini (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */ 1552f5746335SBin Meng net_checksum_calculate(buf, size, CSUM_UDP); 15536e790746SPaolo Bonzini hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM; 15546e790746SPaolo Bonzini } 15556e790746SPaolo Bonzini } 15566e790746SPaolo Bonzini 15576e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt, 15586e790746SPaolo Bonzini const void *buf, size_t size) 15596e790746SPaolo Bonzini { 15606e790746SPaolo Bonzini if (n->has_vnet_hdr) { 15616e790746SPaolo Bonzini /* FIXME this cast is evil */ 15626e790746SPaolo Bonzini void *wbuf = (void *)buf; 15636e790746SPaolo Bonzini work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len, 15646e790746SPaolo Bonzini size - n->host_hdr_len); 15651bfa316cSGreg Kurz 15661bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 15671399c60dSRusty Russell virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf); 15681bfa316cSGreg Kurz } 15696e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr)); 15706e790746SPaolo Bonzini } else { 15716e790746SPaolo Bonzini struct virtio_net_hdr hdr = { 15726e790746SPaolo Bonzini .flags = 0, 15736e790746SPaolo Bonzini .gso_type = VIRTIO_NET_HDR_GSO_NONE 15746e790746SPaolo Bonzini }; 15756e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr); 15766e790746SPaolo Bonzini } 15776e790746SPaolo Bonzini } 15786e790746SPaolo 
Bonzini 15796e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size) 15806e790746SPaolo Bonzini { 15816e790746SPaolo Bonzini static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff}; 15826e790746SPaolo Bonzini static const uint8_t vlan[] = {0x81, 0x00}; 15836e790746SPaolo Bonzini uint8_t *ptr = (uint8_t *)buf; 15846e790746SPaolo Bonzini int i; 15856e790746SPaolo Bonzini 15866e790746SPaolo Bonzini if (n->promisc) 15876e790746SPaolo Bonzini return 1; 15886e790746SPaolo Bonzini 15896e790746SPaolo Bonzini ptr += n->host_hdr_len; 15906e790746SPaolo Bonzini 15916e790746SPaolo Bonzini if (!memcmp(&ptr[12], vlan, sizeof(vlan))) { 15927542d3e7SPeter Maydell int vid = lduw_be_p(ptr + 14) & 0xfff; 15936e790746SPaolo Bonzini if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f)))) 15946e790746SPaolo Bonzini return 0; 15956e790746SPaolo Bonzini } 15966e790746SPaolo Bonzini 15976e790746SPaolo Bonzini if (ptr[0] & 1) { // multicast 15986e790746SPaolo Bonzini if (!memcmp(ptr, bcast, sizeof(bcast))) { 15996e790746SPaolo Bonzini return !n->nobcast; 16006e790746SPaolo Bonzini } else if (n->nomulti) { 16016e790746SPaolo Bonzini return 0; 16026e790746SPaolo Bonzini } else if (n->allmulti || n->mac_table.multi_overflow) { 16036e790746SPaolo Bonzini return 1; 16046e790746SPaolo Bonzini } 16056e790746SPaolo Bonzini 16066e790746SPaolo Bonzini for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 16076e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 16086e790746SPaolo Bonzini return 1; 16096e790746SPaolo Bonzini } 16106e790746SPaolo Bonzini } 16116e790746SPaolo Bonzini } else { // unicast 16126e790746SPaolo Bonzini if (n->nouni) { 16136e790746SPaolo Bonzini return 0; 16146e790746SPaolo Bonzini } else if (n->alluni || n->mac_table.uni_overflow) { 16156e790746SPaolo Bonzini return 1; 16166e790746SPaolo Bonzini } else if (!memcmp(ptr, n->mac, ETH_ALEN)) { 16176e790746SPaolo Bonzini return 1; 
16186e790746SPaolo Bonzini } 16196e790746SPaolo Bonzini 16206e790746SPaolo Bonzini for (i = 0; i < n->mac_table.first_multi; i++) { 16216e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 16226e790746SPaolo Bonzini return 1; 16236e790746SPaolo Bonzini } 16246e790746SPaolo Bonzini } 16256e790746SPaolo Bonzini } 16266e790746SPaolo Bonzini 16276e790746SPaolo Bonzini return 0; 16286e790746SPaolo Bonzini } 16296e790746SPaolo Bonzini 16304474e37aSYuri Benditovich static uint8_t virtio_net_get_hash_type(bool isip4, 16314474e37aSYuri Benditovich bool isip6, 16324474e37aSYuri Benditovich bool isudp, 16334474e37aSYuri Benditovich bool istcp, 16344474e37aSYuri Benditovich uint32_t types) 16354474e37aSYuri Benditovich { 16364474e37aSYuri Benditovich if (isip4) { 16374474e37aSYuri Benditovich if (istcp && (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4)) { 16384474e37aSYuri Benditovich return NetPktRssIpV4Tcp; 16394474e37aSYuri Benditovich } 16404474e37aSYuri Benditovich if (isudp && (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4)) { 16414474e37aSYuri Benditovich return NetPktRssIpV4Udp; 16424474e37aSYuri Benditovich } 16434474e37aSYuri Benditovich if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) { 16444474e37aSYuri Benditovich return NetPktRssIpV4; 16454474e37aSYuri Benditovich } 16464474e37aSYuri Benditovich } else if (isip6) { 16474474e37aSYuri Benditovich uint32_t mask = VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | 16484474e37aSYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv6; 16494474e37aSYuri Benditovich 16504474e37aSYuri Benditovich if (istcp && (types & mask)) { 16514474e37aSYuri Benditovich return (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) ? 
16524474e37aSYuri Benditovich NetPktRssIpV6TcpEx : NetPktRssIpV6Tcp; 16534474e37aSYuri Benditovich } 16544474e37aSYuri Benditovich mask = VIRTIO_NET_RSS_HASH_TYPE_UDP_EX | VIRTIO_NET_RSS_HASH_TYPE_UDPv6; 16554474e37aSYuri Benditovich if (isudp && (types & mask)) { 16564474e37aSYuri Benditovich return (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) ? 16574474e37aSYuri Benditovich NetPktRssIpV6UdpEx : NetPktRssIpV6Udp; 16584474e37aSYuri Benditovich } 16594474e37aSYuri Benditovich mask = VIRTIO_NET_RSS_HASH_TYPE_IP_EX | VIRTIO_NET_RSS_HASH_TYPE_IPv6; 16604474e37aSYuri Benditovich if (types & mask) { 16614474e37aSYuri Benditovich return (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) ? 16624474e37aSYuri Benditovich NetPktRssIpV6Ex : NetPktRssIpV6; 16634474e37aSYuri Benditovich } 16644474e37aSYuri Benditovich } 16654474e37aSYuri Benditovich return 0xff; 16664474e37aSYuri Benditovich } 16674474e37aSYuri Benditovich 1668e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report, 1669e22f0603SYuri Benditovich uint32_t hash) 1670e22f0603SYuri Benditovich { 1671e22f0603SYuri Benditovich struct virtio_net_hdr_v1_hash *hdr = (void *)buf; 1672e22f0603SYuri Benditovich hdr->hash_value = hash; 1673e22f0603SYuri Benditovich hdr->hash_report = report; 1674e22f0603SYuri Benditovich } 1675e22f0603SYuri Benditovich 16764474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf, 167797cd965cSPaolo Bonzini size_t size) 16786e790746SPaolo Bonzini { 16796e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1680e22f0603SYuri Benditovich unsigned int index = nc->queue_index, new_index = index; 16814474e37aSYuri Benditovich struct NetRxPkt *pkt = n->rx_pkt; 16824474e37aSYuri Benditovich uint8_t net_hash_type; 16834474e37aSYuri Benditovich uint32_t hash; 16844474e37aSYuri Benditovich bool isip4, isip6, isudp, istcp; 1685e22f0603SYuri Benditovich static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = { 1686e22f0603SYuri 
Benditovich VIRTIO_NET_HASH_REPORT_IPv4, 1687e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv4, 1688e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6, 1689e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6, 1690e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6_EX, 1691e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6_EX, 1692e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv4, 1693e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6, 1694e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6_EX 1695e22f0603SYuri Benditovich }; 16964474e37aSYuri Benditovich 16974474e37aSYuri Benditovich net_rx_pkt_set_protocols(pkt, buf + n->host_hdr_len, 16984474e37aSYuri Benditovich size - n->host_hdr_len); 16994474e37aSYuri Benditovich net_rx_pkt_get_protocols(pkt, &isip4, &isip6, &isudp, &istcp); 17004474e37aSYuri Benditovich if (isip4 && (net_rx_pkt_get_ip4_info(pkt)->fragment)) { 17014474e37aSYuri Benditovich istcp = isudp = false; 17024474e37aSYuri Benditovich } 17034474e37aSYuri Benditovich if (isip6 && (net_rx_pkt_get_ip6_info(pkt)->fragment)) { 17044474e37aSYuri Benditovich istcp = isudp = false; 17054474e37aSYuri Benditovich } 17064474e37aSYuri Benditovich net_hash_type = virtio_net_get_hash_type(isip4, isip6, isudp, istcp, 17074474e37aSYuri Benditovich n->rss_data.hash_types); 17084474e37aSYuri Benditovich if (net_hash_type > NetPktRssIpV6UdpEx) { 1709e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1710e22f0603SYuri Benditovich virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0); 1711e22f0603SYuri Benditovich } 1712e22f0603SYuri Benditovich return n->rss_data.redirect ? 
n->rss_data.default_queue : -1; 17134474e37aSYuri Benditovich } 17144474e37aSYuri Benditovich 17154474e37aSYuri Benditovich hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key); 1716e22f0603SYuri Benditovich 1717e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1718e22f0603SYuri Benditovich virtio_set_packet_hash(buf, reports[net_hash_type], hash); 1719e22f0603SYuri Benditovich } 1720e22f0603SYuri Benditovich 1721e22f0603SYuri Benditovich if (n->rss_data.redirect) { 17224474e37aSYuri Benditovich new_index = hash & (n->rss_data.indirections_len - 1); 17234474e37aSYuri Benditovich new_index = n->rss_data.indirections_table[new_index]; 17244474e37aSYuri Benditovich } 1725e22f0603SYuri Benditovich 1726e22f0603SYuri Benditovich return (index == new_index) ? -1 : new_index; 17274474e37aSYuri Benditovich } 17284474e37aSYuri Benditovich 17294474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf, 17304474e37aSYuri Benditovich size_t size, bool no_rss) 17314474e37aSYuri Benditovich { 17324474e37aSYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 17336e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 173417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1735bedd7e93SJason Wang VirtQueueElement *elems[VIRTQUEUE_MAX_SIZE]; 1736bedd7e93SJason Wang size_t lens[VIRTQUEUE_MAX_SIZE]; 17376e790746SPaolo Bonzini struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE]; 17386e790746SPaolo Bonzini struct virtio_net_hdr_mrg_rxbuf mhdr; 17396e790746SPaolo Bonzini unsigned mhdr_cnt = 0; 1740bedd7e93SJason Wang size_t offset, i, guest_offset, j; 1741bedd7e93SJason Wang ssize_t err; 17426e790746SPaolo Bonzini 17436e790746SPaolo Bonzini if (!virtio_net_can_receive(nc)) { 17446e790746SPaolo Bonzini return -1; 17456e790746SPaolo Bonzini } 17466e790746SPaolo Bonzini 17470145c393SAndrew Melnychenko if (!no_rss && n->rss_data.enabled && n->rss_data.enabled_software_rss) { 17484474e37aSYuri 
Benditovich int index = virtio_net_process_rss(nc, buf, size); 17494474e37aSYuri Benditovich if (index >= 0) { 17504474e37aSYuri Benditovich NetClientState *nc2 = qemu_get_subqueue(n->nic, index); 17514474e37aSYuri Benditovich return virtio_net_receive_rcu(nc2, buf, size, true); 17524474e37aSYuri Benditovich } 17534474e37aSYuri Benditovich } 17544474e37aSYuri Benditovich 17556e790746SPaolo Bonzini /* hdr_len refers to the header we supply to the guest */ 17566e790746SPaolo Bonzini if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) { 17576e790746SPaolo Bonzini return 0; 17586e790746SPaolo Bonzini } 17596e790746SPaolo Bonzini 17606e790746SPaolo Bonzini if (!receive_filter(n, buf, size)) 17616e790746SPaolo Bonzini return size; 17626e790746SPaolo Bonzini 17636e790746SPaolo Bonzini offset = i = 0; 17646e790746SPaolo Bonzini 17656e790746SPaolo Bonzini while (offset < size) { 176651b19ebeSPaolo Bonzini VirtQueueElement *elem; 17676e790746SPaolo Bonzini int len, total; 176851b19ebeSPaolo Bonzini const struct iovec *sg; 17696e790746SPaolo Bonzini 17706e790746SPaolo Bonzini total = 0; 17716e790746SPaolo Bonzini 1772bedd7e93SJason Wang if (i == VIRTQUEUE_MAX_SIZE) { 1773bedd7e93SJason Wang virtio_error(vdev, "virtio-net unexpected long buffer chain"); 1774bedd7e93SJason Wang err = size; 1775bedd7e93SJason Wang goto err; 1776bedd7e93SJason Wang } 1777bedd7e93SJason Wang 177851b19ebeSPaolo Bonzini elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement)); 177951b19ebeSPaolo Bonzini if (!elem) { 1780ba10b9c0SGreg Kurz if (i) { 1781ba10b9c0SGreg Kurz virtio_error(vdev, "virtio-net unexpected empty queue: " 17826e790746SPaolo Bonzini "i %zd mergeable %d offset %zd, size %zd, " 1783019a3edbSGerd Hoffmann "guest hdr len %zd, host hdr len %zd " 1784019a3edbSGerd Hoffmann "guest features 0x%" PRIx64, 17856e790746SPaolo Bonzini i, n->mergeable_rx_bufs, offset, size, 1786019a3edbSGerd Hoffmann n->guest_hdr_len, n->host_hdr_len, 1787019a3edbSGerd Hoffmann 
vdev->guest_features); 1788ba10b9c0SGreg Kurz } 1789bedd7e93SJason Wang err = -1; 1790bedd7e93SJason Wang goto err; 17916e790746SPaolo Bonzini } 17926e790746SPaolo Bonzini 179351b19ebeSPaolo Bonzini if (elem->in_num < 1) { 1794ba10b9c0SGreg Kurz virtio_error(vdev, 1795ba10b9c0SGreg Kurz "virtio-net receive queue contains no in buffers"); 1796ba10b9c0SGreg Kurz virtqueue_detach_element(q->rx_vq, elem, 0); 1797ba10b9c0SGreg Kurz g_free(elem); 1798bedd7e93SJason Wang err = -1; 1799bedd7e93SJason Wang goto err; 18006e790746SPaolo Bonzini } 18016e790746SPaolo Bonzini 180251b19ebeSPaolo Bonzini sg = elem->in_sg; 18036e790746SPaolo Bonzini if (i == 0) { 18046e790746SPaolo Bonzini assert(offset == 0); 18056e790746SPaolo Bonzini if (n->mergeable_rx_bufs) { 18066e790746SPaolo Bonzini mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg), 180751b19ebeSPaolo Bonzini sg, elem->in_num, 18086e790746SPaolo Bonzini offsetof(typeof(mhdr), num_buffers), 18096e790746SPaolo Bonzini sizeof(mhdr.num_buffers)); 18106e790746SPaolo Bonzini } 18116e790746SPaolo Bonzini 181251b19ebeSPaolo Bonzini receive_header(n, sg, elem->in_num, buf, size); 1813e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1814e22f0603SYuri Benditovich offset = sizeof(mhdr); 1815e22f0603SYuri Benditovich iov_from_buf(sg, elem->in_num, offset, 1816e22f0603SYuri Benditovich buf + offset, n->host_hdr_len - sizeof(mhdr)); 1817e22f0603SYuri Benditovich } 18186e790746SPaolo Bonzini offset = n->host_hdr_len; 18196e790746SPaolo Bonzini total += n->guest_hdr_len; 18206e790746SPaolo Bonzini guest_offset = n->guest_hdr_len; 18216e790746SPaolo Bonzini } else { 18226e790746SPaolo Bonzini guest_offset = 0; 18236e790746SPaolo Bonzini } 18246e790746SPaolo Bonzini 18256e790746SPaolo Bonzini /* copy in packet. 
ugh */ 182651b19ebeSPaolo Bonzini len = iov_from_buf(sg, elem->in_num, guest_offset, 18276e790746SPaolo Bonzini buf + offset, size - offset); 18286e790746SPaolo Bonzini total += len; 18296e790746SPaolo Bonzini offset += len; 18306e790746SPaolo Bonzini /* If buffers can't be merged, at this point we 18316e790746SPaolo Bonzini * must have consumed the complete packet. 18326e790746SPaolo Bonzini * Otherwise, drop it. */ 18336e790746SPaolo Bonzini if (!n->mergeable_rx_bufs && offset < size) { 183427e57efeSLadi Prosek virtqueue_unpop(q->rx_vq, elem, total); 183551b19ebeSPaolo Bonzini g_free(elem); 1836bedd7e93SJason Wang err = size; 1837bedd7e93SJason Wang goto err; 18386e790746SPaolo Bonzini } 18396e790746SPaolo Bonzini 1840bedd7e93SJason Wang elems[i] = elem; 1841bedd7e93SJason Wang lens[i] = total; 1842bedd7e93SJason Wang i++; 18436e790746SPaolo Bonzini } 18446e790746SPaolo Bonzini 18456e790746SPaolo Bonzini if (mhdr_cnt) { 18461399c60dSRusty Russell virtio_stw_p(vdev, &mhdr.num_buffers, i); 18476e790746SPaolo Bonzini iov_from_buf(mhdr_sg, mhdr_cnt, 18486e790746SPaolo Bonzini 0, 18496e790746SPaolo Bonzini &mhdr.num_buffers, sizeof mhdr.num_buffers); 18506e790746SPaolo Bonzini } 18516e790746SPaolo Bonzini 1852bedd7e93SJason Wang for (j = 0; j < i; j++) { 1853bedd7e93SJason Wang /* signal other side */ 1854bedd7e93SJason Wang virtqueue_fill(q->rx_vq, elems[j], lens[j], j); 1855bedd7e93SJason Wang g_free(elems[j]); 1856bedd7e93SJason Wang } 1857bedd7e93SJason Wang 18586e790746SPaolo Bonzini virtqueue_flush(q->rx_vq, i); 185917a0ca55SKONRAD Frederic virtio_notify(vdev, q->rx_vq); 18606e790746SPaolo Bonzini 18616e790746SPaolo Bonzini return size; 1862bedd7e93SJason Wang 1863bedd7e93SJason Wang err: 1864bedd7e93SJason Wang for (j = 0; j < i; j++) { 1865bedd7e93SJason Wang g_free(elems[j]); 1866bedd7e93SJason Wang } 1867bedd7e93SJason Wang 1868bedd7e93SJason Wang return err; 18696e790746SPaolo Bonzini } 18706e790746SPaolo Bonzini 18712974e916SYuri Benditovich static ssize_t 
virtio_net_do_receive(NetClientState *nc, const uint8_t *buf, 187297cd965cSPaolo Bonzini size_t size) 187397cd965cSPaolo Bonzini { 1874068ddfa9SDr. David Alan Gilbert RCU_READ_LOCK_GUARD(); 187597cd965cSPaolo Bonzini 18764474e37aSYuri Benditovich return virtio_net_receive_rcu(nc, buf, size, false); 187797cd965cSPaolo Bonzini } 187897cd965cSPaolo Bonzini 18792974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain, 18802974e916SYuri Benditovich const uint8_t *buf, 18812974e916SYuri Benditovich VirtioNetRscUnit *unit) 18822974e916SYuri Benditovich { 18832974e916SYuri Benditovich uint16_t ip_hdrlen; 18842974e916SYuri Benditovich struct ip_header *ip; 18852974e916SYuri Benditovich 18862974e916SYuri Benditovich ip = (struct ip_header *)(buf + chain->n->guest_hdr_len 18872974e916SYuri Benditovich + sizeof(struct eth_header)); 18882974e916SYuri Benditovich unit->ip = (void *)ip; 18892974e916SYuri Benditovich ip_hdrlen = (ip->ip_ver_len & 0xF) << 2; 18902974e916SYuri Benditovich unit->ip_plen = &ip->ip_len; 18912974e916SYuri Benditovich unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen); 18922974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 18932974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen; 18942974e916SYuri Benditovich } 18952974e916SYuri Benditovich 18962974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain, 18972974e916SYuri Benditovich const uint8_t *buf, 18982974e916SYuri Benditovich VirtioNetRscUnit *unit) 18992974e916SYuri Benditovich { 19002974e916SYuri Benditovich struct ip6_header *ip6; 19012974e916SYuri Benditovich 19022974e916SYuri Benditovich ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len 19032974e916SYuri Benditovich + sizeof(struct eth_header)); 19042974e916SYuri Benditovich unit->ip = ip6; 19052974e916SYuri Benditovich unit->ip_plen = 
&(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 190678ee6bd0SPhilippe Mathieu-Daudé unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) 19072974e916SYuri Benditovich + sizeof(struct ip6_header)); 19082974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 19092974e916SYuri Benditovich 19102974e916SYuri Benditovich /* There is a difference between payload lenght in ipv4 and v6, 19112974e916SYuri Benditovich ip header is excluded in ipv6 */ 19122974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen; 19132974e916SYuri Benditovich } 19142974e916SYuri Benditovich 19152974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain, 19162974e916SYuri Benditovich VirtioNetRscSeg *seg) 19172974e916SYuri Benditovich { 19182974e916SYuri Benditovich int ret; 1919dd3d85e8SYuri Benditovich struct virtio_net_hdr_v1 *h; 19202974e916SYuri Benditovich 1921dd3d85e8SYuri Benditovich h = (struct virtio_net_hdr_v1 *)seg->buf; 19222974e916SYuri Benditovich h->flags = 0; 19232974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_NONE; 19242974e916SYuri Benditovich 19252974e916SYuri Benditovich if (seg->is_coalesced) { 1926dd3d85e8SYuri Benditovich h->rsc.segments = seg->packets; 1927dd3d85e8SYuri Benditovich h->rsc.dup_acks = seg->dup_ack; 19282974e916SYuri Benditovich h->flags = VIRTIO_NET_HDR_F_RSC_INFO; 19292974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 19302974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 19312974e916SYuri Benditovich } else { 19322974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 19332974e916SYuri Benditovich } 19342974e916SYuri Benditovich } 19352974e916SYuri Benditovich 19362974e916SYuri Benditovich ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size); 19372974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 19382974e916SYuri Benditovich g_free(seg->buf); 19392974e916SYuri Benditovich g_free(seg); 
19402974e916SYuri Benditovich 19412974e916SYuri Benditovich return ret; 19422974e916SYuri Benditovich } 19432974e916SYuri Benditovich 19442974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq) 19452974e916SYuri Benditovich { 19462974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn; 19472974e916SYuri Benditovich VirtioNetRscChain *chain = (VirtioNetRscChain *)opq; 19482974e916SYuri Benditovich 19492974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) { 19502974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 19512974e916SYuri Benditovich chain->stat.purge_failed++; 19522974e916SYuri Benditovich continue; 19532974e916SYuri Benditovich } 19542974e916SYuri Benditovich } 19552974e916SYuri Benditovich 19562974e916SYuri Benditovich chain->stat.timer++; 19572974e916SYuri Benditovich if (!QTAILQ_EMPTY(&chain->buffers)) { 19582974e916SYuri Benditovich timer_mod(chain->drain_timer, 19592974e916SYuri Benditovich qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout); 19602974e916SYuri Benditovich } 19612974e916SYuri Benditovich } 19622974e916SYuri Benditovich 19632974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n) 19642974e916SYuri Benditovich { 19652974e916SYuri Benditovich VirtioNetRscChain *chain, *rn_chain; 19662974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn_seg; 19672974e916SYuri Benditovich 19682974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) { 19692974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) { 19702974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 19712974e916SYuri Benditovich g_free(seg->buf); 19722974e916SYuri Benditovich g_free(seg); 19732974e916SYuri Benditovich } 19742974e916SYuri Benditovich 19752974e916SYuri Benditovich timer_free(chain->drain_timer); 19762974e916SYuri Benditovich QTAILQ_REMOVE(&n->rsc_chains, chain, next); 19772974e916SYuri Benditovich g_free(chain); 
19782974e916SYuri Benditovich } 19792974e916SYuri Benditovich } 19802974e916SYuri Benditovich 19812974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain, 19822974e916SYuri Benditovich NetClientState *nc, 19832974e916SYuri Benditovich const uint8_t *buf, size_t size) 19842974e916SYuri Benditovich { 19852974e916SYuri Benditovich uint16_t hdr_len; 19862974e916SYuri Benditovich VirtioNetRscSeg *seg; 19872974e916SYuri Benditovich 19882974e916SYuri Benditovich hdr_len = chain->n->guest_hdr_len; 19892974e916SYuri Benditovich seg = g_malloc(sizeof(VirtioNetRscSeg)); 19902974e916SYuri Benditovich seg->buf = g_malloc(hdr_len + sizeof(struct eth_header) 19912974e916SYuri Benditovich + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD); 19922974e916SYuri Benditovich memcpy(seg->buf, buf, size); 19932974e916SYuri Benditovich seg->size = size; 19942974e916SYuri Benditovich seg->packets = 1; 19952974e916SYuri Benditovich seg->dup_ack = 0; 19962974e916SYuri Benditovich seg->is_coalesced = 0; 19972974e916SYuri Benditovich seg->nc = nc; 19982974e916SYuri Benditovich 19992974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&chain->buffers, seg, next); 20002974e916SYuri Benditovich chain->stat.cache++; 20012974e916SYuri Benditovich 20022974e916SYuri Benditovich switch (chain->proto) { 20032974e916SYuri Benditovich case ETH_P_IP: 20042974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit); 20052974e916SYuri Benditovich break; 20062974e916SYuri Benditovich case ETH_P_IPV6: 20072974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit); 20082974e916SYuri Benditovich break; 20092974e916SYuri Benditovich default: 20102974e916SYuri Benditovich g_assert_not_reached(); 20112974e916SYuri Benditovich } 20122974e916SYuri Benditovich } 20132974e916SYuri Benditovich 20142974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain, 20152974e916SYuri Benditovich VirtioNetRscSeg *seg, 
20162974e916SYuri Benditovich const uint8_t *buf, 20172974e916SYuri Benditovich struct tcp_header *n_tcp, 20182974e916SYuri Benditovich struct tcp_header *o_tcp) 20192974e916SYuri Benditovich { 20202974e916SYuri Benditovich uint32_t nack, oack; 20212974e916SYuri Benditovich uint16_t nwin, owin; 20222974e916SYuri Benditovich 20232974e916SYuri Benditovich nack = htonl(n_tcp->th_ack); 20242974e916SYuri Benditovich nwin = htons(n_tcp->th_win); 20252974e916SYuri Benditovich oack = htonl(o_tcp->th_ack); 20262974e916SYuri Benditovich owin = htons(o_tcp->th_win); 20272974e916SYuri Benditovich 20282974e916SYuri Benditovich if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) { 20292974e916SYuri Benditovich chain->stat.ack_out_of_win++; 20302974e916SYuri Benditovich return RSC_FINAL; 20312974e916SYuri Benditovich } else if (nack == oack) { 20322974e916SYuri Benditovich /* duplicated ack or window probe */ 20332974e916SYuri Benditovich if (nwin == owin) { 20342974e916SYuri Benditovich /* duplicated ack, add dup ack count due to whql test up to 1 */ 20352974e916SYuri Benditovich chain->stat.dup_ack++; 20362974e916SYuri Benditovich return RSC_FINAL; 20372974e916SYuri Benditovich } else { 20382974e916SYuri Benditovich /* Coalesce window update */ 20392974e916SYuri Benditovich o_tcp->th_win = n_tcp->th_win; 20402974e916SYuri Benditovich chain->stat.win_update++; 20412974e916SYuri Benditovich return RSC_COALESCE; 20422974e916SYuri Benditovich } 20432974e916SYuri Benditovich } else { 20442974e916SYuri Benditovich /* pure ack, go to 'C', finalize*/ 20452974e916SYuri Benditovich chain->stat.pure_ack++; 20462974e916SYuri Benditovich return RSC_FINAL; 20472974e916SYuri Benditovich } 20482974e916SYuri Benditovich } 20492974e916SYuri Benditovich 20502974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain, 20512974e916SYuri Benditovich VirtioNetRscSeg *seg, 20522974e916SYuri Benditovich const uint8_t *buf, 20532974e916SYuri Benditovich VirtioNetRscUnit 
*n_unit) 20542974e916SYuri Benditovich { 20552974e916SYuri Benditovich void *data; 20562974e916SYuri Benditovich uint16_t o_ip_len; 20572974e916SYuri Benditovich uint32_t nseq, oseq; 20582974e916SYuri Benditovich VirtioNetRscUnit *o_unit; 20592974e916SYuri Benditovich 20602974e916SYuri Benditovich o_unit = &seg->unit; 20612974e916SYuri Benditovich o_ip_len = htons(*o_unit->ip_plen); 20622974e916SYuri Benditovich nseq = htonl(n_unit->tcp->th_seq); 20632974e916SYuri Benditovich oseq = htonl(o_unit->tcp->th_seq); 20642974e916SYuri Benditovich 20652974e916SYuri Benditovich /* out of order or retransmitted. */ 20662974e916SYuri Benditovich if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) { 20672974e916SYuri Benditovich chain->stat.data_out_of_win++; 20682974e916SYuri Benditovich return RSC_FINAL; 20692974e916SYuri Benditovich } 20702974e916SYuri Benditovich 20712974e916SYuri Benditovich data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen; 20722974e916SYuri Benditovich if (nseq == oseq) { 20732974e916SYuri Benditovich if ((o_unit->payload == 0) && n_unit->payload) { 20742974e916SYuri Benditovich /* From no payload to payload, normal case, not a dup ack or etc */ 20752974e916SYuri Benditovich chain->stat.data_after_pure_ack++; 20762974e916SYuri Benditovich goto coalesce; 20772974e916SYuri Benditovich } else { 20782974e916SYuri Benditovich return virtio_net_rsc_handle_ack(chain, seg, buf, 20792974e916SYuri Benditovich n_unit->tcp, o_unit->tcp); 20802974e916SYuri Benditovich } 20812974e916SYuri Benditovich } else if ((nseq - oseq) != o_unit->payload) { 20822974e916SYuri Benditovich /* Not a consistent packet, out of order */ 20832974e916SYuri Benditovich chain->stat.data_out_of_order++; 20842974e916SYuri Benditovich return RSC_FINAL; 20852974e916SYuri Benditovich } else { 20862974e916SYuri Benditovich coalesce: 20872974e916SYuri Benditovich if ((o_ip_len + n_unit->payload) > chain->max_payload) { 20882974e916SYuri Benditovich chain->stat.over_size++; 20892974e916SYuri 
Benditovich return RSC_FINAL; 20902974e916SYuri Benditovich } 20912974e916SYuri Benditovich 20922974e916SYuri Benditovich /* Here comes the right data, the payload length in v4/v6 is different, 20932974e916SYuri Benditovich so use the field value to update and record the new data len */ 20942974e916SYuri Benditovich o_unit->payload += n_unit->payload; /* update new data len */ 20952974e916SYuri Benditovich 20962974e916SYuri Benditovich /* update field in ip header */ 20972974e916SYuri Benditovich *o_unit->ip_plen = htons(o_ip_len + n_unit->payload); 20982974e916SYuri Benditovich 20992974e916SYuri Benditovich /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced 21002974e916SYuri Benditovich for windows guest, while this may change the behavior for linux 21012974e916SYuri Benditovich guest (only if it uses RSC feature). */ 21022974e916SYuri Benditovich o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags; 21032974e916SYuri Benditovich 21042974e916SYuri Benditovich o_unit->tcp->th_ack = n_unit->tcp->th_ack; 21052974e916SYuri Benditovich o_unit->tcp->th_win = n_unit->tcp->th_win; 21062974e916SYuri Benditovich 21072974e916SYuri Benditovich memmove(seg->buf + seg->size, data, n_unit->payload); 21082974e916SYuri Benditovich seg->size += n_unit->payload; 21092974e916SYuri Benditovich seg->packets++; 21102974e916SYuri Benditovich chain->stat.coalesced++; 21112974e916SYuri Benditovich return RSC_COALESCE; 21122974e916SYuri Benditovich } 21132974e916SYuri Benditovich } 21142974e916SYuri Benditovich 21152974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain, 21162974e916SYuri Benditovich VirtioNetRscSeg *seg, 21172974e916SYuri Benditovich const uint8_t *buf, size_t size, 21182974e916SYuri Benditovich VirtioNetRscUnit *unit) 21192974e916SYuri Benditovich { 21202974e916SYuri Benditovich struct ip_header *ip1, *ip2; 21212974e916SYuri Benditovich 21222974e916SYuri Benditovich ip1 = (struct ip_header *)(unit->ip); 
21232974e916SYuri Benditovich ip2 = (struct ip_header *)(seg->unit.ip); 21242974e916SYuri Benditovich if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst) 21252974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 21262974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 21272974e916SYuri Benditovich chain->stat.no_match++; 21282974e916SYuri Benditovich return RSC_NO_MATCH; 21292974e916SYuri Benditovich } 21302974e916SYuri Benditovich 21312974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 21322974e916SYuri Benditovich } 21332974e916SYuri Benditovich 21342974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain, 21352974e916SYuri Benditovich VirtioNetRscSeg *seg, 21362974e916SYuri Benditovich const uint8_t *buf, size_t size, 21372974e916SYuri Benditovich VirtioNetRscUnit *unit) 21382974e916SYuri Benditovich { 21392974e916SYuri Benditovich struct ip6_header *ip1, *ip2; 21402974e916SYuri Benditovich 21412974e916SYuri Benditovich ip1 = (struct ip6_header *)(unit->ip); 21422974e916SYuri Benditovich ip2 = (struct ip6_header *)(seg->unit.ip); 21432974e916SYuri Benditovich if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address)) 21442974e916SYuri Benditovich || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address)) 21452974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 21462974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 21472974e916SYuri Benditovich chain->stat.no_match++; 21482974e916SYuri Benditovich return RSC_NO_MATCH; 21492974e916SYuri Benditovich } 21502974e916SYuri Benditovich 21512974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 21522974e916SYuri Benditovich } 21532974e916SYuri Benditovich 21542974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain 21552974e916SYuri Benditovich * to 
prevent out of order */ 21562974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain, 21572974e916SYuri Benditovich struct tcp_header *tcp) 21582974e916SYuri Benditovich { 21592974e916SYuri Benditovich uint16_t tcp_hdr; 21602974e916SYuri Benditovich uint16_t tcp_flag; 21612974e916SYuri Benditovich 21622974e916SYuri Benditovich tcp_flag = htons(tcp->th_offset_flags); 21632974e916SYuri Benditovich tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10; 21642974e916SYuri Benditovich tcp_flag &= VIRTIO_NET_TCP_FLAG; 21652974e916SYuri Benditovich if (tcp_flag & TH_SYN) { 21662974e916SYuri Benditovich chain->stat.tcp_syn++; 21672974e916SYuri Benditovich return RSC_BYPASS; 21682974e916SYuri Benditovich } 21692974e916SYuri Benditovich 21702974e916SYuri Benditovich if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) { 21712974e916SYuri Benditovich chain->stat.tcp_ctrl_drain++; 21722974e916SYuri Benditovich return RSC_FINAL; 21732974e916SYuri Benditovich } 21742974e916SYuri Benditovich 21752974e916SYuri Benditovich if (tcp_hdr > sizeof(struct tcp_header)) { 21762974e916SYuri Benditovich chain->stat.tcp_all_opt++; 21772974e916SYuri Benditovich return RSC_FINAL; 21782974e916SYuri Benditovich } 21792974e916SYuri Benditovich 21802974e916SYuri Benditovich return RSC_CANDIDATE; 21812974e916SYuri Benditovich } 21822974e916SYuri Benditovich 21832974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain, 21842974e916SYuri Benditovich NetClientState *nc, 21852974e916SYuri Benditovich const uint8_t *buf, size_t size, 21862974e916SYuri Benditovich VirtioNetRscUnit *unit) 21872974e916SYuri Benditovich { 21882974e916SYuri Benditovich int ret; 21892974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 21902974e916SYuri Benditovich 21912974e916SYuri Benditovich if (QTAILQ_EMPTY(&chain->buffers)) { 21922974e916SYuri Benditovich chain->stat.empty_cache++; 21932974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, 
nc, buf, size); 21942974e916SYuri Benditovich timer_mod(chain->drain_timer, 21952974e916SYuri Benditovich qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout); 21962974e916SYuri Benditovich return size; 21972974e916SYuri Benditovich } 21982974e916SYuri Benditovich 21992974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 22002974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 22012974e916SYuri Benditovich ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit); 22022974e916SYuri Benditovich } else { 22032974e916SYuri Benditovich ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit); 22042974e916SYuri Benditovich } 22052974e916SYuri Benditovich 22062974e916SYuri Benditovich if (ret == RSC_FINAL) { 22072974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 22082974e916SYuri Benditovich /* Send failed */ 22092974e916SYuri Benditovich chain->stat.final_failed++; 22102974e916SYuri Benditovich return 0; 22112974e916SYuri Benditovich } 22122974e916SYuri Benditovich 22132974e916SYuri Benditovich /* Send current packet */ 22142974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 22152974e916SYuri Benditovich } else if (ret == RSC_NO_MATCH) { 22162974e916SYuri Benditovich continue; 22172974e916SYuri Benditovich } else { 22182974e916SYuri Benditovich /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */ 22192974e916SYuri Benditovich seg->is_coalesced = 1; 22202974e916SYuri Benditovich return size; 22212974e916SYuri Benditovich } 22222974e916SYuri Benditovich } 22232974e916SYuri Benditovich 22242974e916SYuri Benditovich chain->stat.no_match_cache++; 22252974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 22262974e916SYuri Benditovich return size; 22272974e916SYuri Benditovich } 22282974e916SYuri Benditovich 22292974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */ 22302974e916SYuri Benditovich static size_t 
virtio_net_rsc_drain_flow(VirtioNetRscChain *chain, 22312974e916SYuri Benditovich NetClientState *nc, 22322974e916SYuri Benditovich const uint8_t *buf, size_t size, 22332974e916SYuri Benditovich uint16_t ip_start, uint16_t ip_size, 22342974e916SYuri Benditovich uint16_t tcp_port) 22352974e916SYuri Benditovich { 22362974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 22372974e916SYuri Benditovich uint32_t ppair1, ppair2; 22382974e916SYuri Benditovich 22392974e916SYuri Benditovich ppair1 = *(uint32_t *)(buf + tcp_port); 22402974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 22412974e916SYuri Benditovich ppair2 = *(uint32_t *)(seg->buf + tcp_port); 22422974e916SYuri Benditovich if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size) 22432974e916SYuri Benditovich || (ppair1 != ppair2)) { 22442974e916SYuri Benditovich continue; 22452974e916SYuri Benditovich } 22462974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 22472974e916SYuri Benditovich chain->stat.drain_failed++; 22482974e916SYuri Benditovich } 22492974e916SYuri Benditovich 22502974e916SYuri Benditovich break; 22512974e916SYuri Benditovich } 22522974e916SYuri Benditovich 22532974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 22542974e916SYuri Benditovich } 22552974e916SYuri Benditovich 22562974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain, 22572974e916SYuri Benditovich struct ip_header *ip, 22582974e916SYuri Benditovich const uint8_t *buf, size_t size) 22592974e916SYuri Benditovich { 22602974e916SYuri Benditovich uint16_t ip_len; 22612974e916SYuri Benditovich 22622974e916SYuri Benditovich /* Not an ipv4 packet */ 22632974e916SYuri Benditovich if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) { 22642974e916SYuri Benditovich chain->stat.ip_option++; 22652974e916SYuri Benditovich return RSC_BYPASS; 22662974e916SYuri Benditovich } 22672974e916SYuri Benditovich 22682974e916SYuri 
Benditovich /* Don't handle packets with ip option */ 22692974e916SYuri Benditovich if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) { 22702974e916SYuri Benditovich chain->stat.ip_option++; 22712974e916SYuri Benditovich return RSC_BYPASS; 22722974e916SYuri Benditovich } 22732974e916SYuri Benditovich 22742974e916SYuri Benditovich if (ip->ip_p != IPPROTO_TCP) { 22752974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 22762974e916SYuri Benditovich return RSC_BYPASS; 22772974e916SYuri Benditovich } 22782974e916SYuri Benditovich 22792974e916SYuri Benditovich /* Don't handle packets with ip fragment */ 22802974e916SYuri Benditovich if (!(htons(ip->ip_off) & IP_DF)) { 22812974e916SYuri Benditovich chain->stat.ip_frag++; 22822974e916SYuri Benditovich return RSC_BYPASS; 22832974e916SYuri Benditovich } 22842974e916SYuri Benditovich 22852974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 22862974e916SYuri Benditovich if (IPTOS_ECN(ip->ip_tos)) { 22872974e916SYuri Benditovich chain->stat.ip_ecn++; 22882974e916SYuri Benditovich return RSC_BYPASS; 22892974e916SYuri Benditovich } 22902974e916SYuri Benditovich 22912974e916SYuri Benditovich ip_len = htons(ip->ip_len); 22922974e916SYuri Benditovich if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header)) 22932974e916SYuri Benditovich || ip_len > (size - chain->n->guest_hdr_len - 22942974e916SYuri Benditovich sizeof(struct eth_header))) { 22952974e916SYuri Benditovich chain->stat.ip_hacked++; 22962974e916SYuri Benditovich return RSC_BYPASS; 22972974e916SYuri Benditovich } 22982974e916SYuri Benditovich 22992974e916SYuri Benditovich return RSC_CANDIDATE; 23002974e916SYuri Benditovich } 23012974e916SYuri Benditovich 23022974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain, 23032974e916SYuri Benditovich NetClientState *nc, 23042974e916SYuri Benditovich const uint8_t *buf, size_t size) 23052974e916SYuri Benditovich { 23062974e916SYuri Benditovich int32_t ret; 
23072974e916SYuri Benditovich uint16_t hdr_len; 23082974e916SYuri Benditovich VirtioNetRscUnit unit; 23092974e916SYuri Benditovich 23102974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 23112974e916SYuri Benditovich 23122974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header) 23132974e916SYuri Benditovich + sizeof(struct tcp_header))) { 23142974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 23152974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23162974e916SYuri Benditovich } 23172974e916SYuri Benditovich 23182974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, buf, &unit); 23192974e916SYuri Benditovich if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size) 23202974e916SYuri Benditovich != RSC_CANDIDATE) { 23212974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23222974e916SYuri Benditovich } 23232974e916SYuri Benditovich 23242974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 23252974e916SYuri Benditovich if (ret == RSC_BYPASS) { 23262974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23272974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 23282974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 23292974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 12), 23302974e916SYuri Benditovich VIRTIO_NET_IP4_ADDR_SIZE, 23312974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)); 23322974e916SYuri Benditovich } 23332974e916SYuri Benditovich 23342974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 23352974e916SYuri Benditovich } 23362974e916SYuri Benditovich 23372974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain, 23382974e916SYuri Benditovich struct ip6_header *ip6, 23392974e916SYuri Benditovich const uint8_t *buf, size_t size) 
23402974e916SYuri Benditovich { 23412974e916SYuri Benditovich uint16_t ip_len; 23422974e916SYuri Benditovich 23432974e916SYuri Benditovich if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4) 23442974e916SYuri Benditovich != IP_HEADER_VERSION_6) { 23452974e916SYuri Benditovich return RSC_BYPASS; 23462974e916SYuri Benditovich } 23472974e916SYuri Benditovich 23482974e916SYuri Benditovich /* Both option and protocol is checked in this */ 23492974e916SYuri Benditovich if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) { 23502974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 23512974e916SYuri Benditovich return RSC_BYPASS; 23522974e916SYuri Benditovich } 23532974e916SYuri Benditovich 23542974e916SYuri Benditovich ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 23552974e916SYuri Benditovich if (ip_len < sizeof(struct tcp_header) || 23562974e916SYuri Benditovich ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header) 23572974e916SYuri Benditovich - sizeof(struct ip6_header))) { 23582974e916SYuri Benditovich chain->stat.ip_hacked++; 23592974e916SYuri Benditovich return RSC_BYPASS; 23602974e916SYuri Benditovich } 23612974e916SYuri Benditovich 23622974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 23632974e916SYuri Benditovich if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) { 23642974e916SYuri Benditovich chain->stat.ip_ecn++; 23652974e916SYuri Benditovich return RSC_BYPASS; 23662974e916SYuri Benditovich } 23672974e916SYuri Benditovich 23682974e916SYuri Benditovich return RSC_CANDIDATE; 23692974e916SYuri Benditovich } 23702974e916SYuri Benditovich 23712974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc, 23722974e916SYuri Benditovich const uint8_t *buf, size_t size) 23732974e916SYuri Benditovich { 23742974e916SYuri Benditovich int32_t ret; 23752974e916SYuri Benditovich uint16_t hdr_len; 23762974e916SYuri Benditovich VirtioNetRscChain *chain; 23772974e916SYuri Benditovich VirtioNetRscUnit 
unit; 23782974e916SYuri Benditovich 23792974e916SYuri Benditovich chain = (VirtioNetRscChain *)opq; 23802974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 23812974e916SYuri Benditovich 23822974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header) 23832974e916SYuri Benditovich + sizeof(tcp_header))) { 23842974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23852974e916SYuri Benditovich } 23862974e916SYuri Benditovich 23872974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, buf, &unit); 23882974e916SYuri Benditovich if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain, 23892974e916SYuri Benditovich unit.ip, buf, size)) { 23902974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23912974e916SYuri Benditovich } 23922974e916SYuri Benditovich 23932974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 23942974e916SYuri Benditovich if (ret == RSC_BYPASS) { 23952974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23962974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 23972974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 23982974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 8), 23992974e916SYuri Benditovich VIRTIO_NET_IP6_ADDR_SIZE, 24002974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) 24012974e916SYuri Benditovich + sizeof(struct ip6_header)); 24022974e916SYuri Benditovich } 24032974e916SYuri Benditovich 24042974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 24052974e916SYuri Benditovich } 24062974e916SYuri Benditovich 24072974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n, 24082974e916SYuri Benditovich NetClientState *nc, 24092974e916SYuri Benditovich uint16_t proto) 24102974e916SYuri Benditovich { 24112974e916SYuri Benditovich VirtioNetRscChain *chain; 
24122974e916SYuri Benditovich 24132974e916SYuri Benditovich if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) { 24142974e916SYuri Benditovich return NULL; 24152974e916SYuri Benditovich } 24162974e916SYuri Benditovich 24172974e916SYuri Benditovich QTAILQ_FOREACH(chain, &n->rsc_chains, next) { 24182974e916SYuri Benditovich if (chain->proto == proto) { 24192974e916SYuri Benditovich return chain; 24202974e916SYuri Benditovich } 24212974e916SYuri Benditovich } 24222974e916SYuri Benditovich 24232974e916SYuri Benditovich chain = g_malloc(sizeof(*chain)); 24242974e916SYuri Benditovich chain->n = n; 24252974e916SYuri Benditovich chain->proto = proto; 24262974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP) { 24272974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD; 24282974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 24292974e916SYuri Benditovich } else { 24302974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD; 24312974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 24322974e916SYuri Benditovich } 24332974e916SYuri Benditovich chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST, 24342974e916SYuri Benditovich virtio_net_rsc_purge, chain); 24352974e916SYuri Benditovich memset(&chain->stat, 0, sizeof(chain->stat)); 24362974e916SYuri Benditovich 24372974e916SYuri Benditovich QTAILQ_INIT(&chain->buffers); 24382974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next); 24392974e916SYuri Benditovich 24402974e916SYuri Benditovich return chain; 24412974e916SYuri Benditovich } 24422974e916SYuri Benditovich 24432974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc, 24442974e916SYuri Benditovich const uint8_t *buf, 24452974e916SYuri Benditovich size_t size) 24462974e916SYuri Benditovich { 24472974e916SYuri Benditovich uint16_t proto; 24482974e916SYuri Benditovich VirtioNetRscChain *chain; 24492974e916SYuri Benditovich struct eth_header 
*eth; 24502974e916SYuri Benditovich VirtIONet *n; 24512974e916SYuri Benditovich 24522974e916SYuri Benditovich n = qemu_get_nic_opaque(nc); 24532974e916SYuri Benditovich if (size < (n->host_hdr_len + sizeof(struct eth_header))) { 24542974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24552974e916SYuri Benditovich } 24562974e916SYuri Benditovich 24572974e916SYuri Benditovich eth = (struct eth_header *)(buf + n->guest_hdr_len); 24582974e916SYuri Benditovich proto = htons(eth->h_proto); 24592974e916SYuri Benditovich 24602974e916SYuri Benditovich chain = virtio_net_rsc_lookup_chain(n, nc, proto); 24612974e916SYuri Benditovich if (chain) { 24622974e916SYuri Benditovich chain->stat.received++; 24632974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) { 24642974e916SYuri Benditovich return virtio_net_rsc_receive4(chain, nc, buf, size); 24652974e916SYuri Benditovich } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) { 24662974e916SYuri Benditovich return virtio_net_rsc_receive6(chain, nc, buf, size); 24672974e916SYuri Benditovich } 24682974e916SYuri Benditovich } 24692974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24702974e916SYuri Benditovich } 24712974e916SYuri Benditovich 24722974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, 24732974e916SYuri Benditovich size_t size) 24742974e916SYuri Benditovich { 24752974e916SYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 24762974e916SYuri Benditovich if ((n->rsc4_enabled || n->rsc6_enabled)) { 24772974e916SYuri Benditovich return virtio_net_rsc_receive(nc, buf, size); 24782974e916SYuri Benditovich } else { 24792974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24802974e916SYuri Benditovich } 24812974e916SYuri Benditovich } 24822974e916SYuri Benditovich 24836e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q); 24846e790746SPaolo Bonzini 24856e790746SPaolo 
Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len) 24866e790746SPaolo Bonzini { 24876e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 24886e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 248917a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 24906e790746SPaolo Bonzini 249151b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, q->async_tx.elem, 0); 249217a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 24936e790746SPaolo Bonzini 249451b19ebeSPaolo Bonzini g_free(q->async_tx.elem); 249551b19ebeSPaolo Bonzini q->async_tx.elem = NULL; 24966e790746SPaolo Bonzini 24976e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 24986e790746SPaolo Bonzini virtio_net_flush_tx(q); 24996e790746SPaolo Bonzini } 25006e790746SPaolo Bonzini 25016e790746SPaolo Bonzini /* TX */ 25026e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q) 25036e790746SPaolo Bonzini { 25046e790746SPaolo Bonzini VirtIONet *n = q->n; 250517a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 250651b19ebeSPaolo Bonzini VirtQueueElement *elem; 25076e790746SPaolo Bonzini int32_t num_packets = 0; 25086e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(q->tx_vq)); 250917a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 25106e790746SPaolo Bonzini return num_packets; 25116e790746SPaolo Bonzini } 25126e790746SPaolo Bonzini 251351b19ebeSPaolo Bonzini if (q->async_tx.elem) { 25146e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 25156e790746SPaolo Bonzini return num_packets; 25166e790746SPaolo Bonzini } 25176e790746SPaolo Bonzini 251851b19ebeSPaolo Bonzini for (;;) { 2519bd89dd98SJason Wang ssize_t ret; 252051b19ebeSPaolo Bonzini unsigned int out_num; 252151b19ebeSPaolo Bonzini struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg; 2522feb93f36SJason Wang struct virtio_net_hdr_mrg_rxbuf mhdr; 25236e790746SPaolo Bonzini 
252451b19ebeSPaolo Bonzini elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement)); 252551b19ebeSPaolo Bonzini if (!elem) { 252651b19ebeSPaolo Bonzini break; 252751b19ebeSPaolo Bonzini } 252851b19ebeSPaolo Bonzini 252951b19ebeSPaolo Bonzini out_num = elem->out_num; 253051b19ebeSPaolo Bonzini out_sg = elem->out_sg; 25316e790746SPaolo Bonzini if (out_num < 1) { 2532fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header not in first element"); 2533fa5e56c2SGreg Kurz virtqueue_detach_element(q->tx_vq, elem, 0); 2534fa5e56c2SGreg Kurz g_free(elem); 2535fa5e56c2SGreg Kurz return -EINVAL; 25366e790746SPaolo Bonzini } 25376e790746SPaolo Bonzini 2538032a74a1SCédric Le Goater if (n->has_vnet_hdr) { 2539feb93f36SJason Wang if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) < 2540feb93f36SJason Wang n->guest_hdr_len) { 2541fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header incorrect"); 2542fa5e56c2SGreg Kurz virtqueue_detach_element(q->tx_vq, elem, 0); 2543fa5e56c2SGreg Kurz g_free(elem); 2544fa5e56c2SGreg Kurz return -EINVAL; 2545032a74a1SCédric Le Goater } 25461bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 2547feb93f36SJason Wang virtio_net_hdr_swap(vdev, (void *) &mhdr); 2548feb93f36SJason Wang sg2[0].iov_base = &mhdr; 2549feb93f36SJason Wang sg2[0].iov_len = n->guest_hdr_len; 2550feb93f36SJason Wang out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1, 2551feb93f36SJason Wang out_sg, out_num, 2552feb93f36SJason Wang n->guest_hdr_len, -1); 2553feb93f36SJason Wang if (out_num == VIRTQUEUE_MAX_SIZE) { 2554feb93f36SJason Wang goto drop; 2555032a74a1SCédric Le Goater } 2556feb93f36SJason Wang out_num += 1; 2557feb93f36SJason Wang out_sg = sg2; 2558feb93f36SJason Wang } 2559feb93f36SJason Wang } 25606e790746SPaolo Bonzini /* 25616e790746SPaolo Bonzini * If host wants to see the guest header as is, we can 25626e790746SPaolo Bonzini * pass it on unchanged. Otherwise, copy just the parts 25636e790746SPaolo Bonzini * that host is interested in. 
25646e790746SPaolo Bonzini */ 25656e790746SPaolo Bonzini assert(n->host_hdr_len <= n->guest_hdr_len); 25666e790746SPaolo Bonzini if (n->host_hdr_len != n->guest_hdr_len) { 25676e790746SPaolo Bonzini unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg), 25686e790746SPaolo Bonzini out_sg, out_num, 25696e790746SPaolo Bonzini 0, n->host_hdr_len); 25706e790746SPaolo Bonzini sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num, 25716e790746SPaolo Bonzini out_sg, out_num, 25726e790746SPaolo Bonzini n->guest_hdr_len, -1); 25736e790746SPaolo Bonzini out_num = sg_num; 25746e790746SPaolo Bonzini out_sg = sg; 25756e790746SPaolo Bonzini } 25766e790746SPaolo Bonzini 25776e790746SPaolo Bonzini ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index), 25786e790746SPaolo Bonzini out_sg, out_num, virtio_net_tx_complete); 25796e790746SPaolo Bonzini if (ret == 0) { 25806e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 25816e790746SPaolo Bonzini q->async_tx.elem = elem; 25826e790746SPaolo Bonzini return -EBUSY; 25836e790746SPaolo Bonzini } 25846e790746SPaolo Bonzini 2585feb93f36SJason Wang drop: 258651b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, elem, 0); 258717a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 258851b19ebeSPaolo Bonzini g_free(elem); 25896e790746SPaolo Bonzini 25906e790746SPaolo Bonzini if (++num_packets >= n->tx_burst) { 25916e790746SPaolo Bonzini break; 25926e790746SPaolo Bonzini } 25936e790746SPaolo Bonzini } 25946e790746SPaolo Bonzini return num_packets; 25956e790746SPaolo Bonzini } 25966e790746SPaolo Bonzini 25976e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq) 25986e790746SPaolo Bonzini { 259917a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 26006e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 26016e790746SPaolo Bonzini 2602283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2603283e2c2aSYuri Benditovich 
virtio_net_drop_tx_queue_data(vdev, vq); 2604283e2c2aSYuri Benditovich return; 2605283e2c2aSYuri Benditovich } 2606283e2c2aSYuri Benditovich 26076e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 260817a0ca55SKONRAD Frederic if (!vdev->vm_running) { 26096e790746SPaolo Bonzini q->tx_waiting = 1; 26106e790746SPaolo Bonzini return; 26116e790746SPaolo Bonzini } 26126e790746SPaolo Bonzini 26136e790746SPaolo Bonzini if (q->tx_waiting) { 26146e790746SPaolo Bonzini virtio_queue_set_notification(vq, 1); 2615bc72ad67SAlex Bligh timer_del(q->tx_timer); 26166e790746SPaolo Bonzini q->tx_waiting = 0; 2617fa5e56c2SGreg Kurz if (virtio_net_flush_tx(q) == -EINVAL) { 2618fa5e56c2SGreg Kurz return; 2619fa5e56c2SGreg Kurz } 26206e790746SPaolo Bonzini } else { 2621bc72ad67SAlex Bligh timer_mod(q->tx_timer, 2622bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 26236e790746SPaolo Bonzini q->tx_waiting = 1; 26246e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 26256e790746SPaolo Bonzini } 26266e790746SPaolo Bonzini } 26276e790746SPaolo Bonzini 26286e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq) 26296e790746SPaolo Bonzini { 263017a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 26316e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 26326e790746SPaolo Bonzini 2633283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2634283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2635283e2c2aSYuri Benditovich return; 2636283e2c2aSYuri Benditovich } 2637283e2c2aSYuri Benditovich 26386e790746SPaolo Bonzini if (unlikely(q->tx_waiting)) { 26396e790746SPaolo Bonzini return; 26406e790746SPaolo Bonzini } 26416e790746SPaolo Bonzini q->tx_waiting = 1; 26426e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. 
*/ 264317a0ca55SKONRAD Frederic if (!vdev->vm_running) { 26446e790746SPaolo Bonzini return; 26456e790746SPaolo Bonzini } 26466e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 26476e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 26486e790746SPaolo Bonzini } 26496e790746SPaolo Bonzini 26506e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque) 26516e790746SPaolo Bonzini { 26526e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 26536e790746SPaolo Bonzini VirtIONet *n = q->n; 265417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2655e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2656e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2657e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2658e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2659e8bcf842SMichael S. Tsirkin return; 2660e8bcf842SMichael S. Tsirkin } 26616e790746SPaolo Bonzini 26626e790746SPaolo Bonzini q->tx_waiting = 0; 26636e790746SPaolo Bonzini 26646e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 266517a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 26666e790746SPaolo Bonzini return; 266717a0ca55SKONRAD Frederic } 26686e790746SPaolo Bonzini 26696e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 26706e790746SPaolo Bonzini virtio_net_flush_tx(q); 26716e790746SPaolo Bonzini } 26726e790746SPaolo Bonzini 26736e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque) 26746e790746SPaolo Bonzini { 26756e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 26766e790746SPaolo Bonzini VirtIONet *n = q->n; 267717a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 26786e790746SPaolo Bonzini int32_t ret; 26796e790746SPaolo Bonzini 2680e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2681e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2682e8bcf842SMichael S. 
Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2683e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2684e8bcf842SMichael S. Tsirkin return; 2685e8bcf842SMichael S. Tsirkin } 26866e790746SPaolo Bonzini 26876e790746SPaolo Bonzini q->tx_waiting = 0; 26886e790746SPaolo Bonzini 26896e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 269017a0ca55SKONRAD Frederic if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) { 26916e790746SPaolo Bonzini return; 269217a0ca55SKONRAD Frederic } 26936e790746SPaolo Bonzini 26946e790746SPaolo Bonzini ret = virtio_net_flush_tx(q); 2695fa5e56c2SGreg Kurz if (ret == -EBUSY || ret == -EINVAL) { 2696fa5e56c2SGreg Kurz return; /* Notification re-enable handled by tx_complete or device 2697fa5e56c2SGreg Kurz * broken */ 26986e790746SPaolo Bonzini } 26996e790746SPaolo Bonzini 27006e790746SPaolo Bonzini /* If we flush a full burst of packets, assume there are 27016e790746SPaolo Bonzini * more coming and immediately reschedule */ 27026e790746SPaolo Bonzini if (ret >= n->tx_burst) { 27036e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 27046e790746SPaolo Bonzini q->tx_waiting = 1; 27056e790746SPaolo Bonzini return; 27066e790746SPaolo Bonzini } 27076e790746SPaolo Bonzini 27086e790746SPaolo Bonzini /* If less than a full burst, re-enable notification and flush 27096e790746SPaolo Bonzini * anything that may have come in while we weren't looking. 
If 27106e790746SPaolo Bonzini * we find something, assume the guest is still active and reschedule */ 27116e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 2712fa5e56c2SGreg Kurz ret = virtio_net_flush_tx(q); 2713fa5e56c2SGreg Kurz if (ret == -EINVAL) { 2714fa5e56c2SGreg Kurz return; 2715fa5e56c2SGreg Kurz } else if (ret > 0) { 27166e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 27176e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 27186e790746SPaolo Bonzini q->tx_waiting = 1; 27196e790746SPaolo Bonzini } 27206e790746SPaolo Bonzini } 27216e790746SPaolo Bonzini 2722f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index) 2723f9d6dbf0SWen Congyang { 2724f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2725f9d6dbf0SWen Congyang 27261c0fbfa3SMichael S. Tsirkin n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size, 27271c0fbfa3SMichael S. Tsirkin virtio_net_handle_rx); 27289b02e161SWei Wang 2729f9d6dbf0SWen Congyang if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) { 2730f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 27319b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 27329b02e161SWei Wang virtio_net_handle_tx_timer); 2733f9d6dbf0SWen Congyang n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, 2734f9d6dbf0SWen Congyang virtio_net_tx_timer, 2735f9d6dbf0SWen Congyang &n->vqs[index]); 2736f9d6dbf0SWen Congyang } else { 2737f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 27389b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 27399b02e161SWei Wang virtio_net_handle_tx_bh); 2740f9d6dbf0SWen Congyang n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]); 2741f9d6dbf0SWen Congyang } 2742f9d6dbf0SWen Congyang 2743f9d6dbf0SWen Congyang n->vqs[index].tx_waiting = 0; 2744f9d6dbf0SWen Congyang n->vqs[index].n = n; 2745f9d6dbf0SWen Congyang } 2746f9d6dbf0SWen Congyang 2747f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, 
int index) 2748f9d6dbf0SWen Congyang { 2749f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2750f9d6dbf0SWen Congyang VirtIONetQueue *q = &n->vqs[index]; 2751f9d6dbf0SWen Congyang NetClientState *nc = qemu_get_subqueue(n->nic, index); 2752f9d6dbf0SWen Congyang 2753f9d6dbf0SWen Congyang qemu_purge_queued_packets(nc); 2754f9d6dbf0SWen Congyang 2755f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2); 2756f9d6dbf0SWen Congyang if (q->tx_timer) { 2757f9d6dbf0SWen Congyang timer_free(q->tx_timer); 2758f989c30cSYunjian Wang q->tx_timer = NULL; 2759f9d6dbf0SWen Congyang } else { 2760f9d6dbf0SWen Congyang qemu_bh_delete(q->tx_bh); 2761f989c30cSYunjian Wang q->tx_bh = NULL; 2762f9d6dbf0SWen Congyang } 2763f989c30cSYunjian Wang q->tx_waiting = 0; 2764f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2 + 1); 2765f9d6dbf0SWen Congyang } 2766f9d6dbf0SWen Congyang 2767441537f1SJason Wang static void virtio_net_change_num_queue_pairs(VirtIONet *n, int new_max_queue_pairs) 2768f9d6dbf0SWen Congyang { 2769f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2770f9d6dbf0SWen Congyang int old_num_queues = virtio_get_num_queues(vdev); 2771441537f1SJason Wang int new_num_queues = new_max_queue_pairs * 2 + 1; 2772f9d6dbf0SWen Congyang int i; 2773f9d6dbf0SWen Congyang 2774f9d6dbf0SWen Congyang assert(old_num_queues >= 3); 2775f9d6dbf0SWen Congyang assert(old_num_queues % 2 == 1); 2776f9d6dbf0SWen Congyang 2777f9d6dbf0SWen Congyang if (old_num_queues == new_num_queues) { 2778f9d6dbf0SWen Congyang return; 2779f9d6dbf0SWen Congyang } 2780f9d6dbf0SWen Congyang 2781f9d6dbf0SWen Congyang /* 2782f9d6dbf0SWen Congyang * We always need to remove and add ctrl vq if 2783f9d6dbf0SWen Congyang * old_num_queues != new_num_queues. Remove ctrl_vq first, 278420f86a75SYuval Shaia * and then we only enter one of the following two loops. 
2785f9d6dbf0SWen Congyang */ 2786f9d6dbf0SWen Congyang virtio_del_queue(vdev, old_num_queues - 1); 2787f9d6dbf0SWen Congyang 2788f9d6dbf0SWen Congyang for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) { 2789f9d6dbf0SWen Congyang /* new_num_queues < old_num_queues */ 2790f9d6dbf0SWen Congyang virtio_net_del_queue(n, i / 2); 2791f9d6dbf0SWen Congyang } 2792f9d6dbf0SWen Congyang 2793f9d6dbf0SWen Congyang for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) { 2794f9d6dbf0SWen Congyang /* new_num_queues > old_num_queues */ 2795f9d6dbf0SWen Congyang virtio_net_add_queue(n, i / 2); 2796f9d6dbf0SWen Congyang } 2797f9d6dbf0SWen Congyang 2798f9d6dbf0SWen Congyang /* add ctrl_vq last */ 2799f9d6dbf0SWen Congyang n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 2800f9d6dbf0SWen Congyang } 2801f9d6dbf0SWen Congyang 2802ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue) 28036e790746SPaolo Bonzini { 2804441537f1SJason Wang int max = multiqueue ? n->max_queue_pairs : 1; 2805f9d6dbf0SWen Congyang 28066e790746SPaolo Bonzini n->multiqueue = multiqueue; 2807441537f1SJason Wang virtio_net_change_num_queue_pairs(n, max); 28086e790746SPaolo Bonzini 2809441537f1SJason Wang virtio_net_set_queue_pairs(n); 28106e790746SPaolo Bonzini } 28116e790746SPaolo Bonzini 2812982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id) 2813037dab2fSGreg Kurz { 2814982b78c5SDr. David Alan Gilbert VirtIONet *n = opaque; 2815982b78c5SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 2816037dab2fSGreg Kurz int i, link_down; 2817037dab2fSGreg Kurz 28189d8c6a25SDr. David Alan Gilbert trace_virtio_net_post_load_device(); 2819982b78c5SDr. 
David Alan Gilbert virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs, 282095129d6fSCornelia Huck virtio_vdev_has_feature(vdev, 2821e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 2822e22f0603SYuri Benditovich virtio_vdev_has_feature(vdev, 2823e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 28246e790746SPaolo Bonzini 28256e790746SPaolo Bonzini /* MAC_TABLE_ENTRIES may be different from the saved image */ 2826982b78c5SDr. David Alan Gilbert if (n->mac_table.in_use > MAC_TABLE_ENTRIES) { 28276e790746SPaolo Bonzini n->mac_table.in_use = 0; 28286e790746SPaolo Bonzini } 28296e790746SPaolo Bonzini 2830982b78c5SDr. David Alan Gilbert if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 28316c666823SMichael S. Tsirkin n->curr_guest_offloads = virtio_net_supported_guest_offloads(n); 28326c666823SMichael S. Tsirkin } 28336c666823SMichael S. Tsirkin 28347788c3f2SMikhail Sennikovsky /* 28357788c3f2SMikhail Sennikovsky * curr_guest_offloads will be later overwritten by the 28367788c3f2SMikhail Sennikovsky * virtio_set_features_nocheck call done from the virtio_load. 28377788c3f2SMikhail Sennikovsky * Here we make sure it is preserved and restored accordingly 28387788c3f2SMikhail Sennikovsky * in the virtio_net_post_load_virtio callback. 28397788c3f2SMikhail Sennikovsky */ 28407788c3f2SMikhail Sennikovsky n->saved_guest_offloads = n->curr_guest_offloads; 28416c666823SMichael S. 
Tsirkin 2842441537f1SJason Wang virtio_net_set_queue_pairs(n); 28436e790746SPaolo Bonzini 28446e790746SPaolo Bonzini /* Find the first multicast entry in the saved MAC filter */ 28456e790746SPaolo Bonzini for (i = 0; i < n->mac_table.in_use; i++) { 28466e790746SPaolo Bonzini if (n->mac_table.macs[i * ETH_ALEN] & 1) { 28476e790746SPaolo Bonzini break; 28486e790746SPaolo Bonzini } 28496e790746SPaolo Bonzini } 28506e790746SPaolo Bonzini n->mac_table.first_multi = i; 28516e790746SPaolo Bonzini 28526e790746SPaolo Bonzini /* nc.link_down can't be migrated, so infer link_down according 28536e790746SPaolo Bonzini * to link status bit in n->status */ 28546e790746SPaolo Bonzini link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0; 2855441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 28566e790746SPaolo Bonzini qemu_get_subqueue(n->nic, i)->link_down = link_down; 28576e790746SPaolo Bonzini } 28586e790746SPaolo Bonzini 28596c666823SMichael S. Tsirkin if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 28606c666823SMichael S. Tsirkin virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 28619d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 28629d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 28639d8c6a25SDr. David Alan Gilbert virtio_net_announce_timer, n); 28649d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 28659d8c6a25SDr. David Alan Gilbert timer_mod(n->announce_timer.tm, 28669d8c6a25SDr. David Alan Gilbert qemu_clock_get_ms(n->announce_timer.type)); 28679d8c6a25SDr. David Alan Gilbert } else { 2868944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 28699d8c6a25SDr. David Alan Gilbert } 28706c666823SMichael S. Tsirkin } 28716c666823SMichael S. 
Tsirkin 2872e41b7114SYuri Benditovich if (n->rss_data.enabled) { 28730145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = n->rss_data.populate_hash; 28740145c393SAndrew Melnychenko if (!n->rss_data.populate_hash) { 28750145c393SAndrew Melnychenko if (!virtio_net_attach_epbf_rss(n)) { 28760145c393SAndrew Melnychenko if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 28770145c393SAndrew Melnychenko warn_report("Can't post-load eBPF RSS for vhost"); 28780145c393SAndrew Melnychenko } else { 28790145c393SAndrew Melnychenko warn_report("Can't post-load eBPF RSS - " 28800145c393SAndrew Melnychenko "fallback to software RSS"); 28810145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 28820145c393SAndrew Melnychenko } 28830145c393SAndrew Melnychenko } 28840145c393SAndrew Melnychenko } 28850145c393SAndrew Melnychenko 2886e41b7114SYuri Benditovich trace_virtio_net_rss_enable(n->rss_data.hash_types, 2887e41b7114SYuri Benditovich n->rss_data.indirections_len, 2888e41b7114SYuri Benditovich sizeof(n->rss_data.key)); 2889e41b7114SYuri Benditovich } else { 2890e41b7114SYuri Benditovich trace_virtio_net_rss_disable(); 2891e41b7114SYuri Benditovich } 28926e790746SPaolo Bonzini return 0; 28936e790746SPaolo Bonzini } 28946e790746SPaolo Bonzini 28957788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev) 28967788c3f2SMikhail Sennikovsky { 28977788c3f2SMikhail Sennikovsky VirtIONet *n = VIRTIO_NET(vdev); 28987788c3f2SMikhail Sennikovsky /* 28997788c3f2SMikhail Sennikovsky * The actual needed state is now in saved_guest_offloads, 29007788c3f2SMikhail Sennikovsky * see virtio_net_post_load_device for detail. 29017788c3f2SMikhail Sennikovsky * Restore it back and apply the desired offloads. 
29027788c3f2SMikhail Sennikovsky */ 29037788c3f2SMikhail Sennikovsky n->curr_guest_offloads = n->saved_guest_offloads; 29047788c3f2SMikhail Sennikovsky if (peer_has_vnet_hdr(n)) { 29057788c3f2SMikhail Sennikovsky virtio_net_apply_guest_offloads(n); 29067788c3f2SMikhail Sennikovsky } 29077788c3f2SMikhail Sennikovsky 29087788c3f2SMikhail Sennikovsky return 0; 29097788c3f2SMikhail Sennikovsky } 29107788c3f2SMikhail Sennikovsky 2911982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */ 2912982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = { 2913982b78c5SDr. David Alan Gilbert .name = "virtio-net-queue-tx_waiting", 2914982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 2915982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(tx_waiting, VirtIONetQueue), 2916982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 2917982b78c5SDr. David Alan Gilbert }, 2918982b78c5SDr. David Alan Gilbert }; 2919982b78c5SDr. David Alan Gilbert 2920441537f1SJason Wang static bool max_queue_pairs_gt_1(void *opaque, int version_id) 2921982b78c5SDr. David Alan Gilbert { 2922441537f1SJason Wang return VIRTIO_NET(opaque)->max_queue_pairs > 1; 2923982b78c5SDr. David Alan Gilbert } 2924982b78c5SDr. David Alan Gilbert 2925982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id) 2926982b78c5SDr. David Alan Gilbert { 2927982b78c5SDr. David Alan Gilbert return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque), 2928982b78c5SDr. David Alan Gilbert VIRTIO_NET_F_CTRL_GUEST_OFFLOADS); 2929982b78c5SDr. David Alan Gilbert } 2930982b78c5SDr. David Alan Gilbert 2931982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id) 2932982b78c5SDr. David Alan Gilbert { 2933982b78c5SDr. David Alan Gilbert return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES; 2934982b78c5SDr. David Alan Gilbert } 2935982b78c5SDr. David Alan Gilbert 2936982b78c5SDr. 
David Alan Gilbert static bool mac_table_doesnt_fit(void *opaque, int version_id) 2937982b78c5SDr. David Alan Gilbert { 2938982b78c5SDr. David Alan Gilbert return !mac_table_fits(opaque, version_id); 2939982b78c5SDr. David Alan Gilbert } 2940982b78c5SDr. David Alan Gilbert 2941982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods 2942982b78c5SDr. David Alan Gilbert * although only some fields are used by each. 2943982b78c5SDr. David Alan Gilbert */ 2944982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp { 2945982b78c5SDr. David Alan Gilbert VirtIONet *parent; 2946982b78c5SDr. David Alan Gilbert VirtIONetQueue *vqs_1; 2947441537f1SJason Wang uint16_t curr_queue_pairs_1; 2948982b78c5SDr. David Alan Gilbert uint8_t has_ufo; 2949982b78c5SDr. David Alan Gilbert uint32_t has_vnet_hdr; 2950982b78c5SDr. David Alan Gilbert }; 2951982b78c5SDr. David Alan Gilbert 2952982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than 2953441537f1SJason Wang * the 1st entry in the queue_pairs and only if there's more than one 2954982b78c5SDr. David Alan Gilbert * entry. We use the tmp mechanism to calculate a temporary 2955982b78c5SDr. David Alan Gilbert * pointer and count and also validate the count. 2956982b78c5SDr. David Alan Gilbert */ 2957982b78c5SDr. David Alan Gilbert 295844b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque) 2959982b78c5SDr. David Alan Gilbert { 2960982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 2961982b78c5SDr. David Alan Gilbert 2962982b78c5SDr. David Alan Gilbert tmp->vqs_1 = tmp->parent->vqs + 1; 2963441537f1SJason Wang tmp->curr_queue_pairs_1 = tmp->parent->curr_queue_pairs - 1; 2964441537f1SJason Wang if (tmp->parent->curr_queue_pairs == 0) { 2965441537f1SJason Wang tmp->curr_queue_pairs_1 = 0; 2966982b78c5SDr. David Alan Gilbert } 296744b1ff31SDr. David Alan Gilbert 296844b1ff31SDr. 
David Alan Gilbert return 0; 2969982b78c5SDr. David Alan Gilbert } 2970982b78c5SDr. David Alan Gilbert 2971982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque) 2972982b78c5SDr. David Alan Gilbert { 2973982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 2974982b78c5SDr. David Alan Gilbert 2975982b78c5SDr. David Alan Gilbert /* Reuse the pointer setup from save */ 2976982b78c5SDr. David Alan Gilbert virtio_net_tx_waiting_pre_save(opaque); 2977982b78c5SDr. David Alan Gilbert 2978441537f1SJason Wang if (tmp->parent->curr_queue_pairs > tmp->parent->max_queue_pairs) { 2979441537f1SJason Wang error_report("virtio-net: curr_queue_pairs %x > max_queue_pairs %x", 2980441537f1SJason Wang tmp->parent->curr_queue_pairs, tmp->parent->max_queue_pairs); 2981982b78c5SDr. David Alan Gilbert 2982982b78c5SDr. David Alan Gilbert return -EINVAL; 2983982b78c5SDr. David Alan Gilbert } 2984982b78c5SDr. David Alan Gilbert 2985982b78c5SDr. David Alan Gilbert return 0; /* all good */ 2986982b78c5SDr. David Alan Gilbert } 2987982b78c5SDr. David Alan Gilbert 2988982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = { 2989982b78c5SDr. David Alan Gilbert .name = "virtio-net-tx_waiting", 2990982b78c5SDr. David Alan Gilbert .pre_load = virtio_net_tx_waiting_pre_load, 2991982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_tx_waiting_pre_save, 2992982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 2993982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp, 2994441537f1SJason Wang curr_queue_pairs_1, 2995982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 2996982b78c5SDr. David Alan Gilbert struct VirtIONetQueue), 2997982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 2998982b78c5SDr. David Alan Gilbert }, 2999982b78c5SDr. David Alan Gilbert }; 3000982b78c5SDr. David Alan Gilbert 3001982b78c5SDr. 
David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the 3002982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3003982b78c5SDr. David Alan Gilbert */ 3004982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id) 3005982b78c5SDr. David Alan Gilbert { 3006982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3007982b78c5SDr. David Alan Gilbert 3008982b78c5SDr. David Alan Gilbert if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) { 3009982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires TUN_F_UFO support"); 3010982b78c5SDr. David Alan Gilbert return -EINVAL; 3011982b78c5SDr. David Alan Gilbert } 3012982b78c5SDr. David Alan Gilbert 3013982b78c5SDr. David Alan Gilbert return 0; 3014982b78c5SDr. David Alan Gilbert } 3015982b78c5SDr. David Alan Gilbert 301644b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque) 3017982b78c5SDr. David Alan Gilbert { 3018982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3019982b78c5SDr. David Alan Gilbert 3020982b78c5SDr. David Alan Gilbert tmp->has_ufo = tmp->parent->has_ufo; 302144b1ff31SDr. David Alan Gilbert 302244b1ff31SDr. David Alan Gilbert return 0; 3023982b78c5SDr. David Alan Gilbert } 3024982b78c5SDr. David Alan Gilbert 3025982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = { 3026982b78c5SDr. David Alan Gilbert .name = "virtio-net-ufo", 3027982b78c5SDr. David Alan Gilbert .post_load = virtio_net_ufo_post_load, 3028982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_ufo_pre_save, 3029982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3030982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp), 3031982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3032982b78c5SDr. David Alan Gilbert }, 3033982b78c5SDr. David Alan Gilbert }; 3034982b78c5SDr. 
David Alan Gilbert 3035982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the 3036982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3037982b78c5SDr. David Alan Gilbert */ 3038982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id) 3039982b78c5SDr. David Alan Gilbert { 3040982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3041982b78c5SDr. David Alan Gilbert 3042982b78c5SDr. David Alan Gilbert if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) { 3043982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires vnet_hdr=on"); 3044982b78c5SDr. David Alan Gilbert return -EINVAL; 3045982b78c5SDr. David Alan Gilbert } 3046982b78c5SDr. David Alan Gilbert 3047982b78c5SDr. David Alan Gilbert return 0; 3048982b78c5SDr. David Alan Gilbert } 3049982b78c5SDr. David Alan Gilbert 305044b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque) 3051982b78c5SDr. David Alan Gilbert { 3052982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3053982b78c5SDr. David Alan Gilbert 3054982b78c5SDr. David Alan Gilbert tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr; 305544b1ff31SDr. David Alan Gilbert 305644b1ff31SDr. David Alan Gilbert return 0; 3057982b78c5SDr. David Alan Gilbert } 3058982b78c5SDr. David Alan Gilbert 3059982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = { 3060982b78c5SDr. David Alan Gilbert .name = "virtio-net-vnet", 3061982b78c5SDr. David Alan Gilbert .post_load = virtio_net_vnet_post_load, 3062982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_vnet_pre_save, 3063982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3064982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp), 3065982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3066982b78c5SDr. David Alan Gilbert }, 3067982b78c5SDr. 
David Alan Gilbert }; 3068982b78c5SDr. David Alan Gilbert 3069e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque) 3070e41b7114SYuri Benditovich { 3071e41b7114SYuri Benditovich return VIRTIO_NET(opaque)->rss_data.enabled; 3072e41b7114SYuri Benditovich } 3073e41b7114SYuri Benditovich 3074e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = { 3075e41b7114SYuri Benditovich .name = "virtio-net-device/rss", 3076e41b7114SYuri Benditovich .version_id = 1, 3077e41b7114SYuri Benditovich .minimum_version_id = 1, 3078e41b7114SYuri Benditovich .needed = virtio_net_rss_needed, 3079e41b7114SYuri Benditovich .fields = (VMStateField[]) { 3080e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.enabled, VirtIONet), 3081e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.redirect, VirtIONet), 3082e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.populate_hash, VirtIONet), 3083e41b7114SYuri Benditovich VMSTATE_UINT32(rss_data.hash_types, VirtIONet), 3084e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.indirections_len, VirtIONet), 3085e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.default_queue, VirtIONet), 3086e41b7114SYuri Benditovich VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet, 3087e41b7114SYuri Benditovich VIRTIO_NET_RSS_MAX_KEY_SIZE), 3088e41b7114SYuri Benditovich VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet, 3089e41b7114SYuri Benditovich rss_data.indirections_len, 0, 3090e41b7114SYuri Benditovich vmstate_info_uint16, uint16_t), 3091e41b7114SYuri Benditovich VMSTATE_END_OF_LIST() 3092e41b7114SYuri Benditovich }, 3093e41b7114SYuri Benditovich }; 3094e41b7114SYuri Benditovich 3095982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = { 3096982b78c5SDr. David Alan Gilbert .name = "virtio-net-device", 3097982b78c5SDr. David Alan Gilbert .version_id = VIRTIO_NET_VM_VERSION, 3098982b78c5SDr. David Alan Gilbert .minimum_version_id = VIRTIO_NET_VM_VERSION, 3099982b78c5SDr. 
David Alan Gilbert .post_load = virtio_net_post_load_device, 3100982b78c5SDr. David Alan Gilbert .fields = (VMStateField[]) { 3101982b78c5SDr. David Alan Gilbert VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN), 3102982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_POINTER(vqs, VirtIONet, 3103982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3104982b78c5SDr. David Alan Gilbert VirtIONetQueue), 3105982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet), 3106982b78c5SDr. David Alan Gilbert VMSTATE_UINT16(status, VirtIONet), 3107982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(promisc, VirtIONet), 3108982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(allmulti, VirtIONet), 3109982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mac_table.in_use, VirtIONet), 3110982b78c5SDr. David Alan Gilbert 3111982b78c5SDr. David Alan Gilbert /* Guarded pair: If it fits we load it, else we throw it away 3112982b78c5SDr. David Alan Gilbert * - can happen if source has a larger MAC table.; post-load 3113982b78c5SDr. David Alan Gilbert * sets flags in this case. 3114982b78c5SDr. David Alan Gilbert */ 3115982b78c5SDr. David Alan Gilbert VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet, 3116982b78c5SDr. David Alan Gilbert 0, mac_table_fits, mac_table.in_use, 3117982b78c5SDr. David Alan Gilbert ETH_ALEN), 3118982b78c5SDr. David Alan Gilbert VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0, 3119982b78c5SDr. David Alan Gilbert mac_table.in_use, ETH_ALEN), 3120982b78c5SDr. David Alan Gilbert 3121982b78c5SDr. David Alan Gilbert /* Note: This is an array of uint32's that's always been saved as a 3122982b78c5SDr. David Alan Gilbert * buffer; hold onto your endiannesses; it's actually used as a bitmap 3123982b78c5SDr. David Alan Gilbert * but based on the uint. 3124982b78c5SDr. David Alan Gilbert */ 3125982b78c5SDr. David Alan Gilbert VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3), 3126982b78c5SDr. 
David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3127982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_vnet), 3128982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet), 3129982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet), 3130982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(alluni, VirtIONet), 3131982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nomulti, VirtIONet), 3132982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nouni, VirtIONet), 3133982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nobcast, VirtIONet), 3134982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3135982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_ufo), 3136441537f1SJason Wang VMSTATE_SINGLE_TEST(max_queue_pairs, VirtIONet, max_queue_pairs_gt_1, 0, 3137982b78c5SDr. David Alan Gilbert vmstate_info_uint16_equal, uint16_t), 3138441537f1SJason Wang VMSTATE_UINT16_TEST(curr_queue_pairs, VirtIONet, max_queue_pairs_gt_1), 3139982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3140982b78c5SDr. David Alan Gilbert vmstate_virtio_net_tx_waiting), 3141982b78c5SDr. David Alan Gilbert VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet, 3142982b78c5SDr. David Alan Gilbert has_ctrl_guest_offloads), 3143982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3144982b78c5SDr. David Alan Gilbert }, 3145e41b7114SYuri Benditovich .subsections = (const VMStateDescription * []) { 3146e41b7114SYuri Benditovich &vmstate_virtio_net_rss, 3147e41b7114SYuri Benditovich NULL 3148e41b7114SYuri Benditovich } 3149982b78c5SDr. David Alan Gilbert }; 3150982b78c5SDr. 
David Alan Gilbert 31516e790746SPaolo Bonzini static NetClientInfo net_virtio_info = { 3152f394b2e2SEric Blake .type = NET_CLIENT_DRIVER_NIC, 31536e790746SPaolo Bonzini .size = sizeof(NICState), 31546e790746SPaolo Bonzini .can_receive = virtio_net_can_receive, 31556e790746SPaolo Bonzini .receive = virtio_net_receive, 31566e790746SPaolo Bonzini .link_status_changed = virtio_net_set_link_status, 3157b1be4280SAmos Kong .query_rx_filter = virtio_net_query_rxfilter, 3158b2c929f0SDr. David Alan Gilbert .announce = virtio_net_announce, 31596e790746SPaolo Bonzini }; 31606e790746SPaolo Bonzini 31616e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx) 31626e790746SPaolo Bonzini { 316317a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 31646e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx)); 31656e790746SPaolo Bonzini assert(n->vhost_started); 3166ed8b4afeSNikolay Nikolaev return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx); 31676e790746SPaolo Bonzini } 31686e790746SPaolo Bonzini 31696e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx, 31706e790746SPaolo Bonzini bool mask) 31716e790746SPaolo Bonzini { 317217a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 31736e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx)); 31746e790746SPaolo Bonzini assert(n->vhost_started); 3175ed8b4afeSNikolay Nikolaev vhost_net_virtqueue_mask(get_vhost_net(nc->peer), 31766e790746SPaolo Bonzini vdev, idx, mask); 31776e790746SPaolo Bonzini } 31786e790746SPaolo Bonzini 3179019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features) 31806e790746SPaolo Bonzini { 31810cd09c3aSCornelia Huck virtio_add_feature(&host_features, VIRTIO_NET_F_MAC); 3182a93e599dSMaxime Coquelin 3183ba550851SStefano Garzarella n->config_size = virtio_feature_get_config_size(feature_sizes, 3184ba550851SStefano Garzarella 
host_features); 318517ec5a86SKONRAD Frederic } 31866e790746SPaolo Bonzini 31878a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name, 31888a253ec2SKONRAD Frederic const char *type) 31898a253ec2SKONRAD Frederic { 31908a253ec2SKONRAD Frederic /* 31918a253ec2SKONRAD Frederic * The name can be NULL, the netclient name will be type.x. 31928a253ec2SKONRAD Frederic */ 31938a253ec2SKONRAD Frederic assert(type != NULL); 31948a253ec2SKONRAD Frederic 31958a253ec2SKONRAD Frederic g_free(n->netclient_name); 31968a253ec2SKONRAD Frederic g_free(n->netclient_type); 31978a253ec2SKONRAD Frederic n->netclient_name = g_strdup(name); 31988a253ec2SKONRAD Frederic n->netclient_type = g_strdup(type); 31998a253ec2SKONRAD Frederic } 32008a253ec2SKONRAD Frederic 32010e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev) 32029711cd0dSJens Freimann { 32039711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 32049711cd0dSJens Freimann PCIDevice *pci_dev; 32059711cd0dSJens Freimann Error *err = NULL; 32069711cd0dSJens Freimann 32070e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 32089711cd0dSJens Freimann if (hotplug_ctrl) { 32090e9a65c5SJuan Quintela pci_dev = PCI_DEVICE(dev); 32109711cd0dSJens Freimann pci_dev->partially_hotplugged = true; 32110e9a65c5SJuan Quintela hotplug_handler_unplug_request(hotplug_ctrl, dev, &err); 32129711cd0dSJens Freimann if (err) { 32139711cd0dSJens Freimann error_report_err(err); 32149711cd0dSJens Freimann return false; 32159711cd0dSJens Freimann } 32169711cd0dSJens Freimann } else { 32179711cd0dSJens Freimann return false; 32189711cd0dSJens Freimann } 32199711cd0dSJens Freimann return true; 32209711cd0dSJens Freimann } 32219711cd0dSJens Freimann 32220e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev, 32230e9a65c5SJuan Quintela Error **errp) 32249711cd0dSJens Freimann { 32255a0948d3SMarkus Armbruster Error *err = NULL; 32269711cd0dSJens 
Freimann HotplugHandler *hotplug_ctrl; 32270e9a65c5SJuan Quintela PCIDevice *pdev = PCI_DEVICE(dev); 322878274682SJuan Quintela BusState *primary_bus; 32299711cd0dSJens Freimann 32309711cd0dSJens Freimann if (!pdev->partially_hotplugged) { 32319711cd0dSJens Freimann return true; 32329711cd0dSJens Freimann } 32330e9a65c5SJuan Quintela primary_bus = dev->parent_bus; 323478274682SJuan Quintela if (!primary_bus) { 3235150ab54aSJens Freimann error_setg(errp, "virtio_net: couldn't find primary bus"); 32365a0948d3SMarkus Armbruster return false; 32379711cd0dSJens Freimann } 32380e9a65c5SJuan Quintela qdev_set_parent_bus(dev, primary_bus, &error_abort); 3239e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 32400e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 32419711cd0dSJens Freimann if (hotplug_ctrl) { 32420e9a65c5SJuan Quintela hotplug_handler_pre_plug(hotplug_ctrl, dev, &err); 32435a0948d3SMarkus Armbruster if (err) { 32445a0948d3SMarkus Armbruster goto out; 32455a0948d3SMarkus Armbruster } 32460e9a65c5SJuan Quintela hotplug_handler_plug(hotplug_ctrl, dev, &err); 32479711cd0dSJens Freimann } 3248109c20eaSLaurent Vivier pdev->partially_hotplugged = false; 3249150ab54aSJens Freimann 3250150ab54aSJens Freimann out: 32515a0948d3SMarkus Armbruster error_propagate(errp, err); 32525a0948d3SMarkus Armbruster return !err; 32539711cd0dSJens Freimann } 32549711cd0dSJens Freimann 325507a5d816SJuan Quintela static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationState *s) 32569711cd0dSJens Freimann { 32579711cd0dSJens Freimann bool should_be_hidden; 32589711cd0dSJens Freimann Error *err = NULL; 325907a5d816SJuan Quintela DeviceState *dev = failover_find_primary_device(n); 326007a5d816SJuan Quintela 326107a5d816SJuan Quintela if (!dev) { 326207a5d816SJuan Quintela return; 326307a5d816SJuan Quintela } 32649711cd0dSJens Freimann 3265e2bde83eSJuan Quintela should_be_hidden = qatomic_read(&n->failover_primary_hidden); 
32669711cd0dSJens Freimann 32674dbac1aeSMarkus Armbruster if (migration_in_setup(s) && !should_be_hidden) { 326807a5d816SJuan Quintela if (failover_unplug_primary(n, dev)) { 326907a5d816SJuan Quintela vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev); 327007a5d816SJuan Quintela qapi_event_send_unplug_primary(dev->id); 3271e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 32729711cd0dSJens Freimann } else { 32739711cd0dSJens Freimann warn_report("couldn't unplug primary device"); 32749711cd0dSJens Freimann } 32759711cd0dSJens Freimann } else if (migration_has_failed(s)) { 3276150ab54aSJens Freimann /* We already unplugged the device let's plug it back */ 327707a5d816SJuan Quintela if (!failover_replug_primary(n, dev, &err)) { 32789711cd0dSJens Freimann if (err) { 32799711cd0dSJens Freimann error_report_err(err); 32809711cd0dSJens Freimann } 32819711cd0dSJens Freimann } 32829711cd0dSJens Freimann } 32839711cd0dSJens Freimann } 32849711cd0dSJens Freimann 32859711cd0dSJens Freimann static void virtio_net_migration_state_notifier(Notifier *notifier, void *data) 32869711cd0dSJens Freimann { 32879711cd0dSJens Freimann MigrationState *s = data; 32889711cd0dSJens Freimann VirtIONet *n = container_of(notifier, VirtIONet, migration_state); 32899711cd0dSJens Freimann virtio_net_handle_migration_primary(n, s); 32909711cd0dSJens Freimann } 32919711cd0dSJens Freimann 3292b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener, 3293f3558b1bSKevin Wolf const QDict *device_opts, 3294f3558b1bSKevin Wolf bool from_json, 3295f3558b1bSKevin Wolf Error **errp) 32969711cd0dSJens Freimann { 32979711cd0dSJens Freimann VirtIONet *n = container_of(listener, VirtIONet, primary_listener); 32984f0303aeSJuan Quintela const char *standby_id; 32999711cd0dSJens Freimann 33004d0e59acSJens Freimann if (!device_opts) { 330189631fedSJuan Quintela return false; 33024d0e59acSJens Freimann } 3303bcfc906bSLaurent Vivier 3304bcfc906bSLaurent 
Vivier if (!qdict_haskey(device_opts, "failover_pair_id")) { 3305bcfc906bSLaurent Vivier return false; 3306bcfc906bSLaurent Vivier } 3307bcfc906bSLaurent Vivier 3308bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "id")) { 3309bcfc906bSLaurent Vivier error_setg(errp, "Device with failover_pair_id needs to have id"); 3310bcfc906bSLaurent Vivier return false; 3311bcfc906bSLaurent Vivier } 3312bcfc906bSLaurent Vivier 3313bcfc906bSLaurent Vivier standby_id = qdict_get_str(device_opts, "failover_pair_id"); 331489631fedSJuan Quintela if (g_strcmp0(standby_id, n->netclient_name) != 0) { 331589631fedSJuan Quintela return false; 33169711cd0dSJens Freimann } 33179711cd0dSJens Freimann 33187fe7791eSLaurent Vivier /* 33197fe7791eSLaurent Vivier * The hide helper can be called several times for a given device. 33207fe7791eSLaurent Vivier * Check there is only one primary for a virtio-net device but 33217fe7791eSLaurent Vivier * don't duplicate the qdict several times if it's called for the same 33227fe7791eSLaurent Vivier * device. 
33237fe7791eSLaurent Vivier */ 3324259a10dbSKevin Wolf if (n->primary_opts) { 33257fe7791eSLaurent Vivier const char *old, *new; 33267fe7791eSLaurent Vivier /* devices with failover_pair_id always have an id */ 33277fe7791eSLaurent Vivier old = qdict_get_str(n->primary_opts, "id"); 33287fe7791eSLaurent Vivier new = qdict_get_str(device_opts, "id"); 33297fe7791eSLaurent Vivier if (strcmp(old, new) != 0) { 33307fe7791eSLaurent Vivier error_setg(errp, "Cannot attach more than one primary device to " 33317fe7791eSLaurent Vivier "'%s': '%s' and '%s'", n->netclient_name, old, new); 3332259a10dbSKevin Wolf return false; 3333259a10dbSKevin Wolf } 33347fe7791eSLaurent Vivier } else { 3335f3558b1bSKevin Wolf n->primary_opts = qdict_clone_shallow(device_opts); 3336f3558b1bSKevin Wolf n->primary_opts_from_json = from_json; 33377fe7791eSLaurent Vivier } 3338259a10dbSKevin Wolf 3339e2bde83eSJuan Quintela /* failover_primary_hidden is set during feature negotiation */ 33403abad4a2SJuan Quintela return qatomic_read(&n->failover_primary_hidden); 33419711cd0dSJens Freimann } 33429711cd0dSJens Freimann 3343e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp) 334417ec5a86SKONRAD Frederic { 3345e6f746b3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3346284a32f0SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3347284a32f0SAndreas Färber NetClientState *nc; 33481773d9eeSKONRAD Frederic int i; 334917ec5a86SKONRAD Frederic 3350a93e599dSMaxime Coquelin if (n->net_conf.mtu) { 3351127833eeSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_MTU); 3352a93e599dSMaxime Coquelin } 3353a93e599dSMaxime Coquelin 33549473939eSJason Baron if (n->net_conf.duplex_str) { 33559473939eSJason Baron if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) { 33569473939eSJason Baron n->net_conf.duplex = DUPLEX_HALF; 33579473939eSJason Baron } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) { 33589473939eSJason Baron n->net_conf.duplex = DUPLEX_FULL; 
33599473939eSJason Baron } else { 33609473939eSJason Baron error_setg(errp, "'duplex' must be 'half' or 'full'"); 3361843c4cfcSMarkus Armbruster return; 33629473939eSJason Baron } 33639473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 33649473939eSJason Baron } else { 33659473939eSJason Baron n->net_conf.duplex = DUPLEX_UNKNOWN; 33669473939eSJason Baron } 33679473939eSJason Baron 33689473939eSJason Baron if (n->net_conf.speed < SPEED_UNKNOWN) { 33699473939eSJason Baron error_setg(errp, "'speed' must be between 0 and INT_MAX"); 3370843c4cfcSMarkus Armbruster return; 3371843c4cfcSMarkus Armbruster } 3372843c4cfcSMarkus Armbruster if (n->net_conf.speed >= 0) { 33739473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 33749473939eSJason Baron } 33759473939eSJason Baron 33769711cd0dSJens Freimann if (n->failover) { 3377b91ad981SJuan Quintela n->primary_listener.hide_device = failover_hide_primary_device; 3378e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 33799711cd0dSJens Freimann device_listener_register(&n->primary_listener); 33809711cd0dSJens Freimann n->migration_state.notify = virtio_net_migration_state_notifier; 33819711cd0dSJens Freimann add_migration_state_change_notifier(&n->migration_state); 33829711cd0dSJens Freimann n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY); 33839711cd0dSJens Freimann } 33849711cd0dSJens Freimann 3385da3e8a23SShannon Zhao virtio_net_set_config_size(n, n->host_features); 3386284a32f0SAndreas Färber virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size); 338717ec5a86SKONRAD Frederic 33881c0fbfa3SMichael S. Tsirkin /* 33891c0fbfa3SMichael S. Tsirkin * We set a lower limit on RX queue size to what it always was. 33901c0fbfa3SMichael S. Tsirkin * Guests that want a smaller ring can always resize it without 33911c0fbfa3SMichael S. Tsirkin * help from us (using virtio 1 and up). 33921c0fbfa3SMichael S. Tsirkin */ 33931c0fbfa3SMichael S. 
Tsirkin if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE || 33941c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE || 33955f997fd1SMichal Privoznik !is_power_of_2(n->net_conf.rx_queue_size)) { 33961c0fbfa3SMichael S. Tsirkin error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), " 33971c0fbfa3SMichael S. Tsirkin "must be a power of 2 between %d and %d.", 33981c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE, 33991c0fbfa3SMichael S. Tsirkin VIRTQUEUE_MAX_SIZE); 34001c0fbfa3SMichael S. Tsirkin virtio_cleanup(vdev); 34011c0fbfa3SMichael S. Tsirkin return; 34021c0fbfa3SMichael S. Tsirkin } 34031c0fbfa3SMichael S. Tsirkin 34049b02e161SWei Wang if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE || 34059b02e161SWei Wang n->net_conf.tx_queue_size > VIRTQUEUE_MAX_SIZE || 34069b02e161SWei Wang !is_power_of_2(n->net_conf.tx_queue_size)) { 34079b02e161SWei Wang error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), " 34089b02e161SWei Wang "must be a power of 2 between %d and %d", 34099b02e161SWei Wang n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE, 34109b02e161SWei Wang VIRTQUEUE_MAX_SIZE); 34119b02e161SWei Wang virtio_cleanup(vdev); 34129b02e161SWei Wang return; 34139b02e161SWei Wang } 34149b02e161SWei Wang 3415*22288fe5SJason Wang n->max_ncs = MAX(n->nic_conf.peers.queues, 1); 3416*22288fe5SJason Wang 3417*22288fe5SJason Wang /* 3418*22288fe5SJason Wang * Figure out the datapath queue pairs since the backend could 3419*22288fe5SJason Wang * provide control queue via peers as well. 
3420*22288fe5SJason Wang */ 3421*22288fe5SJason Wang if (n->nic_conf.peers.queues) { 3422*22288fe5SJason Wang for (i = 0; i < n->max_ncs; i++) { 3423*22288fe5SJason Wang if (n->nic_conf.peers.ncs[i]->is_datapath) { 3424*22288fe5SJason Wang ++n->max_queue_pairs; 3425*22288fe5SJason Wang } 3426*22288fe5SJason Wang } 3427*22288fe5SJason Wang } 3428*22288fe5SJason Wang n->max_queue_pairs = MAX(n->max_queue_pairs, 1); 3429*22288fe5SJason Wang 3430441537f1SJason Wang if (n->max_queue_pairs * 2 + 1 > VIRTIO_QUEUE_MAX) { 3431*22288fe5SJason Wang error_setg(errp, "Invalid number of queue pairs (= %" PRIu32 "), " 3432631b22eaSStefan Weil "must be a positive integer less than %d.", 3433441537f1SJason Wang n->max_queue_pairs, (VIRTIO_QUEUE_MAX - 1) / 2); 34347e0e736eSJason Wang virtio_cleanup(vdev); 34357e0e736eSJason Wang return; 34367e0e736eSJason Wang } 3437441537f1SJason Wang n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queue_pairs); 3438441537f1SJason Wang n->curr_queue_pairs = 1; 34391773d9eeSKONRAD Frederic n->tx_timeout = n->net_conf.txtimer; 34406e790746SPaolo Bonzini 34411773d9eeSKONRAD Frederic if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer") 34421773d9eeSKONRAD Frederic && strcmp(n->net_conf.tx, "bh")) { 34430765691eSMarkus Armbruster warn_report("virtio-net: " 34446e790746SPaolo Bonzini "Unknown option tx=%s, valid options: \"timer\" \"bh\"", 34451773d9eeSKONRAD Frederic n->net_conf.tx); 34460765691eSMarkus Armbruster error_printf("Defaulting to \"bh\""); 34476e790746SPaolo Bonzini } 34486e790746SPaolo Bonzini 34492eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n), 34502eef278bSMichael S. 
Tsirkin n->net_conf.tx_queue_size); 34519b02e161SWei Wang 3452441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3453f9d6dbf0SWen Congyang virtio_net_add_queue(n, i); 3454da51a335SJason Wang } 3455da51a335SJason Wang 345617a0ca55SKONRAD Frederic n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 34571773d9eeSKONRAD Frederic qemu_macaddr_default_if_unset(&n->nic_conf.macaddr); 34581773d9eeSKONRAD Frederic memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac)); 34596e790746SPaolo Bonzini n->status = VIRTIO_NET_S_LINK_UP; 34609d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 34619d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 3462f57fcf70SJason Wang virtio_net_announce_timer, n); 3463b2c929f0SDr. David Alan Gilbert n->announce_timer.round = 0; 34646e790746SPaolo Bonzini 34658a253ec2SKONRAD Frederic if (n->netclient_type) { 34668a253ec2SKONRAD Frederic /* 34678a253ec2SKONRAD Frederic * Happen when virtio_net_set_netclient_name has been called. 
34688a253ec2SKONRAD Frederic */ 34698a253ec2SKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 34708a253ec2SKONRAD Frederic n->netclient_type, n->netclient_name, n); 34718a253ec2SKONRAD Frederic } else { 34721773d9eeSKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 3473284a32f0SAndreas Färber object_get_typename(OBJECT(dev)), dev->id, n); 34748a253ec2SKONRAD Frederic } 34758a253ec2SKONRAD Frederic 3476441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3477d4c62930SBin Meng n->nic->ncs[i].do_not_pad = true; 3478d4c62930SBin Meng } 3479d4c62930SBin Meng 34806e790746SPaolo Bonzini peer_test_vnet_hdr(n); 34816e790746SPaolo Bonzini if (peer_has_vnet_hdr(n)) { 3482441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3483d6085e3aSStefan Hajnoczi qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true); 34846e790746SPaolo Bonzini } 34856e790746SPaolo Bonzini n->host_hdr_len = sizeof(struct virtio_net_hdr); 34866e790746SPaolo Bonzini } else { 34876e790746SPaolo Bonzini n->host_hdr_len = 0; 34886e790746SPaolo Bonzini } 34896e790746SPaolo Bonzini 34901773d9eeSKONRAD Frederic qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a); 34916e790746SPaolo Bonzini 34926e790746SPaolo Bonzini n->vqs[0].tx_waiting = 0; 34931773d9eeSKONRAD Frederic n->tx_burst = n->net_conf.txburst; 3494e22f0603SYuri Benditovich virtio_net_set_mrg_rx_bufs(n, 0, 0, 0); 34956e790746SPaolo Bonzini n->promisc = 1; /* for compatibility */ 34966e790746SPaolo Bonzini 34976e790746SPaolo Bonzini n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 34986e790746SPaolo Bonzini 34996e790746SPaolo Bonzini n->vlans = g_malloc0(MAX_VLAN >> 3); 35006e790746SPaolo Bonzini 3501b1be4280SAmos Kong nc = qemu_get_queue(n->nic); 3502b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 3503b1be4280SAmos Kong 3504e87936eaSCindy Lu if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 3505e87936eaSCindy Lu struct 
virtio_net_config netcfg = {}; 3506e87936eaSCindy Lu memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN); 3507e87936eaSCindy Lu vhost_net_set_config(get_vhost_net(nc->peer), 3508e87936eaSCindy Lu (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_MASTER); 3509e87936eaSCindy Lu } 35102974e916SYuri Benditovich QTAILQ_INIT(&n->rsc_chains); 3511284a32f0SAndreas Färber n->qdev = dev; 35124474e37aSYuri Benditovich 35134474e37aSYuri Benditovich net_rx_pkt_init(&n->rx_pkt, false); 35140145c393SAndrew Melnychenko 35150145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 35160145c393SAndrew Melnychenko virtio_net_load_ebpf(n); 35170145c393SAndrew Melnychenko } 351817ec5a86SKONRAD Frederic } 351917ec5a86SKONRAD Frederic 3520b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev) 352117ec5a86SKONRAD Frederic { 3522306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3523306ec6c3SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3524441537f1SJason Wang int i, max_queue_pairs; 352517ec5a86SKONRAD Frederic 35260145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 35270145c393SAndrew Melnychenko virtio_net_unload_ebpf(n); 35280145c393SAndrew Melnychenko } 35290145c393SAndrew Melnychenko 353017ec5a86SKONRAD Frederic /* This will stop vhost backend if appropriate. 
*/ 353117ec5a86SKONRAD Frederic virtio_net_set_status(vdev, 0); 353217ec5a86SKONRAD Frederic 35338a253ec2SKONRAD Frederic g_free(n->netclient_name); 35348a253ec2SKONRAD Frederic n->netclient_name = NULL; 35358a253ec2SKONRAD Frederic g_free(n->netclient_type); 35368a253ec2SKONRAD Frederic n->netclient_type = NULL; 35378a253ec2SKONRAD Frederic 353817ec5a86SKONRAD Frederic g_free(n->mac_table.macs); 353917ec5a86SKONRAD Frederic g_free(n->vlans); 354017ec5a86SKONRAD Frederic 35419711cd0dSJens Freimann if (n->failover) { 3542f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 354365018100SJuan Quintela device_listener_unregister(&n->primary_listener); 35441e157667SLaurent Vivier remove_migration_state_change_notifier(&n->migration_state); 3545f3558b1bSKevin Wolf } else { 3546f3558b1bSKevin Wolf assert(n->primary_opts == NULL); 35479711cd0dSJens Freimann } 35489711cd0dSJens Freimann 3549441537f1SJason Wang max_queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3550441537f1SJason Wang for (i = 0; i < max_queue_pairs; i++) { 3551f9d6dbf0SWen Congyang virtio_net_del_queue(n, i); 355217ec5a86SKONRAD Frederic } 3553d945d9f1SYuri Benditovich /* delete also control vq */ 3554441537f1SJason Wang virtio_del_queue(vdev, max_queue_pairs * 2); 3555944458b6SDr. 
David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 355617ec5a86SKONRAD Frederic g_free(n->vqs); 355717ec5a86SKONRAD Frederic qemu_del_nic(n->nic); 35582974e916SYuri Benditovich virtio_net_rsc_cleanup(n); 355959079029SYuri Benditovich g_free(n->rss_data.indirections_table); 35604474e37aSYuri Benditovich net_rx_pkt_uninit(n->rx_pkt); 35616a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 356217ec5a86SKONRAD Frederic } 356317ec5a86SKONRAD Frederic 356417ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj) 356517ec5a86SKONRAD Frederic { 356617ec5a86SKONRAD Frederic VirtIONet *n = VIRTIO_NET(obj); 356717ec5a86SKONRAD Frederic 356817ec5a86SKONRAD Frederic /* 356917ec5a86SKONRAD Frederic * The default config_size is sizeof(struct virtio_net_config). 357017ec5a86SKONRAD Frederic * Can be overriden with virtio_net_set_config_size. 357117ec5a86SKONRAD Frederic */ 357217ec5a86SKONRAD Frederic n->config_size = sizeof(struct virtio_net_config); 3573aa4197c3SGonglei device_add_bootindex_property(obj, &n->nic_conf.bootindex, 3574aa4197c3SGonglei "bootindex", "/ethernet-phy@0", 357540c2281cSMarkus Armbruster DEVICE(n)); 35760145c393SAndrew Melnychenko 35770145c393SAndrew Melnychenko ebpf_rss_init(&n->ebpf_rss); 357817ec5a86SKONRAD Frederic } 357917ec5a86SKONRAD Frederic 358044b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque) 35814d45dcfbSHalil Pasic { 35824d45dcfbSHalil Pasic VirtIONet *n = opaque; 35834d45dcfbSHalil Pasic 35844d45dcfbSHalil Pasic /* At this point, backend must be stopped, otherwise 35854d45dcfbSHalil Pasic * it might keep writing to memory. */ 35864d45dcfbSHalil Pasic assert(!n->vhost_started); 358744b1ff31SDr. David Alan Gilbert 358844b1ff31SDr. 
David Alan Gilbert return 0; 35894d45dcfbSHalil Pasic } 35904d45dcfbSHalil Pasic 35919711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque) 35929711cd0dSJens Freimann { 35939711cd0dSJens Freimann DeviceState *dev = opaque; 359421e8709bSJuan Quintela DeviceState *primary; 35959711cd0dSJens Freimann VirtIODevice *vdev = VIRTIO_DEVICE(dev); 35969711cd0dSJens Freimann VirtIONet *n = VIRTIO_NET(vdev); 35979711cd0dSJens Freimann 3598284f42a5SJens Freimann if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) { 3599284f42a5SJens Freimann return false; 3600284f42a5SJens Freimann } 360121e8709bSJuan Quintela primary = failover_find_primary_device(n); 360221e8709bSJuan Quintela return primary ? primary->pending_deleted_event : false; 36039711cd0dSJens Freimann } 36049711cd0dSJens Freimann 36059711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque) 36069711cd0dSJens Freimann { 36079711cd0dSJens Freimann DeviceState *dev = opaque; 36089711cd0dSJens Freimann VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev); 36099711cd0dSJens Freimann 36109711cd0dSJens Freimann return vdc->primary_unplug_pending(dev); 36119711cd0dSJens Freimann } 36129711cd0dSJens Freimann 36134d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = { 36144d45dcfbSHalil Pasic .name = "virtio-net", 36154d45dcfbSHalil Pasic .minimum_version_id = VIRTIO_NET_VM_VERSION, 36164d45dcfbSHalil Pasic .version_id = VIRTIO_NET_VM_VERSION, 36174d45dcfbSHalil Pasic .fields = (VMStateField[]) { 36184d45dcfbSHalil Pasic VMSTATE_VIRTIO_DEVICE, 36194d45dcfbSHalil Pasic VMSTATE_END_OF_LIST() 36204d45dcfbSHalil Pasic }, 36214d45dcfbSHalil Pasic .pre_save = virtio_net_pre_save, 36229711cd0dSJens Freimann .dev_unplug_pending = dev_unplug_pending, 36234d45dcfbSHalil Pasic }; 3624290c2428SDr. 
David Alan Gilbert 362517ec5a86SKONRAD Frederic static Property virtio_net_properties[] = { 3626127833eeSJason Baron DEFINE_PROP_BIT64("csum", VirtIONet, host_features, 3627127833eeSJason Baron VIRTIO_NET_F_CSUM, true), 3628127833eeSJason Baron DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features, 362987108bb2SShannon Zhao VIRTIO_NET_F_GUEST_CSUM, true), 3630127833eeSJason Baron DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true), 3631127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features, 363287108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO4, true), 3633127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features, 363487108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO6, true), 3635127833eeSJason Baron DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features, 363687108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ECN, true), 3637127833eeSJason Baron DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features, 363887108bb2SShannon Zhao VIRTIO_NET_F_GUEST_UFO, true), 3639127833eeSJason Baron DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features, 364087108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ANNOUNCE, true), 3641127833eeSJason Baron DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features, 364287108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO4, true), 3643127833eeSJason Baron DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features, 364487108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO6, true), 3645127833eeSJason Baron DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features, 364687108bb2SShannon Zhao VIRTIO_NET_F_HOST_ECN, true), 3647127833eeSJason Baron DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features, 364887108bb2SShannon Zhao VIRTIO_NET_F_HOST_UFO, true), 3649127833eeSJason Baron DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features, 365087108bb2SShannon Zhao VIRTIO_NET_F_MRG_RXBUF, true), 3651127833eeSJason Baron DEFINE_PROP_BIT64("status", VirtIONet, host_features, 365287108bb2SShannon Zhao VIRTIO_NET_F_STATUS, true), 
3653127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features, 365487108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VQ, true), 3655127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features, 365687108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX, true), 3657127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features, 365887108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VLAN, true), 3659127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features, 366087108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX_EXTRA, true), 3661127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features, 366287108bb2SShannon Zhao VIRTIO_NET_F_CTRL_MAC_ADDR, true), 3663127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features, 366487108bb2SShannon Zhao VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true), 3665127833eeSJason Baron DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false), 366659079029SYuri Benditovich DEFINE_PROP_BIT64("rss", VirtIONet, host_features, 366759079029SYuri Benditovich VIRTIO_NET_F_RSS, false), 3668e22f0603SYuri Benditovich DEFINE_PROP_BIT64("hash", VirtIONet, host_features, 3669e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT, false), 36702974e916SYuri Benditovich DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features, 36712974e916SYuri Benditovich VIRTIO_NET_F_RSC_EXT, false), 36722974e916SYuri Benditovich DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout, 36732974e916SYuri Benditovich VIRTIO_NET_RSC_DEFAULT_INTERVAL), 367417ec5a86SKONRAD Frederic DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf), 367517ec5a86SKONRAD Frederic DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer, 367617ec5a86SKONRAD Frederic TX_TIMER_INTERVAL), 367717ec5a86SKONRAD Frederic DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST), 367817ec5a86SKONRAD Frederic DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx), 36791c0fbfa3SMichael S. 
Tsirkin DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size, 36801c0fbfa3SMichael S. Tsirkin VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE), 36819b02e161SWei Wang DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size, 36829b02e161SWei Wang VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE), 3683a93e599dSMaxime Coquelin DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0), 368475ebec11SMaxime Coquelin DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend, 368575ebec11SMaxime Coquelin true), 36869473939eSJason Baron DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN), 36879473939eSJason Baron DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str), 36889711cd0dSJens Freimann DEFINE_PROP_BOOL("failover", VirtIONet, failover, false), 368917ec5a86SKONRAD Frederic DEFINE_PROP_END_OF_LIST(), 369017ec5a86SKONRAD Frederic }; 369117ec5a86SKONRAD Frederic 369217ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data) 369317ec5a86SKONRAD Frederic { 369417ec5a86SKONRAD Frederic DeviceClass *dc = DEVICE_CLASS(klass); 369517ec5a86SKONRAD Frederic VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 3696e6f746b3SAndreas Färber 36974f67d30bSMarc-André Lureau device_class_set_props(dc, virtio_net_properties); 3698290c2428SDr. 
David Alan Gilbert dc->vmsd = &vmstate_virtio_net; 3699125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_NETWORK, dc->categories); 3700e6f746b3SAndreas Färber vdc->realize = virtio_net_device_realize; 3701306ec6c3SAndreas Färber vdc->unrealize = virtio_net_device_unrealize; 370217ec5a86SKONRAD Frederic vdc->get_config = virtio_net_get_config; 370317ec5a86SKONRAD Frederic vdc->set_config = virtio_net_set_config; 370417ec5a86SKONRAD Frederic vdc->get_features = virtio_net_get_features; 370517ec5a86SKONRAD Frederic vdc->set_features = virtio_net_set_features; 370617ec5a86SKONRAD Frederic vdc->bad_features = virtio_net_bad_features; 370717ec5a86SKONRAD Frederic vdc->reset = virtio_net_reset; 370817ec5a86SKONRAD Frederic vdc->set_status = virtio_net_set_status; 370917ec5a86SKONRAD Frederic vdc->guest_notifier_mask = virtio_net_guest_notifier_mask; 371017ec5a86SKONRAD Frederic vdc->guest_notifier_pending = virtio_net_guest_notifier_pending; 37112a083ffdSMichael S. Tsirkin vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO); 37127788c3f2SMikhail Sennikovsky vdc->post_load = virtio_net_post_load_virtio; 3713982b78c5SDr. 
David Alan Gilbert vdc->vmsd = &vmstate_virtio_net_device; 37149711cd0dSJens Freimann vdc->primary_unplug_pending = primary_unplug_pending; 371517ec5a86SKONRAD Frederic } 371617ec5a86SKONRAD Frederic 371717ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = { 371817ec5a86SKONRAD Frederic .name = TYPE_VIRTIO_NET, 371917ec5a86SKONRAD Frederic .parent = TYPE_VIRTIO_DEVICE, 372017ec5a86SKONRAD Frederic .instance_size = sizeof(VirtIONet), 372117ec5a86SKONRAD Frederic .instance_init = virtio_net_instance_init, 372217ec5a86SKONRAD Frederic .class_init = virtio_net_class_init, 372317ec5a86SKONRAD Frederic }; 372417ec5a86SKONRAD Frederic 372517ec5a86SKONRAD Frederic static void virtio_register_types(void) 372617ec5a86SKONRAD Frederic { 372717ec5a86SKONRAD Frederic type_register_static(&virtio_net_info); 372817ec5a86SKONRAD Frederic } 372917ec5a86SKONRAD Frederic 373017ec5a86SKONRAD Frederic type_init(virtio_register_types) 3731