16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Network Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 149b8bfe21SPeter Maydell #include "qemu/osdep.h" 159711cd0dSJens Freimann #include "qemu/atomic.h" 166e790746SPaolo Bonzini #include "qemu/iov.h" 1768b0a639SSi-Wei Liu #include "qemu/log.h" 18db725815SMarkus Armbruster #include "qemu/main-loop.h" 190b8fa32fSMarkus Armbruster #include "qemu/module.h" 206e790746SPaolo Bonzini #include "hw/virtio/virtio.h" 216e790746SPaolo Bonzini #include "net/net.h" 226e790746SPaolo Bonzini #include "net/checksum.h" 236e790746SPaolo Bonzini #include "net/tap.h" 246e790746SPaolo Bonzini #include "qemu/error-report.h" 256e790746SPaolo Bonzini #include "qemu/timer.h" 269711cd0dSJens Freimann #include "qemu/option.h" 279711cd0dSJens Freimann #include "qemu/option_int.h" 289711cd0dSJens Freimann #include "qemu/config-file.h" 299711cd0dSJens Freimann #include "qapi/qmp/qdict.h" 306e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h" 316e790746SPaolo Bonzini #include "net/vhost_net.h" 329d8c6a25SDr. David Alan Gilbert #include "net/announce.h" 3317ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h" 34e688df6bSMarkus Armbruster #include "qapi/error.h" 359af23989SMarkus Armbruster #include "qapi/qapi-events-net.h" 36a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h" 379711cd0dSJens Freimann #include "qapi/qapi-types-migration.h" 389711cd0dSJens Freimann #include "qapi/qapi-events-migration.h" 391399c60dSRusty Russell #include "hw/virtio/virtio-access.h" 40f8d806c9SJuan Quintela #include "migration/misc.h" 419473939eSJason Baron #include "standard-headers/linux/ethtool.h" 422f780b6aSMarkus Armbruster #include "sysemu/sysemu.h" 439d8c6a25SDr. David Alan Gilbert #include "trace.h" 449711cd0dSJens Freimann #include "monitor/qdev.h" 456b230b7dSAndrew Melnychenko #include "monitor/monitor.h" 46edf5ca5dSMarkus Armbruster #include "hw/pci/pci_device.h" 474474e37aSYuri Benditovich #include "net_rx_pkt.h" 48108a6481SCindy Lu #include "hw/virtio/vhost.h" 491b529d90SLaurent Vivier #include "sysemu/qtest.h" 506e790746SPaolo Bonzini 516e790746SPaolo Bonzini #define VIRTIO_NET_VM_VERSION 11 526e790746SPaolo Bonzini 531c0fbfa3SMichael S. Tsirkin /* previously fixed value */ 541c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256 559b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256 569b02e161SWei Wang 57441537f1SJason Wang /* for now, only allow larger queue_pairs; with virtio-1, guest can downsize */ 581c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 599b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 601c0fbfa3SMichael S. Tsirkin 612974e916SYuri Benditovich #define VIRTIO_NET_IP4_ADDR_SIZE 8 /* ipv4 saddr + daddr */ 622974e916SYuri Benditovich 632974e916SYuri Benditovich #define VIRTIO_NET_TCP_FLAG 0x3F 642974e916SYuri Benditovich #define VIRTIO_NET_TCP_HDR_LENGTH 0xF000 652974e916SYuri Benditovich 662974e916SYuri Benditovich /* IPv4 max payload, 16 bits in the header */ 672974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header)) 682974e916SYuri Benditovich #define VIRTIO_NET_MAX_TCP_PAYLOAD 65535 692974e916SYuri Benditovich 702974e916SYuri Benditovich /* header length value in ip header without option */ 712974e916SYuri Benditovich #define VIRTIO_NET_IP4_HEADER_LENGTH 5 722974e916SYuri Benditovich 732974e916SYuri Benditovich #define VIRTIO_NET_IP6_ADDR_SIZE 32 /* ipv6 saddr + daddr */ 742974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD 752974e916SYuri Benditovich 762974e916SYuri Benditovich /* Purge coalesced packets timer interval, This value affects the performance 772974e916SYuri Benditovich a lot, and should be tuned carefully, '300000'(300us) is the recommended 782974e916SYuri Benditovich value to pass the WHQL test, '50000' can gain 2x netperf throughput with 792974e916SYuri Benditovich tso/gso/gro 'off'. */ 802974e916SYuri Benditovich #define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000 812974e916SYuri Benditovich 8259079029SYuri Benditovich #define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \ 8359079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \ 8459079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \ 8559079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \ 8659079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \ 8759079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \ 8859079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \ 8959079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \ 9059079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) 9159079029SYuri Benditovich 92ad6461adSPhilippe Mathieu-Daudé static const VirtIOFeature feature_sizes[] = { 93127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MAC, 945d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mac)}, 95127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_STATUS, 965d5b33c0SMax Reitz .end = endof(struct virtio_net_config, status)}, 97127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MQ, 985d5b33c0SMax Reitz .end = endof(struct virtio_net_config, max_virtqueue_pairs)}, 99127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MTU, 1005d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mtu)}, 1019473939eSJason Baron {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX, 1025d5b33c0SMax Reitz .end = endof(struct virtio_net_config, duplex)}, 103e22f0603SYuri Benditovich {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT), 10459079029SYuri Benditovich .end = endof(struct virtio_net_config, supported_hash_types)}, 1056e790746SPaolo Bonzini {} 1066e790746SPaolo Bonzini }; 1076e790746SPaolo Bonzini 108d74c30c8SDaniil Tatianin static const VirtIOConfigSizeParams cfg_size_params = { 109d74c30c8SDaniil Tatianin .min_size = endof(struct virtio_net_config, mac), 110d74c30c8SDaniil Tatianin .max_size = sizeof(struct virtio_net_config), 111d74c30c8SDaniil Tatianin .feature_sizes = feature_sizes 112d74c30c8SDaniil Tatianin }; 113d74c30c8SDaniil Tatianin 1146e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc) 1156e790746SPaolo Bonzini { 1166e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1176e790746SPaolo Bonzini 1186e790746SPaolo Bonzini return &n->vqs[nc->queue_index]; 1196e790746SPaolo Bonzini } 1206e790746SPaolo Bonzini 1216e790746SPaolo Bonzini static int vq2q(int queue_index) 1226e790746SPaolo Bonzini { 1236e790746SPaolo Bonzini return queue_index / 2; 1246e790746SPaolo Bonzini } 1256e790746SPaolo Bonzini 1264fdf69abSKangjie Xu static void flush_or_purge_queued_packets(NetClientState *nc) 1274fdf69abSKangjie Xu { 1284fdf69abSKangjie Xu if (!nc->peer) { 1294fdf69abSKangjie Xu return; 1304fdf69abSKangjie Xu } 1314fdf69abSKangjie Xu 1324fdf69abSKangjie Xu qemu_flush_or_purge_queued_packets(nc->peer, true); 1334fdf69abSKangjie Xu assert(!virtio_net_get_subqueue(nc)->async_tx.elem); 1344fdf69abSKangjie Xu } 1354fdf69abSKangjie Xu 1366e790746SPaolo Bonzini /* TODO 1376e790746SPaolo Bonzini * - we could suppress RX interrupt if we were so inclined. 1386e790746SPaolo Bonzini */ 1396e790746SPaolo Bonzini 1406e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config) 1416e790746SPaolo Bonzini { 14217a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1436e790746SPaolo Bonzini struct virtio_net_config netcfg; 144c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 145fb592882SCindy Lu static const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } }; 1466e790746SPaolo Bonzini 147108a6481SCindy Lu int ret = 0; 148108a6481SCindy Lu memset(&netcfg, 0 , sizeof(struct virtio_net_config)); 1491399c60dSRusty Russell virtio_stw_p(vdev, &netcfg.status, n->status); 150441537f1SJason Wang virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queue_pairs); 151a93e599dSMaxime Coquelin virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu); 1526e790746SPaolo Bonzini memcpy(netcfg.mac, n->mac, ETH_ALEN); 1539473939eSJason Baron virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed); 1549473939eSJason Baron netcfg.duplex = n->net_conf.duplex; 15559079029SYuri Benditovich netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE; 15659079029SYuri Benditovich virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length, 157e22f0603SYuri Benditovich virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ? 158e22f0603SYuri Benditovich VIRTIO_NET_RSS_MAX_TABLE_LEN : 1); 15959079029SYuri Benditovich virtio_stl_p(vdev, &netcfg.supported_hash_types, 16059079029SYuri Benditovich VIRTIO_NET_RSS_SUPPORTED_HASHES); 1616e790746SPaolo Bonzini memcpy(config, &netcfg, n->config_size); 162108a6481SCindy Lu 163c546ecf2SJason Wang /* 164c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 165c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 166c546ecf2SJason Wang */ 167c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 168108a6481SCindy Lu ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg, 169108a6481SCindy Lu n->config_size); 170ebc141a6SEugenio Pérez if (ret == -1) { 171ebc141a6SEugenio Pérez return; 172ebc141a6SEugenio Pérez } 173ebc141a6SEugenio Pérez 174fb592882SCindy Lu /* 175ebc141a6SEugenio Pérez * Some NIC/kernel combinations present 0 as the mac address. As that 176ebc141a6SEugenio Pérez * is not a legal address, try to proceed with the address from the 177ebc141a6SEugenio Pérez * QEMU command line in the hope that the address has been configured 178ebc141a6SEugenio Pérez * correctly elsewhere - just not reported by the device. 179fb592882SCindy Lu */ 180fb592882SCindy Lu if (memcmp(&netcfg.mac, &zero, sizeof(zero)) == 0) { 181fb592882SCindy Lu info_report("Zero hardware mac address detected. Ignoring."); 182fb592882SCindy Lu memcpy(netcfg.mac, n->mac, ETH_ALEN); 183fb592882SCindy Lu } 184ebc141a6SEugenio Pérez 1854f93aafcSEugenio Pérez netcfg.status |= virtio_tswap16(vdev, 1864f93aafcSEugenio Pérez n->status & VIRTIO_NET_S_ANNOUNCE); 187108a6481SCindy Lu memcpy(config, &netcfg, n->config_size); 188108a6481SCindy Lu } 189108a6481SCindy Lu } 1906e790746SPaolo Bonzini 1916e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config) 1926e790746SPaolo Bonzini { 19317a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1946e790746SPaolo Bonzini struct virtio_net_config netcfg = {}; 195c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 1966e790746SPaolo Bonzini 1976e790746SPaolo Bonzini memcpy(&netcfg, config, n->config_size); 1986e790746SPaolo Bonzini 19995129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) && 20095129d6fSCornelia Huck !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) && 2016e790746SPaolo Bonzini memcmp(netcfg.mac, n->mac, ETH_ALEN)) { 2026e790746SPaolo Bonzini memcpy(n->mac, netcfg.mac, ETH_ALEN); 2036e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 2046e790746SPaolo Bonzini } 205108a6481SCindy Lu 206c546ecf2SJason Wang /* 207c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 208c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 209c546ecf2SJason Wang */ 210c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 211c546ecf2SJason Wang vhost_net_set_config(get_vhost_net(nc->peer), 212c546ecf2SJason Wang (uint8_t *)&netcfg, 0, n->config_size, 213f8ed3648SManos Pitsidianakis VHOST_SET_CONFIG_TYPE_FRONTEND); 214108a6481SCindy Lu } 2156e790746SPaolo Bonzini } 2166e790746SPaolo Bonzini 2176e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status) 2186e790746SPaolo Bonzini { 21917a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2206e790746SPaolo Bonzini return (status & VIRTIO_CONFIG_S_DRIVER_OK) && 22117a0ca55SKONRAD Frederic (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running; 2226e790746SPaolo Bonzini } 2236e790746SPaolo Bonzini 224b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net) 225b2c929f0SDr. David Alan Gilbert { 226b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(net); 227b2c929f0SDr. David Alan Gilbert trace_virtio_net_announce_notify(); 228b2c929f0SDr. David Alan Gilbert 229b2c929f0SDr. David Alan Gilbert net->status |= VIRTIO_NET_S_ANNOUNCE; 230b2c929f0SDr. David Alan Gilbert virtio_notify_config(vdev); 231b2c929f0SDr. David Alan Gilbert } 232b2c929f0SDr. David Alan Gilbert 233f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque) 234f57fcf70SJason Wang { 235f57fcf70SJason Wang VirtIONet *n = opaque; 2369d8c6a25SDr. David Alan Gilbert trace_virtio_net_announce_timer(n->announce_timer.round); 237f57fcf70SJason Wang 2389d8c6a25SDr. David Alan Gilbert n->announce_timer.round--; 239b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 240b2c929f0SDr. David Alan Gilbert } 241b2c929f0SDr. David Alan Gilbert 242b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc) 243b2c929f0SDr. David Alan Gilbert { 244b2c929f0SDr. David Alan Gilbert VirtIONet *n = qemu_get_nic_opaque(nc); 245b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 246b2c929f0SDr. David Alan Gilbert 247b2c929f0SDr. David Alan Gilbert /* 248b2c929f0SDr. David Alan Gilbert * Make sure the virtio migration announcement timer isn't running 249b2c929f0SDr. David Alan Gilbert * If it is, let it trigger announcement so that we do not cause 250b2c929f0SDr. David Alan Gilbert * confusion. 251b2c929f0SDr. David Alan Gilbert */ 252b2c929f0SDr. David Alan Gilbert if (n->announce_timer.round) { 253b2c929f0SDr. David Alan Gilbert return; 254b2c929f0SDr. David Alan Gilbert } 255b2c929f0SDr. David Alan Gilbert 256b2c929f0SDr. David Alan Gilbert if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 257b2c929f0SDr. David Alan Gilbert virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 258b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 259b2c929f0SDr. David Alan Gilbert } 260f57fcf70SJason Wang } 261f57fcf70SJason Wang 2626e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status) 2636e790746SPaolo Bonzini { 26417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2656e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 266441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 267aa858194SSi-Wei Liu int cvq = virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ) ? 268aa858194SSi-Wei Liu n->max_ncs - n->max_queue_pairs : 0; 2696e790746SPaolo Bonzini 270ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 2716e790746SPaolo Bonzini return; 2726e790746SPaolo Bonzini } 2736e790746SPaolo Bonzini 2748c1ac475SRadim Krčmář if ((virtio_net_started(n, status) && !nc->peer->link_down) == 2758c1ac475SRadim Krčmář !!n->vhost_started) { 2766e790746SPaolo Bonzini return; 2776e790746SPaolo Bonzini } 2786e790746SPaolo Bonzini if (!n->vhost_started) { 279086abc1cSMichael S. Tsirkin int r, i; 280086abc1cSMichael S. Tsirkin 2811bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 2821bfa316cSGreg Kurz error_report("backend does not support %s vnet headers; " 2831bfa316cSGreg Kurz "falling back on userspace virtio", 2841bfa316cSGreg Kurz virtio_is_big_endian(vdev) ? "BE" : "LE"); 2851bfa316cSGreg Kurz return; 2861bfa316cSGreg Kurz } 2871bfa316cSGreg Kurz 288086abc1cSMichael S. Tsirkin /* Any packets outstanding? Purge them to avoid touching rings 289086abc1cSMichael S. Tsirkin * when vhost is running. 290086abc1cSMichael S. Tsirkin */ 291441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 292086abc1cSMichael S. Tsirkin NetClientState *qnc = qemu_get_subqueue(n->nic, i); 293086abc1cSMichael S. Tsirkin 294086abc1cSMichael S. Tsirkin /* Purge both directions: TX and RX. */ 295086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->peer->incoming_queue, qnc); 296086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->incoming_queue, qnc->peer); 297086abc1cSMichael S. Tsirkin } 298086abc1cSMichael S. Tsirkin 299a93e599dSMaxime Coquelin if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) { 300a93e599dSMaxime Coquelin r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu); 301a93e599dSMaxime Coquelin if (r < 0) { 302a93e599dSMaxime Coquelin error_report("%uBytes MTU not supported by the backend", 303a93e599dSMaxime Coquelin n->net_conf.mtu); 304a93e599dSMaxime Coquelin 305a93e599dSMaxime Coquelin return; 306a93e599dSMaxime Coquelin } 307a93e599dSMaxime Coquelin } 308a93e599dSMaxime Coquelin 3096e790746SPaolo Bonzini n->vhost_started = 1; 31022288fe5SJason Wang r = vhost_net_start(vdev, n->nic->ncs, queue_pairs, cvq); 3116e790746SPaolo Bonzini if (r < 0) { 3126e790746SPaolo Bonzini error_report("unable to start vhost net: %d: " 3136e790746SPaolo Bonzini "falling back on userspace virtio", -r); 3146e790746SPaolo Bonzini n->vhost_started = 0; 3156e790746SPaolo Bonzini } 3166e790746SPaolo Bonzini } else { 31722288fe5SJason Wang vhost_net_stop(vdev, n->nic->ncs, queue_pairs, cvq); 3186e790746SPaolo Bonzini n->vhost_started = 0; 3196e790746SPaolo Bonzini } 3206e790746SPaolo Bonzini } 3216e790746SPaolo Bonzini 3221bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev, 3231bfa316cSGreg Kurz NetClientState *peer, 3241bfa316cSGreg Kurz bool enable) 3251bfa316cSGreg Kurz { 3261bfa316cSGreg Kurz if (virtio_is_big_endian(vdev)) { 3271bfa316cSGreg Kurz return qemu_set_vnet_be(peer, enable); 3281bfa316cSGreg Kurz } else { 3291bfa316cSGreg Kurz return qemu_set_vnet_le(peer, enable); 3301bfa316cSGreg Kurz } 3311bfa316cSGreg Kurz } 3321bfa316cSGreg Kurz 3331bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs, 334441537f1SJason Wang int queue_pairs, bool enable) 3351bfa316cSGreg Kurz { 3361bfa316cSGreg Kurz int i; 3371bfa316cSGreg Kurz 338441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 3391bfa316cSGreg Kurz if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 && 3401bfa316cSGreg Kurz enable) { 3411bfa316cSGreg Kurz while (--i >= 0) { 3421bfa316cSGreg Kurz virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false); 3431bfa316cSGreg Kurz } 3441bfa316cSGreg Kurz 3451bfa316cSGreg Kurz return true; 3461bfa316cSGreg Kurz } 3471bfa316cSGreg Kurz } 3481bfa316cSGreg Kurz 3491bfa316cSGreg Kurz return false; 3501bfa316cSGreg Kurz } 3511bfa316cSGreg Kurz 3521bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status) 3531bfa316cSGreg Kurz { 3541bfa316cSGreg Kurz VirtIODevice *vdev = VIRTIO_DEVICE(n); 355441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3561bfa316cSGreg Kurz 3571bfa316cSGreg Kurz if (virtio_net_started(n, status)) { 3581bfa316cSGreg Kurz /* Before using the device, we tell the network backend about the 3591bfa316cSGreg Kurz * endianness to use when parsing vnet headers. If the backend 3601bfa316cSGreg Kurz * can't do it, we fallback onto fixing the headers in the core 3611bfa316cSGreg Kurz * virtio-net code. 3621bfa316cSGreg Kurz */ 363ad57f700SAkihiko Odaki n->needs_vnet_hdr_swap = n->has_vnet_hdr && 364ad57f700SAkihiko Odaki virtio_net_set_vnet_endian(vdev, n->nic->ncs, 365441537f1SJason Wang queue_pairs, true); 3661bfa316cSGreg Kurz } else if (virtio_net_started(n, vdev->status)) { 3671bfa316cSGreg Kurz /* After using the device, we need to reset the network backend to 3681bfa316cSGreg Kurz * the default (guest native endianness), otherwise the guest may 3691bfa316cSGreg Kurz * lose network connectivity if it is rebooted into a different 3701bfa316cSGreg Kurz * endianness. 3711bfa316cSGreg Kurz */ 372441537f1SJason Wang virtio_net_set_vnet_endian(vdev, n->nic->ncs, queue_pairs, false); 3731bfa316cSGreg Kurz } 3741bfa316cSGreg Kurz } 3751bfa316cSGreg Kurz 376283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq) 377283e2c2aSYuri Benditovich { 378283e2c2aSYuri Benditovich unsigned int dropped = virtqueue_drop_all(vq); 379283e2c2aSYuri Benditovich if (dropped) { 380283e2c2aSYuri Benditovich virtio_notify(vdev, vq); 381283e2c2aSYuri Benditovich } 382283e2c2aSYuri Benditovich } 383283e2c2aSYuri Benditovich 3846e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status) 3856e790746SPaolo Bonzini { 38617a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 3876e790746SPaolo Bonzini VirtIONetQueue *q; 3886e790746SPaolo Bonzini int i; 3896e790746SPaolo Bonzini uint8_t queue_status; 3906e790746SPaolo Bonzini 3911bfa316cSGreg Kurz virtio_net_vnet_endian_status(n, status); 3926e790746SPaolo Bonzini virtio_net_vhost_status(n, status); 3936e790746SPaolo Bonzini 394441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 39538705bb5SFam Zheng NetClientState *ncs = qemu_get_subqueue(n->nic, i); 39638705bb5SFam Zheng bool queue_started; 3976e790746SPaolo Bonzini q = &n->vqs[i]; 3986e790746SPaolo Bonzini 399441537f1SJason Wang if ((!n->multiqueue && i != 0) || i >= n->curr_queue_pairs) { 4006e790746SPaolo Bonzini queue_status = 0; 4016e790746SPaolo Bonzini } else { 4026e790746SPaolo Bonzini queue_status = status; 4036e790746SPaolo Bonzini } 40438705bb5SFam Zheng queue_started = 40538705bb5SFam Zheng virtio_net_started(n, queue_status) && !n->vhost_started; 40638705bb5SFam Zheng 40738705bb5SFam Zheng if (queue_started) { 40838705bb5SFam Zheng qemu_flush_queued_packets(ncs); 40938705bb5SFam Zheng } 4106e790746SPaolo Bonzini 4116e790746SPaolo Bonzini if (!q->tx_waiting) { 4126e790746SPaolo Bonzini continue; 4136e790746SPaolo Bonzini } 4146e790746SPaolo Bonzini 41538705bb5SFam Zheng if (queue_started) { 4166e790746SPaolo Bonzini if (q->tx_timer) { 417bc72ad67SAlex Bligh timer_mod(q->tx_timer, 418bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 4196e790746SPaolo Bonzini } else { 4206e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 4216e790746SPaolo Bonzini } 4226e790746SPaolo Bonzini } else { 4236e790746SPaolo Bonzini if (q->tx_timer) { 424bc72ad67SAlex Bligh timer_del(q->tx_timer); 4256e790746SPaolo Bonzini } else { 4266e790746SPaolo Bonzini qemu_bh_cancel(q->tx_bh); 4276e790746SPaolo Bonzini } 428283e2c2aSYuri Benditovich if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 && 42970e53e6eSJason Wang (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) && 43070e53e6eSJason Wang vdev->vm_running) { 431283e2c2aSYuri Benditovich /* if tx is waiting we are likely have some packets in tx queue 432283e2c2aSYuri Benditovich * and disabled notification */ 433283e2c2aSYuri Benditovich q->tx_waiting = 0; 434283e2c2aSYuri Benditovich virtio_queue_set_notification(q->tx_vq, 1); 435283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, q->tx_vq); 436283e2c2aSYuri Benditovich } 4376e790746SPaolo Bonzini } 4386e790746SPaolo Bonzini } 4396e790746SPaolo Bonzini } 4406e790746SPaolo Bonzini 4416e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc) 4426e790746SPaolo Bonzini { 4436e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 44417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 4456e790746SPaolo Bonzini uint16_t old_status = n->status; 4466e790746SPaolo Bonzini 4476e790746SPaolo Bonzini if (nc->link_down) 4486e790746SPaolo Bonzini n->status &= ~VIRTIO_NET_S_LINK_UP; 4496e790746SPaolo Bonzini else 4506e790746SPaolo Bonzini n->status |= VIRTIO_NET_S_LINK_UP; 4516e790746SPaolo Bonzini 4526e790746SPaolo Bonzini if (n->status != old_status) 45317a0ca55SKONRAD Frederic virtio_notify_config(vdev); 4546e790746SPaolo Bonzini 45517a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 4566e790746SPaolo Bonzini } 4576e790746SPaolo Bonzini 458b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc) 459b1be4280SAmos Kong { 460b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 461b1be4280SAmos Kong 462b1be4280SAmos Kong if (nc->rxfilter_notify_enabled) { 463ddfb0baaSMarkus Armbruster char *path = object_get_canonical_path(OBJECT(n->qdev)); 4647480874aSMarkus Armbruster qapi_event_send_nic_rx_filter_changed(n->netclient_name, path); 46596e35046SAmos Kong g_free(path); 466b1be4280SAmos Kong 467b1be4280SAmos Kong /* disable event notification to avoid events flooding */ 468b1be4280SAmos Kong nc->rxfilter_notify_enabled = 0; 469b1be4280SAmos Kong } 470b1be4280SAmos Kong } 471b1be4280SAmos Kong 472f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n) 473f7bc8ef8SAmos Kong { 47454aa3de7SEric Blake intList *list; 475f7bc8ef8SAmos Kong int i, j; 476f7bc8ef8SAmos Kong 477f7bc8ef8SAmos Kong list = NULL; 478f7bc8ef8SAmos Kong for (i = 0; i < MAX_VLAN >> 5; i++) { 479f7bc8ef8SAmos Kong for (j = 0; n->vlans[i] && j <= 0x1f; j++) { 480f7bc8ef8SAmos Kong if (n->vlans[i] & (1U << j)) { 48154aa3de7SEric Blake QAPI_LIST_PREPEND(list, (i << 5) + j); 482f7bc8ef8SAmos Kong } 483f7bc8ef8SAmos Kong } 484f7bc8ef8SAmos Kong } 485f7bc8ef8SAmos Kong 486f7bc8ef8SAmos Kong return list; 487f7bc8ef8SAmos Kong } 488f7bc8ef8SAmos Kong 489b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc) 490b1be4280SAmos Kong { 491b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 492f7bc8ef8SAmos Kong VirtIODevice *vdev = VIRTIO_DEVICE(n); 493b1be4280SAmos Kong RxFilterInfo *info; 49454aa3de7SEric Blake strList *str_list; 495f7bc8ef8SAmos Kong int i; 496b1be4280SAmos Kong 497b1be4280SAmos Kong info = g_malloc0(sizeof(*info)); 498b1be4280SAmos Kong info->name = g_strdup(nc->name); 499b1be4280SAmos Kong info->promiscuous = n->promisc; 500b1be4280SAmos Kong 501b1be4280SAmos Kong if (n->nouni) { 502b1be4280SAmos Kong info->unicast = RX_STATE_NONE; 503b1be4280SAmos Kong } else if (n->alluni) { 504b1be4280SAmos Kong info->unicast = RX_STATE_ALL; 505b1be4280SAmos Kong } else { 506b1be4280SAmos Kong info->unicast = RX_STATE_NORMAL; 507b1be4280SAmos Kong } 508b1be4280SAmos Kong 509b1be4280SAmos Kong if (n->nomulti) { 510b1be4280SAmos Kong info->multicast = RX_STATE_NONE; 511b1be4280SAmos Kong } else if (n->allmulti) { 512b1be4280SAmos Kong info->multicast = RX_STATE_ALL; 513b1be4280SAmos Kong } else { 514b1be4280SAmos Kong info->multicast = RX_STATE_NORMAL; 515b1be4280SAmos Kong } 516b1be4280SAmos Kong 517b1be4280SAmos Kong info->broadcast_allowed = n->nobcast; 518b1be4280SAmos Kong info->multicast_overflow = n->mac_table.multi_overflow; 519b1be4280SAmos Kong info->unicast_overflow = n->mac_table.uni_overflow; 520b1be4280SAmos Kong 521b0575ba4SScott Feldman info->main_mac = qemu_mac_strdup_printf(n->mac); 522b1be4280SAmos Kong 523b1be4280SAmos Kong str_list = NULL; 524b1be4280SAmos Kong for (i = 0; i < n->mac_table.first_multi; i++) { 52554aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 52654aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 527b1be4280SAmos Kong } 528b1be4280SAmos Kong info->unicast_table = str_list; 529b1be4280SAmos Kong 530b1be4280SAmos Kong str_list = NULL; 531b1be4280SAmos Kong for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 53254aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 53354aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 534b1be4280SAmos Kong } 535b1be4280SAmos Kong info->multicast_table = str_list; 536f7bc8ef8SAmos Kong info->vlan_table = get_vlan_table(n); 537b1be4280SAmos Kong 53895129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) { 539f7bc8ef8SAmos Kong info->vlan = RX_STATE_ALL; 540f7bc8ef8SAmos Kong } else if (!info->vlan_table) { 541f7bc8ef8SAmos Kong info->vlan = RX_STATE_NONE; 542f7bc8ef8SAmos Kong } else { 543f7bc8ef8SAmos Kong info->vlan = RX_STATE_NORMAL; 544b1be4280SAmos Kong } 545b1be4280SAmos Kong 546b1be4280SAmos Kong /* enable event notification after query */ 547b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 548b1be4280SAmos Kong 549b1be4280SAmos Kong return info; 550b1be4280SAmos Kong } 551b1be4280SAmos Kong 5527dc6be52SXuan Zhuo static void virtio_net_queue_reset(VirtIODevice *vdev, uint32_t queue_index) 5537dc6be52SXuan Zhuo { 5547dc6be52SXuan Zhuo VirtIONet *n = VIRTIO_NET(vdev); 555f47af0afSXuan Zhuo NetClientState *nc; 556f47af0afSXuan Zhuo 557f47af0afSXuan Zhuo /* validate queue_index and skip for cvq */ 558f47af0afSXuan Zhuo if (queue_index >= n->max_queue_pairs * 2) { 559f47af0afSXuan Zhuo return; 560f47af0afSXuan Zhuo } 561f47af0afSXuan Zhuo 562f47af0afSXuan Zhuo nc = qemu_get_subqueue(n->nic, vq2q(queue_index)); 5637dc6be52SXuan Zhuo 5647dc6be52SXuan Zhuo if (!nc->peer) { 5657dc6be52SXuan Zhuo return; 5667dc6be52SXuan Zhuo } 5677dc6be52SXuan Zhuo 5687dc6be52SXuan Zhuo if (get_vhost_net(nc->peer) && 5697dc6be52SXuan Zhuo nc->peer->info->type == NET_CLIENT_DRIVER_TAP) { 5707dc6be52SXuan Zhuo vhost_net_virtqueue_reset(vdev, nc, queue_index); 5717dc6be52SXuan Zhuo } 5727dc6be52SXuan Zhuo 5737dc6be52SXuan Zhuo flush_or_purge_queued_packets(nc); 5747dc6be52SXuan Zhuo } 5757dc6be52SXuan Zhuo 5767f863302SKangjie Xu static void virtio_net_queue_enable(VirtIODevice *vdev, uint32_t queue_index) 5777f863302SKangjie Xu { 5787f863302SKangjie Xu VirtIONet *n = VIRTIO_NET(vdev); 579f47af0afSXuan Zhuo NetClientState *nc; 5807f863302SKangjie Xu int r; 5817f863302SKangjie Xu 582f47af0afSXuan Zhuo /* validate queue_index and skip for cvq */ 583f47af0afSXuan Zhuo if (queue_index >= n->max_queue_pairs * 2) { 584f47af0afSXuan Zhuo return; 585f47af0afSXuan Zhuo } 586f47af0afSXuan Zhuo 587f47af0afSXuan Zhuo nc = qemu_get_subqueue(n->nic, vq2q(queue_index)); 588f47af0afSXuan Zhuo 5897f863302SKangjie Xu if (!nc->peer || !vdev->vhost_started) { 5907f863302SKangjie Xu return; 5917f863302SKangjie Xu } 5927f863302SKangjie Xu 5937f863302SKangjie Xu if (get_vhost_net(nc->peer) && 5947f863302SKangjie Xu nc->peer->info->type == NET_CLIENT_DRIVER_TAP) { 5957f863302SKangjie Xu r = vhost_net_virtqueue_restart(vdev, nc, queue_index); 5967f863302SKangjie Xu if (r < 0) { 5977f863302SKangjie Xu error_report("unable to restart vhost net virtqueue: %d, " 5987f863302SKangjie Xu "when resetting the queue", queue_index); 5997f863302SKangjie Xu } 6007f863302SKangjie Xu } 6017f863302SKangjie Xu } 6027f863302SKangjie Xu 6036e790746SPaolo Bonzini static void virtio_net_reset(VirtIODevice *vdev) 6046e790746SPaolo Bonzini { 60517a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 60694b52958SGreg Kurz int i; 6076e790746SPaolo Bonzini 6086e790746SPaolo Bonzini /* Reset back to compatibility mode */ 6096e790746SPaolo Bonzini n->promisc = 1; 6106e790746SPaolo Bonzini n->allmulti = 0; 6116e790746SPaolo Bonzini n->alluni = 0; 6126e790746SPaolo Bonzini n->nomulti = 0; 6136e790746SPaolo Bonzini n->nouni = 0; 6146e790746SPaolo Bonzini n->nobcast = 0; 6156e790746SPaolo Bonzini /* multiqueue is disabled by default */ 616441537f1SJason Wang n->curr_queue_pairs = 1; 6179d8c6a25SDr. David Alan Gilbert timer_del(n->announce_timer.tm); 6189d8c6a25SDr. David Alan Gilbert n->announce_timer.round = 0; 619f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 6206e790746SPaolo Bonzini 6216e790746SPaolo Bonzini /* Flush any MAC and VLAN filter table state */ 6226e790746SPaolo Bonzini n->mac_table.in_use = 0; 6236e790746SPaolo Bonzini n->mac_table.first_multi = 0; 6246e790746SPaolo Bonzini n->mac_table.multi_overflow = 0; 6256e790746SPaolo Bonzini n->mac_table.uni_overflow = 0; 6266e790746SPaolo Bonzini memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN); 6276e790746SPaolo Bonzini memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac)); 628702d66a8SMichael S. Tsirkin qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 6296e790746SPaolo Bonzini memset(n->vlans, 0, MAX_VLAN >> 3); 63094b52958SGreg Kurz 63194b52958SGreg Kurz /* Flush any async TX */ 632441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 6334fdf69abSKangjie Xu flush_or_purge_queued_packets(qemu_get_subqueue(n->nic, i)); 63494b52958SGreg Kurz } 6356e790746SPaolo Bonzini } 6366e790746SPaolo Bonzini 6376e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n) 6386e790746SPaolo Bonzini { 6396e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 6406e790746SPaolo Bonzini if (!nc->peer) { 6416e790746SPaolo Bonzini return; 6426e790746SPaolo Bonzini } 6436e790746SPaolo Bonzini 644d6085e3aSStefan Hajnoczi n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer); 6456e790746SPaolo Bonzini } 6466e790746SPaolo Bonzini 6476e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n) 6486e790746SPaolo Bonzini { 6496e790746SPaolo Bonzini return n->has_vnet_hdr; 6506e790746SPaolo Bonzini } 6516e790746SPaolo Bonzini 6526e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n) 6536e790746SPaolo Bonzini { 6546e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) 6556e790746SPaolo Bonzini return 0; 6566e790746SPaolo Bonzini 657d6085e3aSStefan Hajnoczi n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer); 6586e790746SPaolo Bonzini 6596e790746SPaolo Bonzini return n->has_ufo; 6606e790746SPaolo Bonzini } 6616e790746SPaolo Bonzini 66253da8b5aSYuri Benditovich static int peer_has_uso(VirtIONet *n) 66353da8b5aSYuri Benditovich { 66453da8b5aSYuri Benditovich if (!peer_has_vnet_hdr(n)) { 66553da8b5aSYuri Benditovich return 0; 66653da8b5aSYuri Benditovich } 66753da8b5aSYuri Benditovich 66853da8b5aSYuri Benditovich return qemu_has_uso(qemu_get_queue(n->nic)->peer); 66953da8b5aSYuri Benditovich } 67053da8b5aSYuri Benditovich 671bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs, 672e22f0603SYuri Benditovich int version_1, int hash_report) 6736e790746SPaolo Bonzini { 6746e790746SPaolo Bonzini int i; 6756e790746SPaolo Bonzini NetClientState *nc; 6766e790746SPaolo Bonzini 6776e790746SPaolo Bonzini n->mergeable_rx_bufs = mergeable_rx_bufs; 6786e790746SPaolo Bonzini 679bb9d17f8SCornelia Huck if (version_1) { 680e22f0603SYuri Benditovich n->guest_hdr_len = hash_report ? 681e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_v1_hash) : 682e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_mrg_rxbuf); 683e22f0603SYuri Benditovich n->rss_data.populate_hash = !!hash_report; 684bb9d17f8SCornelia Huck } else { 6856e790746SPaolo Bonzini n->guest_hdr_len = n->mergeable_rx_bufs ? 686bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr_mrg_rxbuf) : 687bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr); 688bb9d17f8SCornelia Huck } 6896e790746SPaolo Bonzini 690441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 6916e790746SPaolo Bonzini nc = qemu_get_subqueue(n->nic, i); 6926e790746SPaolo Bonzini 6936e790746SPaolo Bonzini if (peer_has_vnet_hdr(n) && 694d6085e3aSStefan Hajnoczi qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) { 695d6085e3aSStefan Hajnoczi qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len); 6966e790746SPaolo Bonzini n->host_hdr_len = n->guest_hdr_len; 6976e790746SPaolo Bonzini } 6986e790746SPaolo Bonzini } 6996e790746SPaolo Bonzini } 7006e790746SPaolo Bonzini 7012eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n) 7022eef278bSMichael S. Tsirkin { 7032eef278bSMichael S. Tsirkin NetClientState *peer = n->nic_conf.peers.ncs[0]; 7042eef278bSMichael S. Tsirkin 7052eef278bSMichael S. Tsirkin /* 7060ea5778fSEugenio Pérez * Backends other than vhost-user or vhost-vdpa don't support max queue 7070ea5778fSEugenio Pérez * size. 7082eef278bSMichael S. Tsirkin */ 7092eef278bSMichael S. Tsirkin if (!peer) { 7102eef278bSMichael S. Tsirkin return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 7112eef278bSMichael S. Tsirkin } 7122eef278bSMichael S. Tsirkin 7130ea5778fSEugenio Pérez switch(peer->info->type) { 7140ea5778fSEugenio Pérez case NET_CLIENT_DRIVER_VHOST_USER: 7150ea5778fSEugenio Pérez case NET_CLIENT_DRIVER_VHOST_VDPA: 7162eef278bSMichael S. Tsirkin return VIRTQUEUE_MAX_SIZE; 7170ea5778fSEugenio Pérez default: 7180ea5778fSEugenio Pérez return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 7190ea5778fSEugenio Pérez }; 7202eef278bSMichael S. Tsirkin } 7212eef278bSMichael S. Tsirkin 7226e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index) 7236e790746SPaolo Bonzini { 7246e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 7256e790746SPaolo Bonzini 7266e790746SPaolo Bonzini if (!nc->peer) { 7276e790746SPaolo Bonzini return 0; 7286e790746SPaolo Bonzini } 7296e790746SPaolo Bonzini 730f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 7317263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 1); 7327263a0adSChangchun Ouyang } 7337263a0adSChangchun Ouyang 734f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 7356e790746SPaolo Bonzini return 0; 7366e790746SPaolo Bonzini } 7376e790746SPaolo Bonzini 738441537f1SJason Wang if (n->max_queue_pairs == 1) { 7391074b879SJason Wang return 0; 7401074b879SJason Wang } 7411074b879SJason Wang 7426e790746SPaolo Bonzini return tap_enable(nc->peer); 7436e790746SPaolo Bonzini } 7446e790746SPaolo Bonzini 7456e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index) 7466e790746SPaolo Bonzini { 7476e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 7486e790746SPaolo Bonzini 7496e790746SPaolo Bonzini if (!nc->peer) { 7506e790746SPaolo Bonzini return 0; 7516e790746SPaolo Bonzini } 7526e790746SPaolo Bonzini 753f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 7547263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 0); 7557263a0adSChangchun Ouyang } 7567263a0adSChangchun Ouyang 757f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 7586e790746SPaolo Bonzini return 0; 7596e790746SPaolo Bonzini } 7606e790746SPaolo Bonzini 7616e790746SPaolo Bonzini return tap_disable(nc->peer); 7626e790746SPaolo Bonzini } 7636e790746SPaolo Bonzini 764441537f1SJason Wang static void virtio_net_set_queue_pairs(VirtIONet *n) 7656e790746SPaolo Bonzini { 7666e790746SPaolo Bonzini int i; 767ddfa83eaSJoel Stanley int r; 7686e790746SPaolo Bonzini 76968b5f314SYuri Benditovich if (n->nic->peer_deleted) { 77068b5f314SYuri Benditovich return; 77168b5f314SYuri Benditovich } 77268b5f314SYuri Benditovich 773441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 774441537f1SJason Wang if (i < n->curr_queue_pairs) { 775ddfa83eaSJoel Stanley r = peer_attach(n, i); 776ddfa83eaSJoel Stanley assert(!r); 7776e790746SPaolo Bonzini } else { 778ddfa83eaSJoel Stanley r = peer_detach(n, i); 779ddfa83eaSJoel Stanley assert(!r); 7806e790746SPaolo Bonzini } 7816e790746SPaolo Bonzini } 7826e790746SPaolo Bonzini } 7836e790746SPaolo Bonzini 784ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue); 7856e790746SPaolo Bonzini 7869d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features, 7879d5b731dSJason Wang Error **errp) 7886e790746SPaolo Bonzini { 78917a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 7906e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 7916e790746SPaolo Bonzini 792da3e8a23SShannon Zhao /* Firstly sync all virtio-net possible supported features */ 793da3e8a23SShannon Zhao features |= n->host_features; 794da3e8a23SShannon Zhao 7950cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 7966e790746SPaolo Bonzini 7976e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) { 7980cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_CSUM); 7990cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4); 8000cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6); 8010cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN); 8026e790746SPaolo Bonzini 8030cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM); 8040cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4); 8050cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6); 8060cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN); 807e22f0603SYuri Benditovich 80853da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HOST_USO); 80953da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO4); 81053da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO6); 81153da8b5aSYuri Benditovich 812e22f0603SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT); 8136e790746SPaolo Bonzini } 8146e790746SPaolo Bonzini 8156e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) { 8160cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO); 8170cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO); 8186e790746SPaolo Bonzini } 8196e790746SPaolo Bonzini 82053da8b5aSYuri Benditovich if (!peer_has_uso(n)) { 82153da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HOST_USO); 82253da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO4); 82353da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO6); 82453da8b5aSYuri Benditovich } 82553da8b5aSYuri Benditovich 826ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 8276e790746SPaolo Bonzini return features; 8286e790746SPaolo Bonzini } 8292974e916SYuri Benditovich 8300145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 83159079029SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_RSS); 8320145c393SAndrew Melnychenko } 83375ebec11SMaxime Coquelin features = vhost_net_get_features(get_vhost_net(nc->peer), features); 83475ebec11SMaxime Coquelin vdev->backend_features = features; 83575ebec11SMaxime Coquelin 83675ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 83775ebec11SMaxime Coquelin (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) { 83875ebec11SMaxime Coquelin features |= (1ULL << VIRTIO_NET_F_MTU); 83975ebec11SMaxime Coquelin } 84075ebec11SMaxime Coquelin 841cd69d47cSEugenio Pérez /* 842cd69d47cSEugenio Pérez * Since GUEST_ANNOUNCE is emulated the feature bit could be set without 843cd69d47cSEugenio Pérez * enabled. This happens in the vDPA case. 844cd69d47cSEugenio Pérez * 845cd69d47cSEugenio Pérez * Make sure the feature set is not incoherent, as the driver could refuse 846cd69d47cSEugenio Pérez * to start. 847cd69d47cSEugenio Pérez * 848cd69d47cSEugenio Pérez * TODO: QEMU is able to emulate a CVQ just for guest_announce purposes, 849cd69d47cSEugenio Pérez * helping guest to notify the new location with vDPA devices that does not 850cd69d47cSEugenio Pérez * support it. 851cd69d47cSEugenio Pérez */ 852cd69d47cSEugenio Pérez if (!virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_CTRL_VQ)) { 853cd69d47cSEugenio Pérez virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ANNOUNCE); 854cd69d47cSEugenio Pérez } 855cd69d47cSEugenio Pérez 85675ebec11SMaxime Coquelin return features; 8576e790746SPaolo Bonzini } 8586e790746SPaolo Bonzini 859019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev) 8606e790746SPaolo Bonzini { 861019a3edbSGerd Hoffmann uint64_t features = 0; 8626e790746SPaolo Bonzini 8636e790746SPaolo Bonzini /* Linux kernel 2.6.25. It understood MAC (as everyone must), 8646e790746SPaolo Bonzini * but also these: */ 8650cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 8660cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_CSUM); 8670cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4); 8680cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6); 8690cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN); 8706e790746SPaolo Bonzini 8716e790746SPaolo Bonzini return features; 8726e790746SPaolo Bonzini } 8736e790746SPaolo Bonzini 874644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n) 875644c9858SDmitry Fleytman { 876ad37bb3bSStefan Hajnoczi qemu_set_offload(qemu_get_queue(n->nic)->peer, 877644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)), 878644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)), 879644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)), 880644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)), 8812ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)), 8822ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_USO4)), 8832ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_USO6))); 884644c9858SDmitry Fleytman } 885644c9858SDmitry Fleytman 88653da8b5aSYuri Benditovich static uint64_t virtio_net_guest_offloads_by_features(uint64_t features) 887644c9858SDmitry Fleytman { 888644c9858SDmitry Fleytman static const uint64_t guest_offloads_mask = 889644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_CSUM) | 890644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO4) | 891644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO6) | 892644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_ECN) | 89353da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_UFO) | 89453da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_USO4) | 89553da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_USO6); 896644c9858SDmitry Fleytman 897644c9858SDmitry Fleytman return guest_offloads_mask & features; 898644c9858SDmitry Fleytman } 899644c9858SDmitry Fleytman 9000b545b1eSHawkins Jiawei uint64_t virtio_net_supported_guest_offloads(const VirtIONet *n) 901644c9858SDmitry Fleytman { 902644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 903644c9858SDmitry Fleytman return virtio_net_guest_offloads_by_features(vdev->guest_features); 904644c9858SDmitry Fleytman } 905644c9858SDmitry Fleytman 906f5e1847bSJuan Quintela typedef struct { 907f5e1847bSJuan Quintela VirtIONet *n; 90812b2fad7SKevin Wolf DeviceState *dev; 90912b2fad7SKevin Wolf } FailoverDevice; 910f5e1847bSJuan Quintela 911f5e1847bSJuan Quintela /** 91212b2fad7SKevin Wolf * Set the failover primary device 913f5e1847bSJuan Quintela * 914f5e1847bSJuan Quintela * @opaque: FailoverId to setup 915f5e1847bSJuan Quintela * @opts: opts for device we are handling 916f5e1847bSJuan Quintela * @errp: returns an error if this function fails 917f5e1847bSJuan Quintela */ 91812b2fad7SKevin Wolf static int failover_set_primary(DeviceState *dev, void *opaque) 919f5e1847bSJuan Quintela { 92012b2fad7SKevin Wolf FailoverDevice *fdev = opaque; 92112b2fad7SKevin Wolf PCIDevice *pci_dev = (PCIDevice *) 92212b2fad7SKevin Wolf object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE); 923f5e1847bSJuan Quintela 92412b2fad7SKevin Wolf if (!pci_dev) { 92512b2fad7SKevin Wolf return 0; 92612b2fad7SKevin Wolf } 92712b2fad7SKevin Wolf 92812b2fad7SKevin Wolf if (!g_strcmp0(pci_dev->failover_pair_id, fdev->n->netclient_name)) { 92912b2fad7SKevin Wolf fdev->dev = dev; 930f5e1847bSJuan Quintela return 1; 931f5e1847bSJuan Quintela } 932f5e1847bSJuan Quintela 933f5e1847bSJuan Quintela return 0; 934f5e1847bSJuan Quintela } 935f5e1847bSJuan Quintela 936f5e1847bSJuan Quintela /** 93785d3b931SJuan Quintela * Find the primary device for this failover virtio-net 93885d3b931SJuan Quintela * 93985d3b931SJuan Quintela * @n: VirtIONet device 94085d3b931SJuan Quintela * @errp: returns an error if this function fails 94185d3b931SJuan Quintela */ 9420a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n) 9439711cd0dSJens Freimann { 94412b2fad7SKevin Wolf FailoverDevice fdev = { 94512b2fad7SKevin Wolf .n = n, 94612b2fad7SKevin Wolf }; 9479711cd0dSJens Freimann 94812b2fad7SKevin Wolf qbus_walk_children(sysbus_get_default(), failover_set_primary, NULL, 94912b2fad7SKevin Wolf NULL, NULL, &fdev); 95012b2fad7SKevin Wolf return fdev.dev; 9519711cd0dSJens Freimann } 9529711cd0dSJens Freimann 95321e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp) 95421e8709bSJuan Quintela { 95521e8709bSJuan Quintela Error *err = NULL; 95621e8709bSJuan Quintela DeviceState *dev = failover_find_primary_device(n); 95721e8709bSJuan Quintela 95821e8709bSJuan Quintela if (dev) { 95921e8709bSJuan Quintela return; 96021e8709bSJuan Quintela } 96121e8709bSJuan Quintela 962259a10dbSKevin Wolf if (!n->primary_opts) { 96397ca9c59SLaurent Vivier error_setg(errp, "Primary device not found"); 96497ca9c59SLaurent Vivier error_append_hint(errp, "Virtio-net failover will not work. Make " 96597ca9c59SLaurent Vivier "sure primary device has parameter" 96697ca9c59SLaurent Vivier " failover_pair_id=%s\n", n->netclient_name); 96721e8709bSJuan Quintela return; 96821e8709bSJuan Quintela } 969259a10dbSKevin Wolf 970f3558b1bSKevin Wolf dev = qdev_device_add_from_qdict(n->primary_opts, 971f3558b1bSKevin Wolf n->primary_opts_from_json, 972f3558b1bSKevin Wolf &err); 97321e8709bSJuan Quintela if (err) { 974f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 975259a10dbSKevin Wolf n->primary_opts = NULL; 97600e7b129SLaurent Vivier } else { 97700e7b129SLaurent Vivier object_unref(OBJECT(dev)); 97821e8709bSJuan Quintela } 97921e8709bSJuan Quintela error_propagate(errp, err); 98021e8709bSJuan Quintela } 98121e8709bSJuan Quintela 982d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features) 9836e790746SPaolo Bonzini { 98417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 9859711cd0dSJens Freimann Error *err = NULL; 9866e790746SPaolo Bonzini int i; 9876e790746SPaolo Bonzini 98875ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 98975ebec11SMaxime Coquelin !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) { 99075ebec11SMaxime Coquelin features &= ~(1ULL << VIRTIO_NET_F_MTU); 99175ebec11SMaxime Coquelin } 99275ebec11SMaxime Coquelin 993ef546f12SCornelia Huck virtio_net_set_multiqueue(n, 99459079029SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_RSS) || 99595129d6fSCornelia Huck virtio_has_feature(features, VIRTIO_NET_F_MQ)); 9966e790746SPaolo Bonzini 997ef546f12SCornelia Huck virtio_net_set_mrg_rx_bufs(n, 99895129d6fSCornelia Huck virtio_has_feature(features, 999bb9d17f8SCornelia Huck VIRTIO_NET_F_MRG_RXBUF), 100095129d6fSCornelia Huck virtio_has_feature(features, 1001e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 1002e22f0603SYuri Benditovich virtio_has_feature(features, 1003e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 10046e790746SPaolo Bonzini 10052974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 10062974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4); 10072974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 10082974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6); 1009e22f0603SYuri Benditovich n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS); 10102974e916SYuri Benditovich 10116e790746SPaolo Bonzini if (n->has_vnet_hdr) { 1012644c9858SDmitry Fleytman n->curr_guest_offloads = 1013644c9858SDmitry Fleytman virtio_net_guest_offloads_by_features(features); 1014644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 10156e790746SPaolo Bonzini } 10166e790746SPaolo Bonzini 1017441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 10186e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, i); 10196e790746SPaolo Bonzini 1020ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 10216e790746SPaolo Bonzini continue; 10226e790746SPaolo Bonzini } 1023ed8b4afeSNikolay Nikolaev vhost_net_ack_features(get_vhost_net(nc->peer), features); 1024c9bdc449SHyman Huang(黄勇) 1025c9bdc449SHyman Huang(黄勇) /* 1026c9bdc449SHyman Huang(黄勇) * keep acked_features in NetVhostUserState up-to-date so it 1027c9bdc449SHyman Huang(黄勇) * can't miss any features configured by guest virtio driver. 1028c9bdc449SHyman Huang(黄勇) */ 1029c9bdc449SHyman Huang(黄勇) vhost_net_save_acked_features(nc->peer); 10306e790746SPaolo Bonzini } 10310b1eaa88SStefan Fritsch 103206b636a1SHawkins Jiawei if (!virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) { 10330b1eaa88SStefan Fritsch memset(n->vlans, 0xff, MAX_VLAN >> 3); 10340b1eaa88SStefan Fritsch } 10359711cd0dSJens Freimann 10369711cd0dSJens Freimann if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) { 10379711cd0dSJens Freimann qapi_event_send_failover_negotiated(n->netclient_name); 1038e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 10399711cd0dSJens Freimann failover_add_primary(n, &err); 10409711cd0dSJens Freimann if (err) { 10411b529d90SLaurent Vivier if (!qtest_enabled()) { 10429711cd0dSJens Freimann warn_report_err(err); 10431b529d90SLaurent Vivier } else { 10441b529d90SLaurent Vivier error_free(err); 10451b529d90SLaurent Vivier } 10469711cd0dSJens Freimann } 10476e790746SPaolo Bonzini } 104821e8709bSJuan Quintela } 10496e790746SPaolo Bonzini 10506e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd, 10516e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 10526e790746SPaolo Bonzini { 10536e790746SPaolo Bonzini uint8_t on; 10546e790746SPaolo Bonzini size_t s; 1055b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 10566e790746SPaolo Bonzini 10576e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on)); 10586e790746SPaolo Bonzini if (s != sizeof(on)) { 10596e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10606e790746SPaolo Bonzini } 10616e790746SPaolo Bonzini 10626e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) { 10636e790746SPaolo Bonzini n->promisc = on; 10646e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) { 10656e790746SPaolo Bonzini n->allmulti = on; 10666e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) { 10676e790746SPaolo Bonzini n->alluni = on; 10686e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) { 10696e790746SPaolo Bonzini n->nomulti = on; 10706e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) { 10716e790746SPaolo Bonzini n->nouni = on; 10726e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) { 10736e790746SPaolo Bonzini n->nobcast = on; 10746e790746SPaolo Bonzini } else { 10756e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10766e790746SPaolo Bonzini } 10776e790746SPaolo Bonzini 1078b1be4280SAmos Kong rxfilter_notify(nc); 1079b1be4280SAmos Kong 10806e790746SPaolo Bonzini return VIRTIO_NET_OK; 10816e790746SPaolo Bonzini } 10826e790746SPaolo Bonzini 1083644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd, 1084644c9858SDmitry Fleytman struct iovec *iov, unsigned int iov_cnt) 1085644c9858SDmitry Fleytman { 1086644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 1087644c9858SDmitry Fleytman uint64_t offloads; 1088644c9858SDmitry Fleytman size_t s; 1089644c9858SDmitry Fleytman 109095129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 1091644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1092644c9858SDmitry Fleytman } 1093644c9858SDmitry Fleytman 1094644c9858SDmitry Fleytman s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads)); 1095644c9858SDmitry Fleytman if (s != sizeof(offloads)) { 1096644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1097644c9858SDmitry Fleytman } 1098644c9858SDmitry Fleytman 1099644c9858SDmitry Fleytman if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) { 1100644c9858SDmitry Fleytman uint64_t supported_offloads; 1101644c9858SDmitry Fleytman 1102189ae6bbSJason Wang offloads = virtio_ldq_p(vdev, &offloads); 1103189ae6bbSJason Wang 1104644c9858SDmitry Fleytman if (!n->has_vnet_hdr) { 1105644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1106644c9858SDmitry Fleytman } 1107644c9858SDmitry Fleytman 11082974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 11092974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4); 11102974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 11112974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6); 11122974e916SYuri Benditovich virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT); 11132974e916SYuri Benditovich 1114644c9858SDmitry Fleytman supported_offloads = virtio_net_supported_guest_offloads(n); 1115644c9858SDmitry Fleytman if (offloads & ~supported_offloads) { 1116644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1117644c9858SDmitry Fleytman } 1118644c9858SDmitry Fleytman 1119644c9858SDmitry Fleytman n->curr_guest_offloads = offloads; 1120644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 1121644c9858SDmitry Fleytman 1122644c9858SDmitry Fleytman return VIRTIO_NET_OK; 1123644c9858SDmitry Fleytman } else { 1124644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1125644c9858SDmitry Fleytman } 1126644c9858SDmitry Fleytman } 1127644c9858SDmitry Fleytman 11286e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd, 11296e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 11306e790746SPaolo Bonzini { 11311399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 11326e790746SPaolo Bonzini struct virtio_net_ctrl_mac mac_data; 11336e790746SPaolo Bonzini size_t s; 1134b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 11356e790746SPaolo Bonzini 11366e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) { 11376e790746SPaolo Bonzini if (iov_size(iov, iov_cnt) != sizeof(n->mac)) { 11386e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11396e790746SPaolo Bonzini } 11406e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac)); 11416e790746SPaolo Bonzini assert(s == sizeof(n->mac)); 11426e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 1143b1be4280SAmos Kong rxfilter_notify(nc); 1144b1be4280SAmos Kong 11456e790746SPaolo Bonzini return VIRTIO_NET_OK; 11466e790746SPaolo Bonzini } 11476e790746SPaolo Bonzini 11486e790746SPaolo Bonzini if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) { 11496e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11506e790746SPaolo Bonzini } 11516e790746SPaolo Bonzini 1152cae2e556SAmos Kong int in_use = 0; 1153cae2e556SAmos Kong int first_multi = 0; 1154cae2e556SAmos Kong uint8_t uni_overflow = 0; 1155cae2e556SAmos Kong uint8_t multi_overflow = 0; 1156cae2e556SAmos Kong uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 11576e790746SPaolo Bonzini 11586e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 11596e790746SPaolo Bonzini sizeof(mac_data.entries)); 11601399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 11616e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1162b1be4280SAmos Kong goto error; 11636e790746SPaolo Bonzini } 11646e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 11656e790746SPaolo Bonzini 11666e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) { 1167b1be4280SAmos Kong goto error; 11686e790746SPaolo Bonzini } 11696e790746SPaolo Bonzini 11706e790746SPaolo Bonzini if (mac_data.entries <= MAC_TABLE_ENTRIES) { 1171cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, macs, 11726e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 11736e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1174b1be4280SAmos Kong goto error; 11756e790746SPaolo Bonzini } 1176cae2e556SAmos Kong in_use += mac_data.entries; 11776e790746SPaolo Bonzini } else { 1178cae2e556SAmos Kong uni_overflow = 1; 11796e790746SPaolo Bonzini } 11806e790746SPaolo Bonzini 11816e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN); 11826e790746SPaolo Bonzini 1183cae2e556SAmos Kong first_multi = in_use; 11846e790746SPaolo Bonzini 11856e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 11866e790746SPaolo Bonzini sizeof(mac_data.entries)); 11871399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 11886e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1189b1be4280SAmos Kong goto error; 11906e790746SPaolo Bonzini } 11916e790746SPaolo Bonzini 11926e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 11936e790746SPaolo Bonzini 11946e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) { 1195b1be4280SAmos Kong goto error; 11966e790746SPaolo Bonzini } 11976e790746SPaolo Bonzini 1198edc24385SMichael S. Tsirkin if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) { 1199cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN], 12006e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 12016e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1202b1be4280SAmos Kong goto error; 12036e790746SPaolo Bonzini } 1204cae2e556SAmos Kong in_use += mac_data.entries; 12056e790746SPaolo Bonzini } else { 1206cae2e556SAmos Kong multi_overflow = 1; 12076e790746SPaolo Bonzini } 12086e790746SPaolo Bonzini 1209cae2e556SAmos Kong n->mac_table.in_use = in_use; 1210cae2e556SAmos Kong n->mac_table.first_multi = first_multi; 1211cae2e556SAmos Kong n->mac_table.uni_overflow = uni_overflow; 1212cae2e556SAmos Kong n->mac_table.multi_overflow = multi_overflow; 1213cae2e556SAmos Kong memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN); 1214cae2e556SAmos Kong g_free(macs); 1215b1be4280SAmos Kong rxfilter_notify(nc); 1216b1be4280SAmos Kong 12176e790746SPaolo Bonzini return VIRTIO_NET_OK; 1218b1be4280SAmos Kong 1219b1be4280SAmos Kong error: 1220cae2e556SAmos Kong g_free(macs); 1221b1be4280SAmos Kong return VIRTIO_NET_ERR; 12226e790746SPaolo Bonzini } 12236e790746SPaolo Bonzini 12246e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd, 12256e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 12266e790746SPaolo Bonzini { 12271399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 12286e790746SPaolo Bonzini uint16_t vid; 12296e790746SPaolo Bonzini size_t s; 1230b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 12316e790746SPaolo Bonzini 12326e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid)); 12331399c60dSRusty Russell vid = virtio_lduw_p(vdev, &vid); 12346e790746SPaolo Bonzini if (s != sizeof(vid)) { 12356e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12366e790746SPaolo Bonzini } 12376e790746SPaolo Bonzini 12386e790746SPaolo Bonzini if (vid >= MAX_VLAN) 12396e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12406e790746SPaolo Bonzini 12416e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_VLAN_ADD) 12426e790746SPaolo Bonzini n->vlans[vid >> 5] |= (1U << (vid & 0x1f)); 12436e790746SPaolo Bonzini else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL) 12446e790746SPaolo Bonzini n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f)); 12456e790746SPaolo Bonzini else 12466e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12476e790746SPaolo Bonzini 1248b1be4280SAmos Kong rxfilter_notify(nc); 1249b1be4280SAmos Kong 12506e790746SPaolo Bonzini return VIRTIO_NET_OK; 12516e790746SPaolo Bonzini } 12526e790746SPaolo Bonzini 1253f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd, 1254f57fcf70SJason Wang struct iovec *iov, unsigned int iov_cnt) 1255f57fcf70SJason Wang { 12569d8c6a25SDr. David Alan Gilbert trace_virtio_net_handle_announce(n->announce_timer.round); 1257f57fcf70SJason Wang if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK && 1258f57fcf70SJason Wang n->status & VIRTIO_NET_S_ANNOUNCE) { 1259f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 12609d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 12619d8c6a25SDr. David Alan Gilbert qemu_announce_timer_step(&n->announce_timer); 1262f57fcf70SJason Wang } 1263f57fcf70SJason Wang return VIRTIO_NET_OK; 1264f57fcf70SJason Wang } else { 1265f57fcf70SJason Wang return VIRTIO_NET_ERR; 1266f57fcf70SJason Wang } 1267f57fcf70SJason Wang } 1268f57fcf70SJason Wang 12690145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n); 12700145c393SAndrew Melnychenko 127159079029SYuri Benditovich static void virtio_net_disable_rss(VirtIONet *n) 127259079029SYuri Benditovich { 127359079029SYuri Benditovich if (n->rss_data.enabled) { 127459079029SYuri Benditovich trace_virtio_net_rss_disable(); 127559079029SYuri Benditovich } 127659079029SYuri Benditovich n->rss_data.enabled = false; 12770145c393SAndrew Melnychenko 12780145c393SAndrew Melnychenko virtio_net_detach_epbf_rss(n); 12790145c393SAndrew Melnychenko } 12800145c393SAndrew Melnychenko 12810145c393SAndrew Melnychenko static bool virtio_net_attach_ebpf_to_backend(NICState *nic, int prog_fd) 12820145c393SAndrew Melnychenko { 12830145c393SAndrew Melnychenko NetClientState *nc = qemu_get_peer(qemu_get_queue(nic), 0); 12840145c393SAndrew Melnychenko if (nc == NULL || nc->info->set_steering_ebpf == NULL) { 12850145c393SAndrew Melnychenko return false; 12860145c393SAndrew Melnychenko } 12870145c393SAndrew Melnychenko 12880145c393SAndrew Melnychenko return nc->info->set_steering_ebpf(nc, prog_fd); 12890145c393SAndrew Melnychenko } 12900145c393SAndrew Melnychenko 12910145c393SAndrew Melnychenko static void rss_data_to_rss_config(struct VirtioNetRssData *data, 12920145c393SAndrew Melnychenko struct EBPFRSSConfig *config) 12930145c393SAndrew Melnychenko { 12940145c393SAndrew Melnychenko config->redirect = data->redirect; 12950145c393SAndrew Melnychenko config->populate_hash = data->populate_hash; 12960145c393SAndrew Melnychenko config->hash_types = data->hash_types; 12970145c393SAndrew Melnychenko config->indirections_len = data->indirections_len; 12980145c393SAndrew Melnychenko config->default_queue = data->default_queue; 12990145c393SAndrew Melnychenko } 13000145c393SAndrew Melnychenko 13010145c393SAndrew Melnychenko static bool virtio_net_attach_epbf_rss(VirtIONet *n) 13020145c393SAndrew Melnychenko { 13030145c393SAndrew Melnychenko struct EBPFRSSConfig config = {}; 13040145c393SAndrew Melnychenko 13050145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 13060145c393SAndrew Melnychenko return false; 13070145c393SAndrew Melnychenko } 13080145c393SAndrew Melnychenko 13090145c393SAndrew Melnychenko rss_data_to_rss_config(&n->rss_data, &config); 13100145c393SAndrew Melnychenko 13110145c393SAndrew Melnychenko if (!ebpf_rss_set_all(&n->ebpf_rss, &config, 13120145c393SAndrew Melnychenko n->rss_data.indirections_table, n->rss_data.key)) { 13130145c393SAndrew Melnychenko return false; 13140145c393SAndrew Melnychenko } 13150145c393SAndrew Melnychenko 13160145c393SAndrew Melnychenko if (!virtio_net_attach_ebpf_to_backend(n->nic, n->ebpf_rss.program_fd)) { 13170145c393SAndrew Melnychenko return false; 13180145c393SAndrew Melnychenko } 13190145c393SAndrew Melnychenko 13200145c393SAndrew Melnychenko return true; 13210145c393SAndrew Melnychenko } 13220145c393SAndrew Melnychenko 13230145c393SAndrew Melnychenko static void virtio_net_detach_epbf_rss(VirtIONet *n) 13240145c393SAndrew Melnychenko { 13250145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 13260145c393SAndrew Melnychenko } 13270145c393SAndrew Melnychenko 1328283be596SAkihiko Odaki static bool virtio_net_load_ebpf_fds(VirtIONet *n) 13290145c393SAndrew Melnychenko { 13306b230b7dSAndrew Melnychenko int fds[EBPF_RSS_MAX_FDS] = { [0 ... EBPF_RSS_MAX_FDS - 1] = -1}; 13316b230b7dSAndrew Melnychenko int ret = true; 13326b230b7dSAndrew Melnychenko int i = 0; 13336b230b7dSAndrew Melnychenko 13346b230b7dSAndrew Melnychenko if (n->nr_ebpf_rss_fds != EBPF_RSS_MAX_FDS) { 1335283be596SAkihiko Odaki warn_report("Expected %d file descriptors but got %d", 13366b230b7dSAndrew Melnychenko EBPF_RSS_MAX_FDS, n->nr_ebpf_rss_fds); 13370145c393SAndrew Melnychenko return false; 13380145c393SAndrew Melnychenko } 13390145c393SAndrew Melnychenko 13406b230b7dSAndrew Melnychenko for (i = 0; i < n->nr_ebpf_rss_fds; i++) { 1341283be596SAkihiko Odaki fds[i] = monitor_fd_param(monitor_cur(), n->ebpf_rss_fds[i], 1342283be596SAkihiko Odaki &error_warn); 1343283be596SAkihiko Odaki if (fds[i] < 0) { 13446b230b7dSAndrew Melnychenko ret = false; 13456b230b7dSAndrew Melnychenko goto exit; 13466b230b7dSAndrew Melnychenko } 13476b230b7dSAndrew Melnychenko } 13486b230b7dSAndrew Melnychenko 13496b230b7dSAndrew Melnychenko ret = ebpf_rss_load_fds(&n->ebpf_rss, fds[0], fds[1], fds[2], fds[3]); 13506b230b7dSAndrew Melnychenko 13516b230b7dSAndrew Melnychenko exit: 1352283be596SAkihiko Odaki if (!ret) { 13536b230b7dSAndrew Melnychenko for (i = 0; i < n->nr_ebpf_rss_fds && fds[i] != -1; i++) { 13546b230b7dSAndrew Melnychenko close(fds[i]); 13556b230b7dSAndrew Melnychenko } 13566b230b7dSAndrew Melnychenko } 13576b230b7dSAndrew Melnychenko 13586b230b7dSAndrew Melnychenko return ret; 13596b230b7dSAndrew Melnychenko } 13606b230b7dSAndrew Melnychenko 1361283be596SAkihiko Odaki static bool virtio_net_load_ebpf(VirtIONet *n) 13626b230b7dSAndrew Melnychenko { 13636b230b7dSAndrew Melnychenko bool ret = false; 13646b230b7dSAndrew Melnychenko 13656b230b7dSAndrew Melnychenko if (virtio_net_attach_ebpf_to_backend(n->nic, -1)) { 1366283be596SAkihiko Odaki if (!(n->ebpf_rss_fds && virtio_net_load_ebpf_fds(n))) { 13676b230b7dSAndrew Melnychenko ret = ebpf_rss_load(&n->ebpf_rss); 13686b230b7dSAndrew Melnychenko } 13696b230b7dSAndrew Melnychenko } 13706b230b7dSAndrew Melnychenko 13716b230b7dSAndrew Melnychenko return ret; 13720145c393SAndrew Melnychenko } 13730145c393SAndrew Melnychenko 13740145c393SAndrew Melnychenko static void virtio_net_unload_ebpf(VirtIONet *n) 13750145c393SAndrew Melnychenko { 13760145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 13770145c393SAndrew Melnychenko ebpf_rss_unload(&n->ebpf_rss); 137859079029SYuri Benditovich } 137959079029SYuri Benditovich 138059079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n, 1381e22f0603SYuri Benditovich struct iovec *iov, 1382e22f0603SYuri Benditovich unsigned int iov_cnt, 1383e22f0603SYuri Benditovich bool do_rss) 138459079029SYuri Benditovich { 138559079029SYuri Benditovich VirtIODevice *vdev = VIRTIO_DEVICE(n); 138659079029SYuri Benditovich struct virtio_net_rss_config cfg; 138759079029SYuri Benditovich size_t s, offset = 0, size_get; 1388441537f1SJason Wang uint16_t queue_pairs, i; 138959079029SYuri Benditovich struct { 139059079029SYuri Benditovich uint16_t us; 139159079029SYuri Benditovich uint8_t b; 139259079029SYuri Benditovich } QEMU_PACKED temp; 139359079029SYuri Benditovich const char *err_msg = ""; 139459079029SYuri Benditovich uint32_t err_value = 0; 139559079029SYuri Benditovich 1396e22f0603SYuri Benditovich if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) { 139759079029SYuri Benditovich err_msg = "RSS is not negotiated"; 139859079029SYuri Benditovich goto error; 139959079029SYuri Benditovich } 1400e22f0603SYuri Benditovich if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) { 1401e22f0603SYuri Benditovich err_msg = "Hash report is not negotiated"; 1402e22f0603SYuri Benditovich goto error; 1403e22f0603SYuri Benditovich } 140459079029SYuri Benditovich size_get = offsetof(struct virtio_net_rss_config, indirection_table); 140559079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get); 140659079029SYuri Benditovich if (s != size_get) { 140759079029SYuri Benditovich err_msg = "Short command buffer"; 140859079029SYuri Benditovich err_value = (uint32_t)s; 140959079029SYuri Benditovich goto error; 141059079029SYuri Benditovich } 141159079029SYuri Benditovich n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types); 141259079029SYuri Benditovich n->rss_data.indirections_len = 141359079029SYuri Benditovich virtio_lduw_p(vdev, &cfg.indirection_table_mask); 141459079029SYuri Benditovich n->rss_data.indirections_len++; 1415e22f0603SYuri Benditovich if (!do_rss) { 1416e22f0603SYuri Benditovich n->rss_data.indirections_len = 1; 1417e22f0603SYuri Benditovich } 141859079029SYuri Benditovich if (!is_power_of_2(n->rss_data.indirections_len)) { 141959079029SYuri Benditovich err_msg = "Invalid size of indirection table"; 142059079029SYuri Benditovich err_value = n->rss_data.indirections_len; 142159079029SYuri Benditovich goto error; 142259079029SYuri Benditovich } 142359079029SYuri Benditovich if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) { 142459079029SYuri Benditovich err_msg = "Too large indirection table"; 142559079029SYuri Benditovich err_value = n->rss_data.indirections_len; 142659079029SYuri Benditovich goto error; 142759079029SYuri Benditovich } 1428e22f0603SYuri Benditovich n->rss_data.default_queue = do_rss ? 1429e22f0603SYuri Benditovich virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0; 1430441537f1SJason Wang if (n->rss_data.default_queue >= n->max_queue_pairs) { 143159079029SYuri Benditovich err_msg = "Invalid default queue"; 143259079029SYuri Benditovich err_value = n->rss_data.default_queue; 143359079029SYuri Benditovich goto error; 143459079029SYuri Benditovich } 143559079029SYuri Benditovich offset += size_get; 143659079029SYuri Benditovich size_get = sizeof(uint16_t) * n->rss_data.indirections_len; 143759079029SYuri Benditovich g_free(n->rss_data.indirections_table); 143859079029SYuri Benditovich n->rss_data.indirections_table = g_malloc(size_get); 143959079029SYuri Benditovich if (!n->rss_data.indirections_table) { 144059079029SYuri Benditovich err_msg = "Can't allocate indirections table"; 144159079029SYuri Benditovich err_value = n->rss_data.indirections_len; 144259079029SYuri Benditovich goto error; 144359079029SYuri Benditovich } 144459079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, 144559079029SYuri Benditovich n->rss_data.indirections_table, size_get); 144659079029SYuri Benditovich if (s != size_get) { 144759079029SYuri Benditovich err_msg = "Short indirection table buffer"; 144859079029SYuri Benditovich err_value = (uint32_t)s; 144959079029SYuri Benditovich goto error; 145059079029SYuri Benditovich } 145159079029SYuri Benditovich for (i = 0; i < n->rss_data.indirections_len; ++i) { 145259079029SYuri Benditovich uint16_t val = n->rss_data.indirections_table[i]; 145359079029SYuri Benditovich n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val); 145459079029SYuri Benditovich } 145559079029SYuri Benditovich offset += size_get; 145659079029SYuri Benditovich size_get = sizeof(temp); 145759079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get); 145859079029SYuri Benditovich if (s != size_get) { 1459441537f1SJason Wang err_msg = "Can't get queue_pairs"; 146059079029SYuri Benditovich err_value = (uint32_t)s; 146159079029SYuri Benditovich goto error; 146259079029SYuri Benditovich } 1463441537f1SJason Wang queue_pairs = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queue_pairs; 1464441537f1SJason Wang if (queue_pairs == 0 || queue_pairs > n->max_queue_pairs) { 1465441537f1SJason Wang err_msg = "Invalid number of queue_pairs"; 1466441537f1SJason Wang err_value = queue_pairs; 146759079029SYuri Benditovich goto error; 146859079029SYuri Benditovich } 146959079029SYuri Benditovich if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) { 147059079029SYuri Benditovich err_msg = "Invalid key size"; 147159079029SYuri Benditovich err_value = temp.b; 147259079029SYuri Benditovich goto error; 147359079029SYuri Benditovich } 147459079029SYuri Benditovich if (!temp.b && n->rss_data.hash_types) { 147559079029SYuri Benditovich err_msg = "No key provided"; 147659079029SYuri Benditovich err_value = 0; 147759079029SYuri Benditovich goto error; 147859079029SYuri Benditovich } 147959079029SYuri Benditovich if (!temp.b && !n->rss_data.hash_types) { 148059079029SYuri Benditovich virtio_net_disable_rss(n); 1481441537f1SJason Wang return queue_pairs; 148259079029SYuri Benditovich } 148359079029SYuri Benditovich offset += size_get; 148459079029SYuri Benditovich size_get = temp.b; 148559079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get); 148659079029SYuri Benditovich if (s != size_get) { 148759079029SYuri Benditovich err_msg = "Can get key buffer"; 148859079029SYuri Benditovich err_value = (uint32_t)s; 148959079029SYuri Benditovich goto error; 149059079029SYuri Benditovich } 149159079029SYuri Benditovich n->rss_data.enabled = true; 14920145c393SAndrew Melnychenko 14930145c393SAndrew Melnychenko if (!n->rss_data.populate_hash) { 14940145c393SAndrew Melnychenko if (!virtio_net_attach_epbf_rss(n)) { 14950145c393SAndrew Melnychenko /* EBPF must be loaded for vhost */ 14960145c393SAndrew Melnychenko if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 14970145c393SAndrew Melnychenko warn_report("Can't load eBPF RSS for vhost"); 14980145c393SAndrew Melnychenko goto error; 14990145c393SAndrew Melnychenko } 15000145c393SAndrew Melnychenko /* fallback to software RSS */ 15010145c393SAndrew Melnychenko warn_report("Can't load eBPF RSS - fallback to software RSS"); 15020145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 15030145c393SAndrew Melnychenko } 15040145c393SAndrew Melnychenko } else { 15050145c393SAndrew Melnychenko /* use software RSS for hash populating */ 15060145c393SAndrew Melnychenko /* and detach eBPF if was loaded before */ 15070145c393SAndrew Melnychenko virtio_net_detach_epbf_rss(n); 15080145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 15090145c393SAndrew Melnychenko } 15100145c393SAndrew Melnychenko 151159079029SYuri Benditovich trace_virtio_net_rss_enable(n->rss_data.hash_types, 151259079029SYuri Benditovich n->rss_data.indirections_len, 151359079029SYuri Benditovich temp.b); 1514441537f1SJason Wang return queue_pairs; 151559079029SYuri Benditovich error: 151659079029SYuri Benditovich trace_virtio_net_rss_error(err_msg, err_value); 151759079029SYuri Benditovich virtio_net_disable_rss(n); 151859079029SYuri Benditovich return 0; 151959079029SYuri Benditovich } 152059079029SYuri Benditovich 15216e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd, 15226e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 15236e790746SPaolo Bonzini { 152417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1525441537f1SJason Wang uint16_t queue_pairs; 15262a7888ccSSi-Wei Liu NetClientState *nc = qemu_get_queue(n->nic); 15276e790746SPaolo Bonzini 152859079029SYuri Benditovich virtio_net_disable_rss(n); 1529e22f0603SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) { 1530441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, false); 1531441537f1SJason Wang return queue_pairs ? VIRTIO_NET_OK : VIRTIO_NET_ERR; 1532e22f0603SYuri Benditovich } 153359079029SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) { 1534441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, true); 153559079029SYuri Benditovich } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) { 153659079029SYuri Benditovich struct virtio_net_ctrl_mq mq; 153759079029SYuri Benditovich size_t s; 153859079029SYuri Benditovich if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) { 153959079029SYuri Benditovich return VIRTIO_NET_ERR; 154059079029SYuri Benditovich } 15416e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq)); 15426e790746SPaolo Bonzini if (s != sizeof(mq)) { 15436e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15446e790746SPaolo Bonzini } 1545441537f1SJason Wang queue_pairs = virtio_lduw_p(vdev, &mq.virtqueue_pairs); 15466e790746SPaolo Bonzini 154759079029SYuri Benditovich } else { 15486e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15496e790746SPaolo Bonzini } 15506e790746SPaolo Bonzini 1551441537f1SJason Wang if (queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN || 1552441537f1SJason Wang queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX || 1553441537f1SJason Wang queue_pairs > n->max_queue_pairs || 15546e790746SPaolo Bonzini !n->multiqueue) { 15556e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15566e790746SPaolo Bonzini } 15576e790746SPaolo Bonzini 1558441537f1SJason Wang n->curr_queue_pairs = queue_pairs; 1559ca8717f9SEugenio Pérez if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 1560ca8717f9SEugenio Pérez /* 1561ca8717f9SEugenio Pérez * Avoid updating the backend for a vdpa device: We're only interested 1562ca8717f9SEugenio Pérez * in updating the device model queues. 1563ca8717f9SEugenio Pérez */ 1564ca8717f9SEugenio Pérez return VIRTIO_NET_OK; 1565ca8717f9SEugenio Pérez } 1566441537f1SJason Wang /* stop the backend before changing the number of queue_pairs to avoid handling a 15676e790746SPaolo Bonzini * disabled queue */ 156817a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 1569441537f1SJason Wang virtio_net_set_queue_pairs(n); 15706e790746SPaolo Bonzini 15716e790746SPaolo Bonzini return VIRTIO_NET_OK; 15726e790746SPaolo Bonzini } 1573ba7eadb5SGreg Kurz 1574640b8a1cSEugenio Pérez size_t virtio_net_handle_ctrl_iov(VirtIODevice *vdev, 1575640b8a1cSEugenio Pérez const struct iovec *in_sg, unsigned in_num, 1576640b8a1cSEugenio Pérez const struct iovec *out_sg, 1577640b8a1cSEugenio Pérez unsigned out_num) 15786e790746SPaolo Bonzini { 157917a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 15806e790746SPaolo Bonzini struct virtio_net_ctrl_hdr ctrl; 15816e790746SPaolo Bonzini virtio_net_ctrl_ack status = VIRTIO_NET_ERR; 15826e790746SPaolo Bonzini size_t s; 1583771b6ed3SJason Wang struct iovec *iov, *iov2; 1584640b8a1cSEugenio Pérez 1585640b8a1cSEugenio Pérez if (iov_size(in_sg, in_num) < sizeof(status) || 1586640b8a1cSEugenio Pérez iov_size(out_sg, out_num) < sizeof(ctrl)) { 1587640b8a1cSEugenio Pérez virtio_error(vdev, "virtio-net ctrl missing headers"); 1588640b8a1cSEugenio Pérez return 0; 1589640b8a1cSEugenio Pérez } 1590640b8a1cSEugenio Pérez 1591640b8a1cSEugenio Pérez iov2 = iov = g_memdup2(out_sg, sizeof(struct iovec) * out_num); 1592640b8a1cSEugenio Pérez s = iov_to_buf(iov, out_num, 0, &ctrl, sizeof(ctrl)); 1593640b8a1cSEugenio Pérez iov_discard_front(&iov, &out_num, sizeof(ctrl)); 1594640b8a1cSEugenio Pérez if (s != sizeof(ctrl)) { 1595640b8a1cSEugenio Pérez status = VIRTIO_NET_ERR; 1596640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_RX) { 1597640b8a1cSEugenio Pérez status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, out_num); 1598640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) { 1599640b8a1cSEugenio Pérez status = virtio_net_handle_mac(n, ctrl.cmd, iov, out_num); 1600640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) { 1601640b8a1cSEugenio Pérez status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, out_num); 1602640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) { 1603640b8a1cSEugenio Pérez status = virtio_net_handle_announce(n, ctrl.cmd, iov, out_num); 1604640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) { 1605640b8a1cSEugenio Pérez status = virtio_net_handle_mq(n, ctrl.cmd, iov, out_num); 1606640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) { 1607640b8a1cSEugenio Pérez status = virtio_net_handle_offloads(n, ctrl.cmd, iov, out_num); 1608640b8a1cSEugenio Pérez } 1609640b8a1cSEugenio Pérez 1610640b8a1cSEugenio Pérez s = iov_from_buf(in_sg, in_num, 0, &status, sizeof(status)); 1611640b8a1cSEugenio Pérez assert(s == sizeof(status)); 1612640b8a1cSEugenio Pérez 1613640b8a1cSEugenio Pérez g_free(iov2); 1614640b8a1cSEugenio Pérez return sizeof(status); 1615640b8a1cSEugenio Pérez } 1616640b8a1cSEugenio Pérez 1617640b8a1cSEugenio Pérez static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq) 1618640b8a1cSEugenio Pérez { 1619640b8a1cSEugenio Pérez VirtQueueElement *elem; 16206e790746SPaolo Bonzini 162151b19ebeSPaolo Bonzini for (;;) { 1622640b8a1cSEugenio Pérez size_t written; 162351b19ebeSPaolo Bonzini elem = virtqueue_pop(vq, sizeof(VirtQueueElement)); 162451b19ebeSPaolo Bonzini if (!elem) { 162551b19ebeSPaolo Bonzini break; 162651b19ebeSPaolo Bonzini } 1627640b8a1cSEugenio Pérez 1628640b8a1cSEugenio Pérez written = virtio_net_handle_ctrl_iov(vdev, elem->in_sg, elem->in_num, 1629640b8a1cSEugenio Pérez elem->out_sg, elem->out_num); 1630640b8a1cSEugenio Pérez if (written > 0) { 1631640b8a1cSEugenio Pérez virtqueue_push(vq, elem, written); 1632640b8a1cSEugenio Pérez virtio_notify(vdev, vq); 1633640b8a1cSEugenio Pérez g_free(elem); 1634640b8a1cSEugenio Pérez } else { 1635ba7eadb5SGreg Kurz virtqueue_detach_element(vq, elem, 0); 1636ba7eadb5SGreg Kurz g_free(elem); 1637ba7eadb5SGreg Kurz break; 16386e790746SPaolo Bonzini } 16396e790746SPaolo Bonzini } 16406e790746SPaolo Bonzini } 16416e790746SPaolo Bonzini 16426e790746SPaolo Bonzini /* RX */ 16436e790746SPaolo Bonzini 16446e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq) 16456e790746SPaolo Bonzini { 164617a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 16476e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(vq)); 16486e790746SPaolo Bonzini 16496e790746SPaolo Bonzini qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index)); 16506e790746SPaolo Bonzini } 16516e790746SPaolo Bonzini 1652b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc) 16536e790746SPaolo Bonzini { 16546e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 165517a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 16566e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 16576e790746SPaolo Bonzini 165817a0ca55SKONRAD Frederic if (!vdev->vm_running) { 1659b8c4b67eSPhilippe Mathieu-Daudé return false; 16606e790746SPaolo Bonzini } 16616e790746SPaolo Bonzini 1662441537f1SJason Wang if (nc->queue_index >= n->curr_queue_pairs) { 1663b8c4b67eSPhilippe Mathieu-Daudé return false; 16646e790746SPaolo Bonzini } 16656e790746SPaolo Bonzini 16666e790746SPaolo Bonzini if (!virtio_queue_ready(q->rx_vq) || 166717a0ca55SKONRAD Frederic !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 1668b8c4b67eSPhilippe Mathieu-Daudé return false; 16696e790746SPaolo Bonzini } 16706e790746SPaolo Bonzini 1671b8c4b67eSPhilippe Mathieu-Daudé return true; 16726e790746SPaolo Bonzini } 16736e790746SPaolo Bonzini 16746e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize) 16756e790746SPaolo Bonzini { 16766e790746SPaolo Bonzini VirtIONet *n = q->n; 16776e790746SPaolo Bonzini if (virtio_queue_empty(q->rx_vq) || 16786e790746SPaolo Bonzini (n->mergeable_rx_bufs && 16796e790746SPaolo Bonzini !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) { 16806e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 1); 16816e790746SPaolo Bonzini 16826e790746SPaolo Bonzini /* To avoid a race condition where the guest has made some buffers 16836e790746SPaolo Bonzini * available after the above check but before notification was 16846e790746SPaolo Bonzini * enabled, check for available buffers again. 16856e790746SPaolo Bonzini */ 16866e790746SPaolo Bonzini if (virtio_queue_empty(q->rx_vq) || 16876e790746SPaolo Bonzini (n->mergeable_rx_bufs && 16886e790746SPaolo Bonzini !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) { 16896e790746SPaolo Bonzini return 0; 16906e790746SPaolo Bonzini } 16916e790746SPaolo Bonzini } 16926e790746SPaolo Bonzini 16936e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 0); 16946e790746SPaolo Bonzini return 1; 16956e790746SPaolo Bonzini } 16966e790746SPaolo Bonzini 16971399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr) 1698032a74a1SCédric Le Goater { 16991399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->hdr_len); 17001399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->gso_size); 17011399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_start); 17021399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_offset); 1703032a74a1SCédric Le Goater } 1704032a74a1SCédric Le Goater 17056e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so 17066e790746SPaolo Bonzini * it never finds out that the packets don't have valid checksums. This 17076e790746SPaolo Bonzini * causes dhclient to get upset. Fedora's carried a patch for ages to 17086e790746SPaolo Bonzini * fix this with Xen but it hasn't appeared in an upstream release of 17096e790746SPaolo Bonzini * dhclient yet. 17106e790746SPaolo Bonzini * 17116e790746SPaolo Bonzini * To avoid breaking existing guests, we catch udp packets and add 17126e790746SPaolo Bonzini * checksums. This is terrible but it's better than hacking the guest 17136e790746SPaolo Bonzini * kernels. 17146e790746SPaolo Bonzini * 17156e790746SPaolo Bonzini * N.B. if we introduce a zero-copy API, this operation is no longer free so 17166e790746SPaolo Bonzini * we should provide a mechanism to disable it to avoid polluting the host 17176e790746SPaolo Bonzini * cache. 17186e790746SPaolo Bonzini */ 17196e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr, 17206e790746SPaolo Bonzini uint8_t *buf, size_t size) 17216e790746SPaolo Bonzini { 17226e790746SPaolo Bonzini if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */ 17236e790746SPaolo Bonzini (size > 27 && size < 1500) && /* normal sized MTU */ 17246e790746SPaolo Bonzini (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */ 17256e790746SPaolo Bonzini (buf[23] == 17) && /* ip.protocol == UDP */ 17266e790746SPaolo Bonzini (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */ 1727f5746335SBin Meng net_checksum_calculate(buf, size, CSUM_UDP); 17286e790746SPaolo Bonzini hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM; 17296e790746SPaolo Bonzini } 17306e790746SPaolo Bonzini } 17316e790746SPaolo Bonzini 17326e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt, 17336e790746SPaolo Bonzini const void *buf, size_t size) 17346e790746SPaolo Bonzini { 17356e790746SPaolo Bonzini if (n->has_vnet_hdr) { 17366e790746SPaolo Bonzini /* FIXME this cast is evil */ 17376e790746SPaolo Bonzini void *wbuf = (void *)buf; 17386e790746SPaolo Bonzini work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len, 17396e790746SPaolo Bonzini size - n->host_hdr_len); 17401bfa316cSGreg Kurz 17411bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 17421399c60dSRusty Russell virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf); 17431bfa316cSGreg Kurz } 17446e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr)); 17456e790746SPaolo Bonzini } else { 17466e790746SPaolo Bonzini struct virtio_net_hdr hdr = { 17476e790746SPaolo Bonzini .flags = 0, 17486e790746SPaolo Bonzini .gso_type = VIRTIO_NET_HDR_GSO_NONE 17496e790746SPaolo Bonzini }; 17506e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr); 17516e790746SPaolo Bonzini } 17526e790746SPaolo Bonzini } 17536e790746SPaolo Bonzini 17546e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size) 17556e790746SPaolo Bonzini { 17566e790746SPaolo Bonzini static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff}; 17576e790746SPaolo Bonzini static const uint8_t vlan[] = {0x81, 0x00}; 17586e790746SPaolo Bonzini uint8_t *ptr = (uint8_t *)buf; 17596e790746SPaolo Bonzini int i; 17606e790746SPaolo Bonzini 17616e790746SPaolo Bonzini if (n->promisc) 17626e790746SPaolo Bonzini return 1; 17636e790746SPaolo Bonzini 17646e790746SPaolo Bonzini ptr += n->host_hdr_len; 17656e790746SPaolo Bonzini 17666e790746SPaolo Bonzini if (!memcmp(&ptr[12], vlan, sizeof(vlan))) { 17677542d3e7SPeter Maydell int vid = lduw_be_p(ptr + 14) & 0xfff; 17686e790746SPaolo Bonzini if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f)))) 17696e790746SPaolo Bonzini return 0; 17706e790746SPaolo Bonzini } 17716e790746SPaolo Bonzini 17726e790746SPaolo Bonzini if (ptr[0] & 1) { // multicast 17736e790746SPaolo Bonzini if (!memcmp(ptr, bcast, sizeof(bcast))) { 17746e790746SPaolo Bonzini return !n->nobcast; 17756e790746SPaolo Bonzini } else if (n->nomulti) { 17766e790746SPaolo Bonzini return 0; 17776e790746SPaolo Bonzini } else if (n->allmulti || n->mac_table.multi_overflow) { 17786e790746SPaolo Bonzini return 1; 17796e790746SPaolo Bonzini } 17806e790746SPaolo Bonzini 17816e790746SPaolo Bonzini for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 17826e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 17836e790746SPaolo Bonzini return 1; 17846e790746SPaolo Bonzini } 17856e790746SPaolo Bonzini } 17866e790746SPaolo Bonzini } else { // unicast 17876e790746SPaolo Bonzini if (n->nouni) { 17886e790746SPaolo Bonzini return 0; 17896e790746SPaolo Bonzini } else if (n->alluni || n->mac_table.uni_overflow) { 17906e790746SPaolo Bonzini return 1; 17916e790746SPaolo Bonzini } else if (!memcmp(ptr, n->mac, ETH_ALEN)) { 17926e790746SPaolo Bonzini return 1; 17936e790746SPaolo Bonzini } 17946e790746SPaolo Bonzini 17956e790746SPaolo Bonzini for (i = 0; i < n->mac_table.first_multi; i++) { 17966e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 17976e790746SPaolo Bonzini return 1; 17986e790746SPaolo Bonzini } 17996e790746SPaolo Bonzini } 18006e790746SPaolo Bonzini } 18016e790746SPaolo Bonzini 18026e790746SPaolo Bonzini return 0; 18036e790746SPaolo Bonzini } 18046e790746SPaolo Bonzini 180569ff5ef8SAkihiko Odaki static uint8_t virtio_net_get_hash_type(bool hasip4, 180669ff5ef8SAkihiko Odaki bool hasip6, 180765f474bbSAkihiko Odaki EthL4HdrProto l4hdr_proto, 18084474e37aSYuri Benditovich uint32_t types) 18094474e37aSYuri Benditovich { 181069ff5ef8SAkihiko Odaki if (hasip4) { 181165f474bbSAkihiko Odaki switch (l4hdr_proto) { 181265f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_TCP: 181365f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4) { 18144474e37aSYuri Benditovich return NetPktRssIpV4Tcp; 18154474e37aSYuri Benditovich } 181665f474bbSAkihiko Odaki break; 181765f474bbSAkihiko Odaki 181865f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_UDP: 181965f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4) { 18204474e37aSYuri Benditovich return NetPktRssIpV4Udp; 18214474e37aSYuri Benditovich } 182265f474bbSAkihiko Odaki break; 182365f474bbSAkihiko Odaki 182465f474bbSAkihiko Odaki default: 182565f474bbSAkihiko Odaki break; 182665f474bbSAkihiko Odaki } 182765f474bbSAkihiko Odaki 18284474e37aSYuri Benditovich if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) { 18294474e37aSYuri Benditovich return NetPktRssIpV4; 18304474e37aSYuri Benditovich } 183169ff5ef8SAkihiko Odaki } else if (hasip6) { 183265f474bbSAkihiko Odaki switch (l4hdr_proto) { 183365f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_TCP: 183465f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) { 183565f474bbSAkihiko Odaki return NetPktRssIpV6TcpEx; 183665f474bbSAkihiko Odaki } 183765f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv6) { 183865f474bbSAkihiko Odaki return NetPktRssIpV6Tcp; 183965f474bbSAkihiko Odaki } 184065f474bbSAkihiko Odaki break; 18414474e37aSYuri Benditovich 184265f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_UDP: 184365f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) { 184465f474bbSAkihiko Odaki return NetPktRssIpV6UdpEx; 18454474e37aSYuri Benditovich } 184665f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv6) { 184765f474bbSAkihiko Odaki return NetPktRssIpV6Udp; 18484474e37aSYuri Benditovich } 184965f474bbSAkihiko Odaki break; 185065f474bbSAkihiko Odaki 185165f474bbSAkihiko Odaki default: 185265f474bbSAkihiko Odaki break; 185365f474bbSAkihiko Odaki } 185465f474bbSAkihiko Odaki 185565f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) { 185665f474bbSAkihiko Odaki return NetPktRssIpV6Ex; 185765f474bbSAkihiko Odaki } 185865f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv6) { 185965f474bbSAkihiko Odaki return NetPktRssIpV6; 18604474e37aSYuri Benditovich } 18614474e37aSYuri Benditovich } 18624474e37aSYuri Benditovich return 0xff; 18634474e37aSYuri Benditovich } 18644474e37aSYuri Benditovich 1865e22f0603SYuri Benditovich static void virtio_set_packet_hash(const uint8_t *buf, uint8_t report, 1866e22f0603SYuri Benditovich uint32_t hash) 1867e22f0603SYuri Benditovich { 1868e22f0603SYuri Benditovich struct virtio_net_hdr_v1_hash *hdr = (void *)buf; 1869e22f0603SYuri Benditovich hdr->hash_value = hash; 1870e22f0603SYuri Benditovich hdr->hash_report = report; 1871e22f0603SYuri Benditovich } 1872e22f0603SYuri Benditovich 18734474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf, 187497cd965cSPaolo Bonzini size_t size) 18756e790746SPaolo Bonzini { 18766e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1877e22f0603SYuri Benditovich unsigned int index = nc->queue_index, new_index = index; 18784474e37aSYuri Benditovich struct NetRxPkt *pkt = n->rx_pkt; 18794474e37aSYuri Benditovich uint8_t net_hash_type; 18804474e37aSYuri Benditovich uint32_t hash; 188165f474bbSAkihiko Odaki bool hasip4, hasip6; 188265f474bbSAkihiko Odaki EthL4HdrProto l4hdr_proto; 1883e22f0603SYuri Benditovich static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = { 1884e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv4, 1885e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv4, 1886e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6, 1887e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6, 1888e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6_EX, 1889e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6_EX, 1890e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv4, 1891e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6, 1892e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6_EX 1893e22f0603SYuri Benditovich }; 18942f0fa232SAkihiko Odaki struct iovec iov = { 18952f0fa232SAkihiko Odaki .iov_base = (void *)buf, 18962f0fa232SAkihiko Odaki .iov_len = size 18972f0fa232SAkihiko Odaki }; 18984474e37aSYuri Benditovich 18992f0fa232SAkihiko Odaki net_rx_pkt_set_protocols(pkt, &iov, 1, n->host_hdr_len); 190065f474bbSAkihiko Odaki net_rx_pkt_get_protocols(pkt, &hasip4, &hasip6, &l4hdr_proto); 190165f474bbSAkihiko Odaki net_hash_type = virtio_net_get_hash_type(hasip4, hasip6, l4hdr_proto, 19024474e37aSYuri Benditovich n->rss_data.hash_types); 19034474e37aSYuri Benditovich if (net_hash_type > NetPktRssIpV6UdpEx) { 1904e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1905e22f0603SYuri Benditovich virtio_set_packet_hash(buf, VIRTIO_NET_HASH_REPORT_NONE, 0); 1906e22f0603SYuri Benditovich } 1907e22f0603SYuri Benditovich return n->rss_data.redirect ? n->rss_data.default_queue : -1; 19084474e37aSYuri Benditovich } 19094474e37aSYuri Benditovich 19104474e37aSYuri Benditovich hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key); 1911e22f0603SYuri Benditovich 1912e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1913e22f0603SYuri Benditovich virtio_set_packet_hash(buf, reports[net_hash_type], hash); 1914e22f0603SYuri Benditovich } 1915e22f0603SYuri Benditovich 1916e22f0603SYuri Benditovich if (n->rss_data.redirect) { 19174474e37aSYuri Benditovich new_index = hash & (n->rss_data.indirections_len - 1); 19184474e37aSYuri Benditovich new_index = n->rss_data.indirections_table[new_index]; 19194474e37aSYuri Benditovich } 1920e22f0603SYuri Benditovich 1921e22f0603SYuri Benditovich return (index == new_index) ? -1 : new_index; 19224474e37aSYuri Benditovich } 19234474e37aSYuri Benditovich 19244474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf, 19254474e37aSYuri Benditovich size_t size, bool no_rss) 19264474e37aSYuri Benditovich { 19274474e37aSYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 19286e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 192917a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1930bedd7e93SJason Wang VirtQueueElement *elems[VIRTQUEUE_MAX_SIZE]; 1931bedd7e93SJason Wang size_t lens[VIRTQUEUE_MAX_SIZE]; 19326e790746SPaolo Bonzini struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE]; 19336e790746SPaolo Bonzini struct virtio_net_hdr_mrg_rxbuf mhdr; 19346e790746SPaolo Bonzini unsigned mhdr_cnt = 0; 1935bedd7e93SJason Wang size_t offset, i, guest_offset, j; 1936bedd7e93SJason Wang ssize_t err; 19376e790746SPaolo Bonzini 19386e790746SPaolo Bonzini if (!virtio_net_can_receive(nc)) { 19396e790746SPaolo Bonzini return -1; 19406e790746SPaolo Bonzini } 19416e790746SPaolo Bonzini 19420145c393SAndrew Melnychenko if (!no_rss && n->rss_data.enabled && n->rss_data.enabled_software_rss) { 19434474e37aSYuri Benditovich int index = virtio_net_process_rss(nc, buf, size); 19444474e37aSYuri Benditovich if (index >= 0) { 19454474e37aSYuri Benditovich NetClientState *nc2 = qemu_get_subqueue(n->nic, index); 19464474e37aSYuri Benditovich return virtio_net_receive_rcu(nc2, buf, size, true); 19474474e37aSYuri Benditovich } 19484474e37aSYuri Benditovich } 19494474e37aSYuri Benditovich 19506e790746SPaolo Bonzini /* hdr_len refers to the header we supply to the guest */ 19516e790746SPaolo Bonzini if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) { 19526e790746SPaolo Bonzini return 0; 19536e790746SPaolo Bonzini } 19546e790746SPaolo Bonzini 19556e790746SPaolo Bonzini if (!receive_filter(n, buf, size)) 19566e790746SPaolo Bonzini return size; 19576e790746SPaolo Bonzini 19586e790746SPaolo Bonzini offset = i = 0; 19596e790746SPaolo Bonzini 19606e790746SPaolo Bonzini while (offset < size) { 196151b19ebeSPaolo Bonzini VirtQueueElement *elem; 19626e790746SPaolo Bonzini int len, total; 196351b19ebeSPaolo Bonzini const struct iovec *sg; 19646e790746SPaolo Bonzini 19656e790746SPaolo Bonzini total = 0; 19666e790746SPaolo Bonzini 1967bedd7e93SJason Wang if (i == VIRTQUEUE_MAX_SIZE) { 1968bedd7e93SJason Wang virtio_error(vdev, "virtio-net unexpected long buffer chain"); 1969bedd7e93SJason Wang err = size; 1970bedd7e93SJason Wang goto err; 1971bedd7e93SJason Wang } 1972bedd7e93SJason Wang 197351b19ebeSPaolo Bonzini elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement)); 197451b19ebeSPaolo Bonzini if (!elem) { 1975ba10b9c0SGreg Kurz if (i) { 1976ba10b9c0SGreg Kurz virtio_error(vdev, "virtio-net unexpected empty queue: " 19776e790746SPaolo Bonzini "i %zd mergeable %d offset %zd, size %zd, " 1978019a3edbSGerd Hoffmann "guest hdr len %zd, host hdr len %zd " 1979019a3edbSGerd Hoffmann "guest features 0x%" PRIx64, 19806e790746SPaolo Bonzini i, n->mergeable_rx_bufs, offset, size, 1981019a3edbSGerd Hoffmann n->guest_hdr_len, n->host_hdr_len, 1982019a3edbSGerd Hoffmann vdev->guest_features); 1983ba10b9c0SGreg Kurz } 1984bedd7e93SJason Wang err = -1; 1985bedd7e93SJason Wang goto err; 19866e790746SPaolo Bonzini } 19876e790746SPaolo Bonzini 198851b19ebeSPaolo Bonzini if (elem->in_num < 1) { 1989ba10b9c0SGreg Kurz virtio_error(vdev, 1990ba10b9c0SGreg Kurz "virtio-net receive queue contains no in buffers"); 1991ba10b9c0SGreg Kurz virtqueue_detach_element(q->rx_vq, elem, 0); 1992ba10b9c0SGreg Kurz g_free(elem); 1993bedd7e93SJason Wang err = -1; 1994bedd7e93SJason Wang goto err; 19956e790746SPaolo Bonzini } 19966e790746SPaolo Bonzini 199751b19ebeSPaolo Bonzini sg = elem->in_sg; 19986e790746SPaolo Bonzini if (i == 0) { 19996e790746SPaolo Bonzini assert(offset == 0); 20006e790746SPaolo Bonzini if (n->mergeable_rx_bufs) { 20016e790746SPaolo Bonzini mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg), 200251b19ebeSPaolo Bonzini sg, elem->in_num, 20036e790746SPaolo Bonzini offsetof(typeof(mhdr), num_buffers), 20046e790746SPaolo Bonzini sizeof(mhdr.num_buffers)); 20056e790746SPaolo Bonzini } 20066e790746SPaolo Bonzini 200751b19ebeSPaolo Bonzini receive_header(n, sg, elem->in_num, buf, size); 2008e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 2009e22f0603SYuri Benditovich offset = sizeof(mhdr); 2010e22f0603SYuri Benditovich iov_from_buf(sg, elem->in_num, offset, 2011e22f0603SYuri Benditovich buf + offset, n->host_hdr_len - sizeof(mhdr)); 2012e22f0603SYuri Benditovich } 20136e790746SPaolo Bonzini offset = n->host_hdr_len; 20146e790746SPaolo Bonzini total += n->guest_hdr_len; 20156e790746SPaolo Bonzini guest_offset = n->guest_hdr_len; 20166e790746SPaolo Bonzini } else { 20176e790746SPaolo Bonzini guest_offset = 0; 20186e790746SPaolo Bonzini } 20196e790746SPaolo Bonzini 20206e790746SPaolo Bonzini /* copy in packet. ugh */ 202151b19ebeSPaolo Bonzini len = iov_from_buf(sg, elem->in_num, guest_offset, 20226e790746SPaolo Bonzini buf + offset, size - offset); 20236e790746SPaolo Bonzini total += len; 20246e790746SPaolo Bonzini offset += len; 20256e790746SPaolo Bonzini /* If buffers can't be merged, at this point we 20266e790746SPaolo Bonzini * must have consumed the complete packet. 20276e790746SPaolo Bonzini * Otherwise, drop it. */ 20286e790746SPaolo Bonzini if (!n->mergeable_rx_bufs && offset < size) { 202927e57efeSLadi Prosek virtqueue_unpop(q->rx_vq, elem, total); 203051b19ebeSPaolo Bonzini g_free(elem); 2031bedd7e93SJason Wang err = size; 2032bedd7e93SJason Wang goto err; 20336e790746SPaolo Bonzini } 20346e790746SPaolo Bonzini 2035bedd7e93SJason Wang elems[i] = elem; 2036bedd7e93SJason Wang lens[i] = total; 2037bedd7e93SJason Wang i++; 20386e790746SPaolo Bonzini } 20396e790746SPaolo Bonzini 20406e790746SPaolo Bonzini if (mhdr_cnt) { 20411399c60dSRusty Russell virtio_stw_p(vdev, &mhdr.num_buffers, i); 20426e790746SPaolo Bonzini iov_from_buf(mhdr_sg, mhdr_cnt, 20436e790746SPaolo Bonzini 0, 20446e790746SPaolo Bonzini &mhdr.num_buffers, sizeof mhdr.num_buffers); 20456e790746SPaolo Bonzini } 20466e790746SPaolo Bonzini 2047bedd7e93SJason Wang for (j = 0; j < i; j++) { 2048bedd7e93SJason Wang /* signal other side */ 2049bedd7e93SJason Wang virtqueue_fill(q->rx_vq, elems[j], lens[j], j); 2050bedd7e93SJason Wang g_free(elems[j]); 2051bedd7e93SJason Wang } 2052bedd7e93SJason Wang 20536e790746SPaolo Bonzini virtqueue_flush(q->rx_vq, i); 205417a0ca55SKONRAD Frederic virtio_notify(vdev, q->rx_vq); 20556e790746SPaolo Bonzini 20566e790746SPaolo Bonzini return size; 2057bedd7e93SJason Wang 2058bedd7e93SJason Wang err: 2059bedd7e93SJason Wang for (j = 0; j < i; j++) { 2060abe300d9SJason Wang virtqueue_detach_element(q->rx_vq, elems[j], lens[j]); 2061bedd7e93SJason Wang g_free(elems[j]); 2062bedd7e93SJason Wang } 2063bedd7e93SJason Wang 2064bedd7e93SJason Wang return err; 20656e790746SPaolo Bonzini } 20666e790746SPaolo Bonzini 20672974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf, 206897cd965cSPaolo Bonzini size_t size) 206997cd965cSPaolo Bonzini { 2070068ddfa9SDr. David Alan Gilbert RCU_READ_LOCK_GUARD(); 207197cd965cSPaolo Bonzini 20724474e37aSYuri Benditovich return virtio_net_receive_rcu(nc, buf, size, false); 207397cd965cSPaolo Bonzini } 207497cd965cSPaolo Bonzini 20752974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain, 20762974e916SYuri Benditovich const uint8_t *buf, 20772974e916SYuri Benditovich VirtioNetRscUnit *unit) 20782974e916SYuri Benditovich { 20792974e916SYuri Benditovich uint16_t ip_hdrlen; 20802974e916SYuri Benditovich struct ip_header *ip; 20812974e916SYuri Benditovich 20822974e916SYuri Benditovich ip = (struct ip_header *)(buf + chain->n->guest_hdr_len 20832974e916SYuri Benditovich + sizeof(struct eth_header)); 20842974e916SYuri Benditovich unit->ip = (void *)ip; 20852974e916SYuri Benditovich ip_hdrlen = (ip->ip_ver_len & 0xF) << 2; 20862974e916SYuri Benditovich unit->ip_plen = &ip->ip_len; 20872974e916SYuri Benditovich unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen); 20882974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 20892974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen; 20902974e916SYuri Benditovich } 20912974e916SYuri Benditovich 20922974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain, 20932974e916SYuri Benditovich const uint8_t *buf, 20942974e916SYuri Benditovich VirtioNetRscUnit *unit) 20952974e916SYuri Benditovich { 20962974e916SYuri Benditovich struct ip6_header *ip6; 20972974e916SYuri Benditovich 20982974e916SYuri Benditovich ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len 20992974e916SYuri Benditovich + sizeof(struct eth_header)); 21002974e916SYuri Benditovich unit->ip = ip6; 21012974e916SYuri Benditovich unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 210278ee6bd0SPhilippe Mathieu-Daudé unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) 21032974e916SYuri Benditovich + sizeof(struct ip6_header)); 21042974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 21052974e916SYuri Benditovich 21062431f4f1SMichael Tokarev /* There is a difference between payload length in ipv4 and v6, 21072974e916SYuri Benditovich ip header is excluded in ipv6 */ 21082974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen; 21092974e916SYuri Benditovich } 21102974e916SYuri Benditovich 21112974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain, 21122974e916SYuri Benditovich VirtioNetRscSeg *seg) 21132974e916SYuri Benditovich { 21142974e916SYuri Benditovich int ret; 2115dd3d85e8SYuri Benditovich struct virtio_net_hdr_v1 *h; 21162974e916SYuri Benditovich 2117dd3d85e8SYuri Benditovich h = (struct virtio_net_hdr_v1 *)seg->buf; 21182974e916SYuri Benditovich h->flags = 0; 21192974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_NONE; 21202974e916SYuri Benditovich 21212974e916SYuri Benditovich if (seg->is_coalesced) { 2122dd3d85e8SYuri Benditovich h->rsc.segments = seg->packets; 2123dd3d85e8SYuri Benditovich h->rsc.dup_acks = seg->dup_ack; 21242974e916SYuri Benditovich h->flags = VIRTIO_NET_HDR_F_RSC_INFO; 21252974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 21262974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 21272974e916SYuri Benditovich } else { 21282974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 21292974e916SYuri Benditovich } 21302974e916SYuri Benditovich } 21312974e916SYuri Benditovich 21322974e916SYuri Benditovich ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size); 21332974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 21342974e916SYuri Benditovich g_free(seg->buf); 21352974e916SYuri Benditovich g_free(seg); 21362974e916SYuri Benditovich 21372974e916SYuri Benditovich return ret; 21382974e916SYuri Benditovich } 21392974e916SYuri Benditovich 21402974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq) 21412974e916SYuri Benditovich { 21422974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn; 21432974e916SYuri Benditovich VirtioNetRscChain *chain = (VirtioNetRscChain *)opq; 21442974e916SYuri Benditovich 21452974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) { 21462974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 21472974e916SYuri Benditovich chain->stat.purge_failed++; 21482974e916SYuri Benditovich continue; 21492974e916SYuri Benditovich } 21502974e916SYuri Benditovich } 21512974e916SYuri Benditovich 21522974e916SYuri Benditovich chain->stat.timer++; 21532974e916SYuri Benditovich if (!QTAILQ_EMPTY(&chain->buffers)) { 21542974e916SYuri Benditovich timer_mod(chain->drain_timer, 21552974e916SYuri Benditovich qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout); 21562974e916SYuri Benditovich } 21572974e916SYuri Benditovich } 21582974e916SYuri Benditovich 21592974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n) 21602974e916SYuri Benditovich { 21612974e916SYuri Benditovich VirtioNetRscChain *chain, *rn_chain; 21622974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn_seg; 21632974e916SYuri Benditovich 21642974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) { 21652974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) { 21662974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 21672974e916SYuri Benditovich g_free(seg->buf); 21682974e916SYuri Benditovich g_free(seg); 21692974e916SYuri Benditovich } 21702974e916SYuri Benditovich 21712974e916SYuri Benditovich timer_free(chain->drain_timer); 21722974e916SYuri Benditovich QTAILQ_REMOVE(&n->rsc_chains, chain, next); 21732974e916SYuri Benditovich g_free(chain); 21742974e916SYuri Benditovich } 21752974e916SYuri Benditovich } 21762974e916SYuri Benditovich 21772974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain, 21782974e916SYuri Benditovich NetClientState *nc, 21792974e916SYuri Benditovich const uint8_t *buf, size_t size) 21802974e916SYuri Benditovich { 21812974e916SYuri Benditovich uint16_t hdr_len; 21822974e916SYuri Benditovich VirtioNetRscSeg *seg; 21832974e916SYuri Benditovich 21842974e916SYuri Benditovich hdr_len = chain->n->guest_hdr_len; 2185b21e2380SMarkus Armbruster seg = g_new(VirtioNetRscSeg, 1); 21862974e916SYuri Benditovich seg->buf = g_malloc(hdr_len + sizeof(struct eth_header) 21872974e916SYuri Benditovich + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD); 21882974e916SYuri Benditovich memcpy(seg->buf, buf, size); 21892974e916SYuri Benditovich seg->size = size; 21902974e916SYuri Benditovich seg->packets = 1; 21912974e916SYuri Benditovich seg->dup_ack = 0; 21922974e916SYuri Benditovich seg->is_coalesced = 0; 21932974e916SYuri Benditovich seg->nc = nc; 21942974e916SYuri Benditovich 21952974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&chain->buffers, seg, next); 21962974e916SYuri Benditovich chain->stat.cache++; 21972974e916SYuri Benditovich 21982974e916SYuri Benditovich switch (chain->proto) { 21992974e916SYuri Benditovich case ETH_P_IP: 22002974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit); 22012974e916SYuri Benditovich break; 22022974e916SYuri Benditovich case ETH_P_IPV6: 22032974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit); 22042974e916SYuri Benditovich break; 22052974e916SYuri Benditovich default: 22062974e916SYuri Benditovich g_assert_not_reached(); 22072974e916SYuri Benditovich } 22082974e916SYuri Benditovich } 22092974e916SYuri Benditovich 22102974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain, 22112974e916SYuri Benditovich VirtioNetRscSeg *seg, 22122974e916SYuri Benditovich const uint8_t *buf, 22132974e916SYuri Benditovich struct tcp_header *n_tcp, 22142974e916SYuri Benditovich struct tcp_header *o_tcp) 22152974e916SYuri Benditovich { 22162974e916SYuri Benditovich uint32_t nack, oack; 22172974e916SYuri Benditovich uint16_t nwin, owin; 22182974e916SYuri Benditovich 22192974e916SYuri Benditovich nack = htonl(n_tcp->th_ack); 22202974e916SYuri Benditovich nwin = htons(n_tcp->th_win); 22212974e916SYuri Benditovich oack = htonl(o_tcp->th_ack); 22222974e916SYuri Benditovich owin = htons(o_tcp->th_win); 22232974e916SYuri Benditovich 22242974e916SYuri Benditovich if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) { 22252974e916SYuri Benditovich chain->stat.ack_out_of_win++; 22262974e916SYuri Benditovich return RSC_FINAL; 22272974e916SYuri Benditovich } else if (nack == oack) { 22282974e916SYuri Benditovich /* duplicated ack or window probe */ 22292974e916SYuri Benditovich if (nwin == owin) { 22302974e916SYuri Benditovich /* duplicated ack, add dup ack count due to whql test up to 1 */ 22312974e916SYuri Benditovich chain->stat.dup_ack++; 22322974e916SYuri Benditovich return RSC_FINAL; 22332974e916SYuri Benditovich } else { 22342974e916SYuri Benditovich /* Coalesce window update */ 22352974e916SYuri Benditovich o_tcp->th_win = n_tcp->th_win; 22362974e916SYuri Benditovich chain->stat.win_update++; 22372974e916SYuri Benditovich return RSC_COALESCE; 22382974e916SYuri Benditovich } 22392974e916SYuri Benditovich } else { 22402974e916SYuri Benditovich /* pure ack, go to 'C', finalize*/ 22412974e916SYuri Benditovich chain->stat.pure_ack++; 22422974e916SYuri Benditovich return RSC_FINAL; 22432974e916SYuri Benditovich } 22442974e916SYuri Benditovich } 22452974e916SYuri Benditovich 22462974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain, 22472974e916SYuri Benditovich VirtioNetRscSeg *seg, 22482974e916SYuri Benditovich const uint8_t *buf, 22492974e916SYuri Benditovich VirtioNetRscUnit *n_unit) 22502974e916SYuri Benditovich { 22512974e916SYuri Benditovich void *data; 22522974e916SYuri Benditovich uint16_t o_ip_len; 22532974e916SYuri Benditovich uint32_t nseq, oseq; 22542974e916SYuri Benditovich VirtioNetRscUnit *o_unit; 22552974e916SYuri Benditovich 22562974e916SYuri Benditovich o_unit = &seg->unit; 22572974e916SYuri Benditovich o_ip_len = htons(*o_unit->ip_plen); 22582974e916SYuri Benditovich nseq = htonl(n_unit->tcp->th_seq); 22592974e916SYuri Benditovich oseq = htonl(o_unit->tcp->th_seq); 22602974e916SYuri Benditovich 22612974e916SYuri Benditovich /* out of order or retransmitted. */ 22622974e916SYuri Benditovich if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) { 22632974e916SYuri Benditovich chain->stat.data_out_of_win++; 22642974e916SYuri Benditovich return RSC_FINAL; 22652974e916SYuri Benditovich } 22662974e916SYuri Benditovich 22672974e916SYuri Benditovich data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen; 22682974e916SYuri Benditovich if (nseq == oseq) { 22692974e916SYuri Benditovich if ((o_unit->payload == 0) && n_unit->payload) { 22702974e916SYuri Benditovich /* From no payload to payload, normal case, not a dup ack or etc */ 22712974e916SYuri Benditovich chain->stat.data_after_pure_ack++; 22722974e916SYuri Benditovich goto coalesce; 22732974e916SYuri Benditovich } else { 22742974e916SYuri Benditovich return virtio_net_rsc_handle_ack(chain, seg, buf, 22752974e916SYuri Benditovich n_unit->tcp, o_unit->tcp); 22762974e916SYuri Benditovich } 22772974e916SYuri Benditovich } else if ((nseq - oseq) != o_unit->payload) { 22782974e916SYuri Benditovich /* Not a consistent packet, out of order */ 22792974e916SYuri Benditovich chain->stat.data_out_of_order++; 22802974e916SYuri Benditovich return RSC_FINAL; 22812974e916SYuri Benditovich } else { 22822974e916SYuri Benditovich coalesce: 22832974e916SYuri Benditovich if ((o_ip_len + n_unit->payload) > chain->max_payload) { 22842974e916SYuri Benditovich chain->stat.over_size++; 22852974e916SYuri Benditovich return RSC_FINAL; 22862974e916SYuri Benditovich } 22872974e916SYuri Benditovich 22882974e916SYuri Benditovich /* Here comes the right data, the payload length in v4/v6 is different, 22892974e916SYuri Benditovich so use the field value to update and record the new data len */ 22902974e916SYuri Benditovich o_unit->payload += n_unit->payload; /* update new data len */ 22912974e916SYuri Benditovich 22922974e916SYuri Benditovich /* update field in ip header */ 22932974e916SYuri Benditovich *o_unit->ip_plen = htons(o_ip_len + n_unit->payload); 22942974e916SYuri Benditovich 22952974e916SYuri Benditovich /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced 22962974e916SYuri Benditovich for windows guest, while this may change the behavior for linux 22972974e916SYuri Benditovich guest (only if it uses RSC feature). */ 22982974e916SYuri Benditovich o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags; 22992974e916SYuri Benditovich 23002974e916SYuri Benditovich o_unit->tcp->th_ack = n_unit->tcp->th_ack; 23012974e916SYuri Benditovich o_unit->tcp->th_win = n_unit->tcp->th_win; 23022974e916SYuri Benditovich 23032974e916SYuri Benditovich memmove(seg->buf + seg->size, data, n_unit->payload); 23042974e916SYuri Benditovich seg->size += n_unit->payload; 23052974e916SYuri Benditovich seg->packets++; 23062974e916SYuri Benditovich chain->stat.coalesced++; 23072974e916SYuri Benditovich return RSC_COALESCE; 23082974e916SYuri Benditovich } 23092974e916SYuri Benditovich } 23102974e916SYuri Benditovich 23112974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain, 23122974e916SYuri Benditovich VirtioNetRscSeg *seg, 23132974e916SYuri Benditovich const uint8_t *buf, size_t size, 23142974e916SYuri Benditovich VirtioNetRscUnit *unit) 23152974e916SYuri Benditovich { 23162974e916SYuri Benditovich struct ip_header *ip1, *ip2; 23172974e916SYuri Benditovich 23182974e916SYuri Benditovich ip1 = (struct ip_header *)(unit->ip); 23192974e916SYuri Benditovich ip2 = (struct ip_header *)(seg->unit.ip); 23202974e916SYuri Benditovich if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst) 23212974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 23222974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 23232974e916SYuri Benditovich chain->stat.no_match++; 23242974e916SYuri Benditovich return RSC_NO_MATCH; 23252974e916SYuri Benditovich } 23262974e916SYuri Benditovich 23272974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 23282974e916SYuri Benditovich } 23292974e916SYuri Benditovich 23302974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain, 23312974e916SYuri Benditovich VirtioNetRscSeg *seg, 23322974e916SYuri Benditovich const uint8_t *buf, size_t size, 23332974e916SYuri Benditovich VirtioNetRscUnit *unit) 23342974e916SYuri Benditovich { 23352974e916SYuri Benditovich struct ip6_header *ip1, *ip2; 23362974e916SYuri Benditovich 23372974e916SYuri Benditovich ip1 = (struct ip6_header *)(unit->ip); 23382974e916SYuri Benditovich ip2 = (struct ip6_header *)(seg->unit.ip); 23392974e916SYuri Benditovich if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address)) 23402974e916SYuri Benditovich || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address)) 23412974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 23422974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 23432974e916SYuri Benditovich chain->stat.no_match++; 23442974e916SYuri Benditovich return RSC_NO_MATCH; 23452974e916SYuri Benditovich } 23462974e916SYuri Benditovich 23472974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 23482974e916SYuri Benditovich } 23492974e916SYuri Benditovich 23502974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain 23512974e916SYuri Benditovich * to prevent out of order */ 23522974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain, 23532974e916SYuri Benditovich struct tcp_header *tcp) 23542974e916SYuri Benditovich { 23552974e916SYuri Benditovich uint16_t tcp_hdr; 23562974e916SYuri Benditovich uint16_t tcp_flag; 23572974e916SYuri Benditovich 23582974e916SYuri Benditovich tcp_flag = htons(tcp->th_offset_flags); 23592974e916SYuri Benditovich tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10; 23602974e916SYuri Benditovich tcp_flag &= VIRTIO_NET_TCP_FLAG; 23612974e916SYuri Benditovich if (tcp_flag & TH_SYN) { 23622974e916SYuri Benditovich chain->stat.tcp_syn++; 23632974e916SYuri Benditovich return RSC_BYPASS; 23642974e916SYuri Benditovich } 23652974e916SYuri Benditovich 23662974e916SYuri Benditovich if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) { 23672974e916SYuri Benditovich chain->stat.tcp_ctrl_drain++; 23682974e916SYuri Benditovich return RSC_FINAL; 23692974e916SYuri Benditovich } 23702974e916SYuri Benditovich 23712974e916SYuri Benditovich if (tcp_hdr > sizeof(struct tcp_header)) { 23722974e916SYuri Benditovich chain->stat.tcp_all_opt++; 23732974e916SYuri Benditovich return RSC_FINAL; 23742974e916SYuri Benditovich } 23752974e916SYuri Benditovich 23762974e916SYuri Benditovich return RSC_CANDIDATE; 23772974e916SYuri Benditovich } 23782974e916SYuri Benditovich 23792974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain, 23802974e916SYuri Benditovich NetClientState *nc, 23812974e916SYuri Benditovich const uint8_t *buf, size_t size, 23822974e916SYuri Benditovich VirtioNetRscUnit *unit) 23832974e916SYuri Benditovich { 23842974e916SYuri Benditovich int ret; 23852974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 23862974e916SYuri Benditovich 23872974e916SYuri Benditovich if (QTAILQ_EMPTY(&chain->buffers)) { 23882974e916SYuri Benditovich chain->stat.empty_cache++; 23892974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 23902974e916SYuri Benditovich timer_mod(chain->drain_timer, 23912974e916SYuri Benditovich qemu_clock_get_ns(QEMU_CLOCK_HOST) + chain->n->rsc_timeout); 23922974e916SYuri Benditovich return size; 23932974e916SYuri Benditovich } 23942974e916SYuri Benditovich 23952974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 23962974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 23972974e916SYuri Benditovich ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit); 23982974e916SYuri Benditovich } else { 23992974e916SYuri Benditovich ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit); 24002974e916SYuri Benditovich } 24012974e916SYuri Benditovich 24022974e916SYuri Benditovich if (ret == RSC_FINAL) { 24032974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 24042974e916SYuri Benditovich /* Send failed */ 24052974e916SYuri Benditovich chain->stat.final_failed++; 24062974e916SYuri Benditovich return 0; 24072974e916SYuri Benditovich } 24082974e916SYuri Benditovich 24092974e916SYuri Benditovich /* Send current packet */ 24102974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24112974e916SYuri Benditovich } else if (ret == RSC_NO_MATCH) { 24122974e916SYuri Benditovich continue; 24132974e916SYuri Benditovich } else { 24142974e916SYuri Benditovich /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */ 24152974e916SYuri Benditovich seg->is_coalesced = 1; 24162974e916SYuri Benditovich return size; 24172974e916SYuri Benditovich } 24182974e916SYuri Benditovich } 24192974e916SYuri Benditovich 24202974e916SYuri Benditovich chain->stat.no_match_cache++; 24212974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 24222974e916SYuri Benditovich return size; 24232974e916SYuri Benditovich } 24242974e916SYuri Benditovich 24252974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */ 24262974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain, 24272974e916SYuri Benditovich NetClientState *nc, 24282974e916SYuri Benditovich const uint8_t *buf, size_t size, 24292974e916SYuri Benditovich uint16_t ip_start, uint16_t ip_size, 24302974e916SYuri Benditovich uint16_t tcp_port) 24312974e916SYuri Benditovich { 24322974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 24332974e916SYuri Benditovich uint32_t ppair1, ppair2; 24342974e916SYuri Benditovich 24352974e916SYuri Benditovich ppair1 = *(uint32_t *)(buf + tcp_port); 24362974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 24372974e916SYuri Benditovich ppair2 = *(uint32_t *)(seg->buf + tcp_port); 24382974e916SYuri Benditovich if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size) 24392974e916SYuri Benditovich || (ppair1 != ppair2)) { 24402974e916SYuri Benditovich continue; 24412974e916SYuri Benditovich } 24422974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 24432974e916SYuri Benditovich chain->stat.drain_failed++; 24442974e916SYuri Benditovich } 24452974e916SYuri Benditovich 24462974e916SYuri Benditovich break; 24472974e916SYuri Benditovich } 24482974e916SYuri Benditovich 24492974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24502974e916SYuri Benditovich } 24512974e916SYuri Benditovich 24522974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain, 24532974e916SYuri Benditovich struct ip_header *ip, 24542974e916SYuri Benditovich const uint8_t *buf, size_t size) 24552974e916SYuri Benditovich { 24562974e916SYuri Benditovich uint16_t ip_len; 24572974e916SYuri Benditovich 24582974e916SYuri Benditovich /* Not an ipv4 packet */ 24592974e916SYuri Benditovich if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) { 24602974e916SYuri Benditovich chain->stat.ip_option++; 24612974e916SYuri Benditovich return RSC_BYPASS; 24622974e916SYuri Benditovich } 24632974e916SYuri Benditovich 24642974e916SYuri Benditovich /* Don't handle packets with ip option */ 24652974e916SYuri Benditovich if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) { 24662974e916SYuri Benditovich chain->stat.ip_option++; 24672974e916SYuri Benditovich return RSC_BYPASS; 24682974e916SYuri Benditovich } 24692974e916SYuri Benditovich 24702974e916SYuri Benditovich if (ip->ip_p != IPPROTO_TCP) { 24712974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 24722974e916SYuri Benditovich return RSC_BYPASS; 24732974e916SYuri Benditovich } 24742974e916SYuri Benditovich 24752974e916SYuri Benditovich /* Don't handle packets with ip fragment */ 24762974e916SYuri Benditovich if (!(htons(ip->ip_off) & IP_DF)) { 24772974e916SYuri Benditovich chain->stat.ip_frag++; 24782974e916SYuri Benditovich return RSC_BYPASS; 24792974e916SYuri Benditovich } 24802974e916SYuri Benditovich 24812974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 24822974e916SYuri Benditovich if (IPTOS_ECN(ip->ip_tos)) { 24832974e916SYuri Benditovich chain->stat.ip_ecn++; 24842974e916SYuri Benditovich return RSC_BYPASS; 24852974e916SYuri Benditovich } 24862974e916SYuri Benditovich 24872974e916SYuri Benditovich ip_len = htons(ip->ip_len); 24882974e916SYuri Benditovich if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header)) 24892974e916SYuri Benditovich || ip_len > (size - chain->n->guest_hdr_len - 24902974e916SYuri Benditovich sizeof(struct eth_header))) { 24912974e916SYuri Benditovich chain->stat.ip_hacked++; 24922974e916SYuri Benditovich return RSC_BYPASS; 24932974e916SYuri Benditovich } 24942974e916SYuri Benditovich 24952974e916SYuri Benditovich return RSC_CANDIDATE; 24962974e916SYuri Benditovich } 24972974e916SYuri Benditovich 24982974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain, 24992974e916SYuri Benditovich NetClientState *nc, 25002974e916SYuri Benditovich const uint8_t *buf, size_t size) 25012974e916SYuri Benditovich { 25022974e916SYuri Benditovich int32_t ret; 25032974e916SYuri Benditovich uint16_t hdr_len; 25042974e916SYuri Benditovich VirtioNetRscUnit unit; 25052974e916SYuri Benditovich 25062974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 25072974e916SYuri Benditovich 25082974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header) 25092974e916SYuri Benditovich + sizeof(struct tcp_header))) { 25102974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 25112974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25122974e916SYuri Benditovich } 25132974e916SYuri Benditovich 25142974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, buf, &unit); 25152974e916SYuri Benditovich if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size) 25162974e916SYuri Benditovich != RSC_CANDIDATE) { 25172974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25182974e916SYuri Benditovich } 25192974e916SYuri Benditovich 25202974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 25212974e916SYuri Benditovich if (ret == RSC_BYPASS) { 25222974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25232974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 25242974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 25252974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 12), 25262974e916SYuri Benditovich VIRTIO_NET_IP4_ADDR_SIZE, 25272974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)); 25282974e916SYuri Benditovich } 25292974e916SYuri Benditovich 25302974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 25312974e916SYuri Benditovich } 25322974e916SYuri Benditovich 25332974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain, 25342974e916SYuri Benditovich struct ip6_header *ip6, 25352974e916SYuri Benditovich const uint8_t *buf, size_t size) 25362974e916SYuri Benditovich { 25372974e916SYuri Benditovich uint16_t ip_len; 25382974e916SYuri Benditovich 25392974e916SYuri Benditovich if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4) 25402974e916SYuri Benditovich != IP_HEADER_VERSION_6) { 25412974e916SYuri Benditovich return RSC_BYPASS; 25422974e916SYuri Benditovich } 25432974e916SYuri Benditovich 25442974e916SYuri Benditovich /* Both option and protocol is checked in this */ 25452974e916SYuri Benditovich if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) { 25462974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 25472974e916SYuri Benditovich return RSC_BYPASS; 25482974e916SYuri Benditovich } 25492974e916SYuri Benditovich 25502974e916SYuri Benditovich ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 25512974e916SYuri Benditovich if (ip_len < sizeof(struct tcp_header) || 25522974e916SYuri Benditovich ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header) 25532974e916SYuri Benditovich - sizeof(struct ip6_header))) { 25542974e916SYuri Benditovich chain->stat.ip_hacked++; 25552974e916SYuri Benditovich return RSC_BYPASS; 25562974e916SYuri Benditovich } 25572974e916SYuri Benditovich 25582974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 25592974e916SYuri Benditovich if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) { 25602974e916SYuri Benditovich chain->stat.ip_ecn++; 25612974e916SYuri Benditovich return RSC_BYPASS; 25622974e916SYuri Benditovich } 25632974e916SYuri Benditovich 25642974e916SYuri Benditovich return RSC_CANDIDATE; 25652974e916SYuri Benditovich } 25662974e916SYuri Benditovich 25672974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc, 25682974e916SYuri Benditovich const uint8_t *buf, size_t size) 25692974e916SYuri Benditovich { 25702974e916SYuri Benditovich int32_t ret; 25712974e916SYuri Benditovich uint16_t hdr_len; 25722974e916SYuri Benditovich VirtioNetRscChain *chain; 25732974e916SYuri Benditovich VirtioNetRscUnit unit; 25742974e916SYuri Benditovich 25753d558330SMarkus Armbruster chain = opq; 25762974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 25772974e916SYuri Benditovich 25782974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header) 25792974e916SYuri Benditovich + sizeof(tcp_header))) { 25802974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25812974e916SYuri Benditovich } 25822974e916SYuri Benditovich 25832974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, buf, &unit); 25842974e916SYuri Benditovich if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain, 25852974e916SYuri Benditovich unit.ip, buf, size)) { 25862974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25872974e916SYuri Benditovich } 25882974e916SYuri Benditovich 25892974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 25902974e916SYuri Benditovich if (ret == RSC_BYPASS) { 25912974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25922974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 25932974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 25942974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 8), 25952974e916SYuri Benditovich VIRTIO_NET_IP6_ADDR_SIZE, 25962974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) 25972974e916SYuri Benditovich + sizeof(struct ip6_header)); 25982974e916SYuri Benditovich } 25992974e916SYuri Benditovich 26002974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 26012974e916SYuri Benditovich } 26022974e916SYuri Benditovich 26032974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n, 26042974e916SYuri Benditovich NetClientState *nc, 26052974e916SYuri Benditovich uint16_t proto) 26062974e916SYuri Benditovich { 26072974e916SYuri Benditovich VirtioNetRscChain *chain; 26082974e916SYuri Benditovich 26092974e916SYuri Benditovich if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) { 26102974e916SYuri Benditovich return NULL; 26112974e916SYuri Benditovich } 26122974e916SYuri Benditovich 26132974e916SYuri Benditovich QTAILQ_FOREACH(chain, &n->rsc_chains, next) { 26142974e916SYuri Benditovich if (chain->proto == proto) { 26152974e916SYuri Benditovich return chain; 26162974e916SYuri Benditovich } 26172974e916SYuri Benditovich } 26182974e916SYuri Benditovich 26192974e916SYuri Benditovich chain = g_malloc(sizeof(*chain)); 26202974e916SYuri Benditovich chain->n = n; 26212974e916SYuri Benditovich chain->proto = proto; 26222974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP) { 26232974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD; 26242974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 26252974e916SYuri Benditovich } else { 26262974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD; 26272974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 26282974e916SYuri Benditovich } 26292974e916SYuri Benditovich chain->drain_timer = timer_new_ns(QEMU_CLOCK_HOST, 26302974e916SYuri Benditovich virtio_net_rsc_purge, chain); 26312974e916SYuri Benditovich memset(&chain->stat, 0, sizeof(chain->stat)); 26322974e916SYuri Benditovich 26332974e916SYuri Benditovich QTAILQ_INIT(&chain->buffers); 26342974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next); 26352974e916SYuri Benditovich 26362974e916SYuri Benditovich return chain; 26372974e916SYuri Benditovich } 26382974e916SYuri Benditovich 26392974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc, 26402974e916SYuri Benditovich const uint8_t *buf, 26412974e916SYuri Benditovich size_t size) 26422974e916SYuri Benditovich { 26432974e916SYuri Benditovich uint16_t proto; 26442974e916SYuri Benditovich VirtioNetRscChain *chain; 26452974e916SYuri Benditovich struct eth_header *eth; 26462974e916SYuri Benditovich VirtIONet *n; 26472974e916SYuri Benditovich 26482974e916SYuri Benditovich n = qemu_get_nic_opaque(nc); 26492974e916SYuri Benditovich if (size < (n->host_hdr_len + sizeof(struct eth_header))) { 26502974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26512974e916SYuri Benditovich } 26522974e916SYuri Benditovich 26532974e916SYuri Benditovich eth = (struct eth_header *)(buf + n->guest_hdr_len); 26542974e916SYuri Benditovich proto = htons(eth->h_proto); 26552974e916SYuri Benditovich 26562974e916SYuri Benditovich chain = virtio_net_rsc_lookup_chain(n, nc, proto); 26572974e916SYuri Benditovich if (chain) { 26582974e916SYuri Benditovich chain->stat.received++; 26592974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) { 26602974e916SYuri Benditovich return virtio_net_rsc_receive4(chain, nc, buf, size); 26612974e916SYuri Benditovich } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) { 26622974e916SYuri Benditovich return virtio_net_rsc_receive6(chain, nc, buf, size); 26632974e916SYuri Benditovich } 26642974e916SYuri Benditovich } 26652974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26662974e916SYuri Benditovich } 26672974e916SYuri Benditovich 26682974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, 26692974e916SYuri Benditovich size_t size) 26702974e916SYuri Benditovich { 26712974e916SYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 26722974e916SYuri Benditovich if ((n->rsc4_enabled || n->rsc6_enabled)) { 26732974e916SYuri Benditovich return virtio_net_rsc_receive(nc, buf, size); 26742974e916SYuri Benditovich } else { 26752974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26762974e916SYuri Benditovich } 26772974e916SYuri Benditovich } 26782974e916SYuri Benditovich 26796e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q); 26806e790746SPaolo Bonzini 26816e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len) 26826e790746SPaolo Bonzini { 26836e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 26846e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 268517a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2686df8d0708SLaurent Vivier int ret; 26876e790746SPaolo Bonzini 268851b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, q->async_tx.elem, 0); 268917a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 26906e790746SPaolo Bonzini 269151b19ebeSPaolo Bonzini g_free(q->async_tx.elem); 269251b19ebeSPaolo Bonzini q->async_tx.elem = NULL; 26936e790746SPaolo Bonzini 26946e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 2695df8d0708SLaurent Vivier ret = virtio_net_flush_tx(q); 26967550a822SLaurent Vivier if (ret >= n->tx_burst) { 2697df8d0708SLaurent Vivier /* 2698df8d0708SLaurent Vivier * the flush has been stopped by tx_burst 2699df8d0708SLaurent Vivier * we will not receive notification for the 2700df8d0708SLaurent Vivier * remainining part, so re-schedule 2701df8d0708SLaurent Vivier */ 2702df8d0708SLaurent Vivier virtio_queue_set_notification(q->tx_vq, 0); 27037550a822SLaurent Vivier if (q->tx_bh) { 2704df8d0708SLaurent Vivier qemu_bh_schedule(q->tx_bh); 27057550a822SLaurent Vivier } else { 27067550a822SLaurent Vivier timer_mod(q->tx_timer, 27077550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 27087550a822SLaurent Vivier } 2709df8d0708SLaurent Vivier q->tx_waiting = 1; 2710df8d0708SLaurent Vivier } 27116e790746SPaolo Bonzini } 27126e790746SPaolo Bonzini 27136e790746SPaolo Bonzini /* TX */ 27146e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q) 27156e790746SPaolo Bonzini { 27166e790746SPaolo Bonzini VirtIONet *n = q->n; 271717a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 271851b19ebeSPaolo Bonzini VirtQueueElement *elem; 27196e790746SPaolo Bonzini int32_t num_packets = 0; 27206e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(q->tx_vq)); 272117a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 27226e790746SPaolo Bonzini return num_packets; 27236e790746SPaolo Bonzini } 27246e790746SPaolo Bonzini 272551b19ebeSPaolo Bonzini if (q->async_tx.elem) { 27266e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 27276e790746SPaolo Bonzini return num_packets; 27286e790746SPaolo Bonzini } 27296e790746SPaolo Bonzini 273051b19ebeSPaolo Bonzini for (;;) { 2731bd89dd98SJason Wang ssize_t ret; 273251b19ebeSPaolo Bonzini unsigned int out_num; 273351b19ebeSPaolo Bonzini struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg; 2734*942f420eSAkihiko Odaki struct virtio_net_hdr vhdr; 27356e790746SPaolo Bonzini 273651b19ebeSPaolo Bonzini elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement)); 273751b19ebeSPaolo Bonzini if (!elem) { 273851b19ebeSPaolo Bonzini break; 273951b19ebeSPaolo Bonzini } 274051b19ebeSPaolo Bonzini 274151b19ebeSPaolo Bonzini out_num = elem->out_num; 274251b19ebeSPaolo Bonzini out_sg = elem->out_sg; 27436e790746SPaolo Bonzini if (out_num < 1) { 2744fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header not in first element"); 2745fa5e56c2SGreg Kurz virtqueue_detach_element(q->tx_vq, elem, 0); 2746fa5e56c2SGreg Kurz g_free(elem); 2747fa5e56c2SGreg Kurz return -EINVAL; 27486e790746SPaolo Bonzini } 27496e790746SPaolo Bonzini 2750ad57f700SAkihiko Odaki if (n->needs_vnet_hdr_swap) { 2751*942f420eSAkihiko Odaki if (iov_to_buf(out_sg, out_num, 0, &vhdr, sizeof(vhdr)) < 2752*942f420eSAkihiko Odaki sizeof(vhdr)) { 2753fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header incorrect"); 2754fa5e56c2SGreg Kurz virtqueue_detach_element(q->tx_vq, elem, 0); 2755fa5e56c2SGreg Kurz g_free(elem); 2756fa5e56c2SGreg Kurz return -EINVAL; 2757032a74a1SCédric Le Goater } 2758*942f420eSAkihiko Odaki virtio_net_hdr_swap(vdev, &vhdr); 27592220e818SJason Wang sg2[0].iov_base = &vhdr; 2760*942f420eSAkihiko Odaki sg2[0].iov_len = sizeof(vhdr); 2761ad57f700SAkihiko Odaki out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1, out_sg, out_num, 2762*942f420eSAkihiko Odaki sizeof(vhdr), -1); 2763feb93f36SJason Wang if (out_num == VIRTQUEUE_MAX_SIZE) { 2764feb93f36SJason Wang goto drop; 2765032a74a1SCédric Le Goater } 2766feb93f36SJason Wang out_num += 1; 2767feb93f36SJason Wang out_sg = sg2; 2768feb93f36SJason Wang } 27696e790746SPaolo Bonzini /* 27706e790746SPaolo Bonzini * If host wants to see the guest header as is, we can 27716e790746SPaolo Bonzini * pass it on unchanged. Otherwise, copy just the parts 27726e790746SPaolo Bonzini * that host is interested in. 27736e790746SPaolo Bonzini */ 27746e790746SPaolo Bonzini assert(n->host_hdr_len <= n->guest_hdr_len); 27756e790746SPaolo Bonzini if (n->host_hdr_len != n->guest_hdr_len) { 27766e790746SPaolo Bonzini unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg), 27776e790746SPaolo Bonzini out_sg, out_num, 27786e790746SPaolo Bonzini 0, n->host_hdr_len); 27796e790746SPaolo Bonzini sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num, 27806e790746SPaolo Bonzini out_sg, out_num, 27816e790746SPaolo Bonzini n->guest_hdr_len, -1); 27826e790746SPaolo Bonzini out_num = sg_num; 27836e790746SPaolo Bonzini out_sg = sg; 27846e790746SPaolo Bonzini } 27856e790746SPaolo Bonzini 27866e790746SPaolo Bonzini ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index), 27876e790746SPaolo Bonzini out_sg, out_num, virtio_net_tx_complete); 27886e790746SPaolo Bonzini if (ret == 0) { 27896e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 27906e790746SPaolo Bonzini q->async_tx.elem = elem; 27916e790746SPaolo Bonzini return -EBUSY; 27926e790746SPaolo Bonzini } 27936e790746SPaolo Bonzini 2794feb93f36SJason Wang drop: 279551b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, elem, 0); 279617a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 279751b19ebeSPaolo Bonzini g_free(elem); 27986e790746SPaolo Bonzini 27996e790746SPaolo Bonzini if (++num_packets >= n->tx_burst) { 28006e790746SPaolo Bonzini break; 28016e790746SPaolo Bonzini } 28026e790746SPaolo Bonzini } 28036e790746SPaolo Bonzini return num_packets; 28046e790746SPaolo Bonzini } 28056e790746SPaolo Bonzini 28067550a822SLaurent Vivier static void virtio_net_tx_timer(void *opaque); 28077550a822SLaurent Vivier 28086e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq) 28096e790746SPaolo Bonzini { 281017a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 28116e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 28126e790746SPaolo Bonzini 2813283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2814283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2815283e2c2aSYuri Benditovich return; 2816283e2c2aSYuri Benditovich } 2817283e2c2aSYuri Benditovich 28186e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 281917a0ca55SKONRAD Frederic if (!vdev->vm_running) { 28206e790746SPaolo Bonzini q->tx_waiting = 1; 28216e790746SPaolo Bonzini return; 28226e790746SPaolo Bonzini } 28236e790746SPaolo Bonzini 28246e790746SPaolo Bonzini if (q->tx_waiting) { 28257550a822SLaurent Vivier /* We already have queued packets, immediately flush */ 2826bc72ad67SAlex Bligh timer_del(q->tx_timer); 28277550a822SLaurent Vivier virtio_net_tx_timer(q); 28286e790746SPaolo Bonzini } else { 28297550a822SLaurent Vivier /* re-arm timer to flush it (and more) on next tick */ 2830bc72ad67SAlex Bligh timer_mod(q->tx_timer, 2831bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 28326e790746SPaolo Bonzini q->tx_waiting = 1; 28336e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 28346e790746SPaolo Bonzini } 28356e790746SPaolo Bonzini } 28366e790746SPaolo Bonzini 28376e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq) 28386e790746SPaolo Bonzini { 283917a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 28406e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 28416e790746SPaolo Bonzini 28424c54f5bcSYajun Wu if (unlikely(n->vhost_started)) { 28434c54f5bcSYajun Wu return; 28444c54f5bcSYajun Wu } 28454c54f5bcSYajun Wu 2846283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2847283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2848283e2c2aSYuri Benditovich return; 2849283e2c2aSYuri Benditovich } 2850283e2c2aSYuri Benditovich 28516e790746SPaolo Bonzini if (unlikely(q->tx_waiting)) { 28526e790746SPaolo Bonzini return; 28536e790746SPaolo Bonzini } 28546e790746SPaolo Bonzini q->tx_waiting = 1; 28556e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 285617a0ca55SKONRAD Frederic if (!vdev->vm_running) { 28576e790746SPaolo Bonzini return; 28586e790746SPaolo Bonzini } 28596e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 28606e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 28616e790746SPaolo Bonzini } 28626e790746SPaolo Bonzini 28636e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque) 28646e790746SPaolo Bonzini { 28656e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 28666e790746SPaolo Bonzini VirtIONet *n = q->n; 286717a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 28687550a822SLaurent Vivier int ret; 28697550a822SLaurent Vivier 2870e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2871e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2872e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2873e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2874e8bcf842SMichael S. Tsirkin return; 2875e8bcf842SMichael S. Tsirkin } 28766e790746SPaolo Bonzini 28776e790746SPaolo Bonzini q->tx_waiting = 0; 28786e790746SPaolo Bonzini 28796e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 288017a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 28816e790746SPaolo Bonzini return; 288217a0ca55SKONRAD Frederic } 28836e790746SPaolo Bonzini 28847550a822SLaurent Vivier ret = virtio_net_flush_tx(q); 28857550a822SLaurent Vivier if (ret == -EBUSY || ret == -EINVAL) { 28867550a822SLaurent Vivier return; 28877550a822SLaurent Vivier } 28887550a822SLaurent Vivier /* 28897550a822SLaurent Vivier * If we flush a full burst of packets, assume there are 28907550a822SLaurent Vivier * more coming and immediately rearm 28917550a822SLaurent Vivier */ 28927550a822SLaurent Vivier if (ret >= n->tx_burst) { 28937550a822SLaurent Vivier q->tx_waiting = 1; 28947550a822SLaurent Vivier timer_mod(q->tx_timer, 28957550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 28967550a822SLaurent Vivier return; 28977550a822SLaurent Vivier } 28987550a822SLaurent Vivier /* 28997550a822SLaurent Vivier * If less than a full burst, re-enable notification and flush 29007550a822SLaurent Vivier * anything that may have come in while we weren't looking. If 29017550a822SLaurent Vivier * we find something, assume the guest is still active and rearm 29027550a822SLaurent Vivier */ 29036e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 29047550a822SLaurent Vivier ret = virtio_net_flush_tx(q); 29057550a822SLaurent Vivier if (ret > 0) { 29067550a822SLaurent Vivier virtio_queue_set_notification(q->tx_vq, 0); 29077550a822SLaurent Vivier q->tx_waiting = 1; 29087550a822SLaurent Vivier timer_mod(q->tx_timer, 29097550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 29107550a822SLaurent Vivier } 29116e790746SPaolo Bonzini } 29126e790746SPaolo Bonzini 29136e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque) 29146e790746SPaolo Bonzini { 29156e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 29166e790746SPaolo Bonzini VirtIONet *n = q->n; 291717a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 29186e790746SPaolo Bonzini int32_t ret; 29196e790746SPaolo Bonzini 2920e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2921e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2922e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2923e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2924e8bcf842SMichael S. Tsirkin return; 2925e8bcf842SMichael S. Tsirkin } 29266e790746SPaolo Bonzini 29276e790746SPaolo Bonzini q->tx_waiting = 0; 29286e790746SPaolo Bonzini 29296e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 293017a0ca55SKONRAD Frederic if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) { 29316e790746SPaolo Bonzini return; 293217a0ca55SKONRAD Frederic } 29336e790746SPaolo Bonzini 29346e790746SPaolo Bonzini ret = virtio_net_flush_tx(q); 2935fa5e56c2SGreg Kurz if (ret == -EBUSY || ret == -EINVAL) { 2936fa5e56c2SGreg Kurz return; /* Notification re-enable handled by tx_complete or device 2937fa5e56c2SGreg Kurz * broken */ 29386e790746SPaolo Bonzini } 29396e790746SPaolo Bonzini 29406e790746SPaolo Bonzini /* If we flush a full burst of packets, assume there are 29416e790746SPaolo Bonzini * more coming and immediately reschedule */ 29426e790746SPaolo Bonzini if (ret >= n->tx_burst) { 29436e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 29446e790746SPaolo Bonzini q->tx_waiting = 1; 29456e790746SPaolo Bonzini return; 29466e790746SPaolo Bonzini } 29476e790746SPaolo Bonzini 29486e790746SPaolo Bonzini /* If less than a full burst, re-enable notification and flush 29496e790746SPaolo Bonzini * anything that may have come in while we weren't looking. If 29506e790746SPaolo Bonzini * we find something, assume the guest is still active and reschedule */ 29516e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 2952fa5e56c2SGreg Kurz ret = virtio_net_flush_tx(q); 2953fa5e56c2SGreg Kurz if (ret == -EINVAL) { 2954fa5e56c2SGreg Kurz return; 2955fa5e56c2SGreg Kurz } else if (ret > 0) { 29566e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 29576e790746SPaolo Bonzini qemu_bh_schedule(q->tx_bh); 29586e790746SPaolo Bonzini q->tx_waiting = 1; 29596e790746SPaolo Bonzini } 29606e790746SPaolo Bonzini } 29616e790746SPaolo Bonzini 2962f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index) 2963f9d6dbf0SWen Congyang { 2964f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2965f9d6dbf0SWen Congyang 29661c0fbfa3SMichael S. Tsirkin n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size, 29671c0fbfa3SMichael S. Tsirkin virtio_net_handle_rx); 29689b02e161SWei Wang 2969f9d6dbf0SWen Congyang if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) { 2970f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 29719b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 29729b02e161SWei Wang virtio_net_handle_tx_timer); 2973f9d6dbf0SWen Congyang n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, 2974f9d6dbf0SWen Congyang virtio_net_tx_timer, 2975f9d6dbf0SWen Congyang &n->vqs[index]); 2976f9d6dbf0SWen Congyang } else { 2977f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 29789b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 29799b02e161SWei Wang virtio_net_handle_tx_bh); 2980f63192b0SAlexander Bulekov n->vqs[index].tx_bh = qemu_bh_new_guarded(virtio_net_tx_bh, &n->vqs[index], 2981f63192b0SAlexander Bulekov &DEVICE(vdev)->mem_reentrancy_guard); 2982f9d6dbf0SWen Congyang } 2983f9d6dbf0SWen Congyang 2984f9d6dbf0SWen Congyang n->vqs[index].tx_waiting = 0; 2985f9d6dbf0SWen Congyang n->vqs[index].n = n; 2986f9d6dbf0SWen Congyang } 2987f9d6dbf0SWen Congyang 2988f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index) 2989f9d6dbf0SWen Congyang { 2990f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2991f9d6dbf0SWen Congyang VirtIONetQueue *q = &n->vqs[index]; 2992f9d6dbf0SWen Congyang NetClientState *nc = qemu_get_subqueue(n->nic, index); 2993f9d6dbf0SWen Congyang 2994f9d6dbf0SWen Congyang qemu_purge_queued_packets(nc); 2995f9d6dbf0SWen Congyang 2996f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2); 2997f9d6dbf0SWen Congyang if (q->tx_timer) { 2998f9d6dbf0SWen Congyang timer_free(q->tx_timer); 2999f989c30cSYunjian Wang q->tx_timer = NULL; 3000f9d6dbf0SWen Congyang } else { 3001f9d6dbf0SWen Congyang qemu_bh_delete(q->tx_bh); 3002f989c30cSYunjian Wang q->tx_bh = NULL; 3003f9d6dbf0SWen Congyang } 3004f989c30cSYunjian Wang q->tx_waiting = 0; 3005f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2 + 1); 3006f9d6dbf0SWen Congyang } 3007f9d6dbf0SWen Congyang 3008441537f1SJason Wang static void virtio_net_change_num_queue_pairs(VirtIONet *n, int new_max_queue_pairs) 3009f9d6dbf0SWen Congyang { 3010f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 3011f9d6dbf0SWen Congyang int old_num_queues = virtio_get_num_queues(vdev); 3012441537f1SJason Wang int new_num_queues = new_max_queue_pairs * 2 + 1; 3013f9d6dbf0SWen Congyang int i; 3014f9d6dbf0SWen Congyang 3015f9d6dbf0SWen Congyang assert(old_num_queues >= 3); 3016f9d6dbf0SWen Congyang assert(old_num_queues % 2 == 1); 3017f9d6dbf0SWen Congyang 3018f9d6dbf0SWen Congyang if (old_num_queues == new_num_queues) { 3019f9d6dbf0SWen Congyang return; 3020f9d6dbf0SWen Congyang } 3021f9d6dbf0SWen Congyang 3022f9d6dbf0SWen Congyang /* 3023f9d6dbf0SWen Congyang * We always need to remove and add ctrl vq if 3024f9d6dbf0SWen Congyang * old_num_queues != new_num_queues. Remove ctrl_vq first, 302520f86a75SYuval Shaia * and then we only enter one of the following two loops. 3026f9d6dbf0SWen Congyang */ 3027f9d6dbf0SWen Congyang virtio_del_queue(vdev, old_num_queues - 1); 3028f9d6dbf0SWen Congyang 3029f9d6dbf0SWen Congyang for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) { 3030f9d6dbf0SWen Congyang /* new_num_queues < old_num_queues */ 3031f9d6dbf0SWen Congyang virtio_net_del_queue(n, i / 2); 3032f9d6dbf0SWen Congyang } 3033f9d6dbf0SWen Congyang 3034f9d6dbf0SWen Congyang for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) { 3035f9d6dbf0SWen Congyang /* new_num_queues > old_num_queues */ 3036f9d6dbf0SWen Congyang virtio_net_add_queue(n, i / 2); 3037f9d6dbf0SWen Congyang } 3038f9d6dbf0SWen Congyang 3039f9d6dbf0SWen Congyang /* add ctrl_vq last */ 3040f9d6dbf0SWen Congyang n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 3041f9d6dbf0SWen Congyang } 3042f9d6dbf0SWen Congyang 3043ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue) 30446e790746SPaolo Bonzini { 3045441537f1SJason Wang int max = multiqueue ? n->max_queue_pairs : 1; 3046f9d6dbf0SWen Congyang 30476e790746SPaolo Bonzini n->multiqueue = multiqueue; 3048441537f1SJason Wang virtio_net_change_num_queue_pairs(n, max); 30496e790746SPaolo Bonzini 3050441537f1SJason Wang virtio_net_set_queue_pairs(n); 30516e790746SPaolo Bonzini } 30526e790746SPaolo Bonzini 3053982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id) 3054037dab2fSGreg Kurz { 3055982b78c5SDr. David Alan Gilbert VirtIONet *n = opaque; 3056982b78c5SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 3057037dab2fSGreg Kurz int i, link_down; 3058037dab2fSGreg Kurz 30599d8c6a25SDr. David Alan Gilbert trace_virtio_net_post_load_device(); 3060982b78c5SDr. David Alan Gilbert virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs, 306195129d6fSCornelia Huck virtio_vdev_has_feature(vdev, 3062e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 3063e22f0603SYuri Benditovich virtio_vdev_has_feature(vdev, 3064e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 30656e790746SPaolo Bonzini 30666e790746SPaolo Bonzini /* MAC_TABLE_ENTRIES may be different from the saved image */ 3067982b78c5SDr. David Alan Gilbert if (n->mac_table.in_use > MAC_TABLE_ENTRIES) { 30686e790746SPaolo Bonzini n->mac_table.in_use = 0; 30696e790746SPaolo Bonzini } 30706e790746SPaolo Bonzini 3071982b78c5SDr. David Alan Gilbert if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 30726c666823SMichael S. Tsirkin n->curr_guest_offloads = virtio_net_supported_guest_offloads(n); 30736c666823SMichael S. Tsirkin } 30746c666823SMichael S. Tsirkin 30757788c3f2SMikhail Sennikovsky /* 30767788c3f2SMikhail Sennikovsky * curr_guest_offloads will be later overwritten by the 30777788c3f2SMikhail Sennikovsky * virtio_set_features_nocheck call done from the virtio_load. 30787788c3f2SMikhail Sennikovsky * Here we make sure it is preserved and restored accordingly 30797788c3f2SMikhail Sennikovsky * in the virtio_net_post_load_virtio callback. 30807788c3f2SMikhail Sennikovsky */ 30817788c3f2SMikhail Sennikovsky n->saved_guest_offloads = n->curr_guest_offloads; 30826c666823SMichael S. Tsirkin 3083441537f1SJason Wang virtio_net_set_queue_pairs(n); 30846e790746SPaolo Bonzini 30856e790746SPaolo Bonzini /* Find the first multicast entry in the saved MAC filter */ 30866e790746SPaolo Bonzini for (i = 0; i < n->mac_table.in_use; i++) { 30876e790746SPaolo Bonzini if (n->mac_table.macs[i * ETH_ALEN] & 1) { 30886e790746SPaolo Bonzini break; 30896e790746SPaolo Bonzini } 30906e790746SPaolo Bonzini } 30916e790746SPaolo Bonzini n->mac_table.first_multi = i; 30926e790746SPaolo Bonzini 30936e790746SPaolo Bonzini /* nc.link_down can't be migrated, so infer link_down according 30946e790746SPaolo Bonzini * to link status bit in n->status */ 30956e790746SPaolo Bonzini link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0; 3096441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 30976e790746SPaolo Bonzini qemu_get_subqueue(n->nic, i)->link_down = link_down; 30986e790746SPaolo Bonzini } 30996e790746SPaolo Bonzini 31006c666823SMichael S. Tsirkin if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 31016c666823SMichael S. Tsirkin virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 31029d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 31039d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 31049d8c6a25SDr. David Alan Gilbert virtio_net_announce_timer, n); 31059d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 31069d8c6a25SDr. David Alan Gilbert timer_mod(n->announce_timer.tm, 31079d8c6a25SDr. David Alan Gilbert qemu_clock_get_ms(n->announce_timer.type)); 31089d8c6a25SDr. David Alan Gilbert } else { 3109944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 31109d8c6a25SDr. David Alan Gilbert } 31116c666823SMichael S. Tsirkin } 31126c666823SMichael S. Tsirkin 3113e41b7114SYuri Benditovich if (n->rss_data.enabled) { 31140145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = n->rss_data.populate_hash; 31150145c393SAndrew Melnychenko if (!n->rss_data.populate_hash) { 31160145c393SAndrew Melnychenko if (!virtio_net_attach_epbf_rss(n)) { 31170145c393SAndrew Melnychenko if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 31180145c393SAndrew Melnychenko warn_report("Can't post-load eBPF RSS for vhost"); 31190145c393SAndrew Melnychenko } else { 31200145c393SAndrew Melnychenko warn_report("Can't post-load eBPF RSS - " 31210145c393SAndrew Melnychenko "fallback to software RSS"); 31220145c393SAndrew Melnychenko n->rss_data.enabled_software_rss = true; 31230145c393SAndrew Melnychenko } 31240145c393SAndrew Melnychenko } 31250145c393SAndrew Melnychenko } 31260145c393SAndrew Melnychenko 3127e41b7114SYuri Benditovich trace_virtio_net_rss_enable(n->rss_data.hash_types, 3128e41b7114SYuri Benditovich n->rss_data.indirections_len, 3129e41b7114SYuri Benditovich sizeof(n->rss_data.key)); 3130e41b7114SYuri Benditovich } else { 3131e41b7114SYuri Benditovich trace_virtio_net_rss_disable(); 3132e41b7114SYuri Benditovich } 31336e790746SPaolo Bonzini return 0; 31346e790746SPaolo Bonzini } 31356e790746SPaolo Bonzini 31367788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev) 31377788c3f2SMikhail Sennikovsky { 31387788c3f2SMikhail Sennikovsky VirtIONet *n = VIRTIO_NET(vdev); 31397788c3f2SMikhail Sennikovsky /* 31407788c3f2SMikhail Sennikovsky * The actual needed state is now in saved_guest_offloads, 31417788c3f2SMikhail Sennikovsky * see virtio_net_post_load_device for detail. 31427788c3f2SMikhail Sennikovsky * Restore it back and apply the desired offloads. 31437788c3f2SMikhail Sennikovsky */ 31447788c3f2SMikhail Sennikovsky n->curr_guest_offloads = n->saved_guest_offloads; 31457788c3f2SMikhail Sennikovsky if (peer_has_vnet_hdr(n)) { 31467788c3f2SMikhail Sennikovsky virtio_net_apply_guest_offloads(n); 31477788c3f2SMikhail Sennikovsky } 31487788c3f2SMikhail Sennikovsky 31497788c3f2SMikhail Sennikovsky return 0; 31507788c3f2SMikhail Sennikovsky } 31517788c3f2SMikhail Sennikovsky 3152982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */ 3153982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = { 3154982b78c5SDr. David Alan Gilbert .name = "virtio-net-queue-tx_waiting", 31551de81b42SRichard Henderson .fields = (const VMStateField[]) { 3156982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(tx_waiting, VirtIONetQueue), 3157982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3158982b78c5SDr. David Alan Gilbert }, 3159982b78c5SDr. David Alan Gilbert }; 3160982b78c5SDr. David Alan Gilbert 3161441537f1SJason Wang static bool max_queue_pairs_gt_1(void *opaque, int version_id) 3162982b78c5SDr. David Alan Gilbert { 3163441537f1SJason Wang return VIRTIO_NET(opaque)->max_queue_pairs > 1; 3164982b78c5SDr. David Alan Gilbert } 3165982b78c5SDr. David Alan Gilbert 3166982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id) 3167982b78c5SDr. David Alan Gilbert { 3168982b78c5SDr. David Alan Gilbert return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque), 3169982b78c5SDr. David Alan Gilbert VIRTIO_NET_F_CTRL_GUEST_OFFLOADS); 3170982b78c5SDr. David Alan Gilbert } 3171982b78c5SDr. David Alan Gilbert 3172982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id) 3173982b78c5SDr. David Alan Gilbert { 3174982b78c5SDr. David Alan Gilbert return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES; 3175982b78c5SDr. David Alan Gilbert } 3176982b78c5SDr. David Alan Gilbert 3177982b78c5SDr. David Alan Gilbert static bool mac_table_doesnt_fit(void *opaque, int version_id) 3178982b78c5SDr. David Alan Gilbert { 3179982b78c5SDr. David Alan Gilbert return !mac_table_fits(opaque, version_id); 3180982b78c5SDr. David Alan Gilbert } 3181982b78c5SDr. David Alan Gilbert 3182982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods 3183982b78c5SDr. David Alan Gilbert * although only some fields are used by each. 3184982b78c5SDr. David Alan Gilbert */ 3185982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp { 3186982b78c5SDr. David Alan Gilbert VirtIONet *parent; 3187982b78c5SDr. David Alan Gilbert VirtIONetQueue *vqs_1; 3188441537f1SJason Wang uint16_t curr_queue_pairs_1; 3189982b78c5SDr. David Alan Gilbert uint8_t has_ufo; 3190982b78c5SDr. David Alan Gilbert uint32_t has_vnet_hdr; 3191982b78c5SDr. David Alan Gilbert }; 3192982b78c5SDr. David Alan Gilbert 3193982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than 3194441537f1SJason Wang * the 1st entry in the queue_pairs and only if there's more than one 3195982b78c5SDr. David Alan Gilbert * entry. We use the tmp mechanism to calculate a temporary 3196982b78c5SDr. David Alan Gilbert * pointer and count and also validate the count. 3197982b78c5SDr. David Alan Gilbert */ 3198982b78c5SDr. David Alan Gilbert 319944b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque) 3200982b78c5SDr. David Alan Gilbert { 3201982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3202982b78c5SDr. David Alan Gilbert 3203982b78c5SDr. David Alan Gilbert tmp->vqs_1 = tmp->parent->vqs + 1; 3204441537f1SJason Wang tmp->curr_queue_pairs_1 = tmp->parent->curr_queue_pairs - 1; 3205441537f1SJason Wang if (tmp->parent->curr_queue_pairs == 0) { 3206441537f1SJason Wang tmp->curr_queue_pairs_1 = 0; 3207982b78c5SDr. David Alan Gilbert } 320844b1ff31SDr. David Alan Gilbert 320944b1ff31SDr. David Alan Gilbert return 0; 3210982b78c5SDr. David Alan Gilbert } 3211982b78c5SDr. David Alan Gilbert 3212982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque) 3213982b78c5SDr. David Alan Gilbert { 3214982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3215982b78c5SDr. David Alan Gilbert 3216982b78c5SDr. David Alan Gilbert /* Reuse the pointer setup from save */ 3217982b78c5SDr. David Alan Gilbert virtio_net_tx_waiting_pre_save(opaque); 3218982b78c5SDr. David Alan Gilbert 3219441537f1SJason Wang if (tmp->parent->curr_queue_pairs > tmp->parent->max_queue_pairs) { 3220441537f1SJason Wang error_report("virtio-net: curr_queue_pairs %x > max_queue_pairs %x", 3221441537f1SJason Wang tmp->parent->curr_queue_pairs, tmp->parent->max_queue_pairs); 3222982b78c5SDr. David Alan Gilbert 3223982b78c5SDr. David Alan Gilbert return -EINVAL; 3224982b78c5SDr. David Alan Gilbert } 3225982b78c5SDr. David Alan Gilbert 3226982b78c5SDr. David Alan Gilbert return 0; /* all good */ 3227982b78c5SDr. David Alan Gilbert } 3228982b78c5SDr. David Alan Gilbert 3229982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = { 3230982b78c5SDr. David Alan Gilbert .name = "virtio-net-tx_waiting", 3231982b78c5SDr. David Alan Gilbert .pre_load = virtio_net_tx_waiting_pre_load, 3232982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_tx_waiting_pre_save, 32331de81b42SRichard Henderson .fields = (const VMStateField[]) { 3234982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp, 3235441537f1SJason Wang curr_queue_pairs_1, 3236982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3237982b78c5SDr. David Alan Gilbert struct VirtIONetQueue), 3238982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3239982b78c5SDr. David Alan Gilbert }, 3240982b78c5SDr. David Alan Gilbert }; 3241982b78c5SDr. David Alan Gilbert 3242982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the 3243982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3244982b78c5SDr. David Alan Gilbert */ 3245982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id) 3246982b78c5SDr. David Alan Gilbert { 3247982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3248982b78c5SDr. David Alan Gilbert 3249982b78c5SDr. David Alan Gilbert if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) { 3250982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires TUN_F_UFO support"); 3251982b78c5SDr. David Alan Gilbert return -EINVAL; 3252982b78c5SDr. David Alan Gilbert } 3253982b78c5SDr. David Alan Gilbert 3254982b78c5SDr. David Alan Gilbert return 0; 3255982b78c5SDr. David Alan Gilbert } 3256982b78c5SDr. David Alan Gilbert 325744b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque) 3258982b78c5SDr. David Alan Gilbert { 3259982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3260982b78c5SDr. David Alan Gilbert 3261982b78c5SDr. David Alan Gilbert tmp->has_ufo = tmp->parent->has_ufo; 326244b1ff31SDr. David Alan Gilbert 326344b1ff31SDr. David Alan Gilbert return 0; 3264982b78c5SDr. David Alan Gilbert } 3265982b78c5SDr. David Alan Gilbert 3266982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = { 3267982b78c5SDr. David Alan Gilbert .name = "virtio-net-ufo", 3268982b78c5SDr. David Alan Gilbert .post_load = virtio_net_ufo_post_load, 3269982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_ufo_pre_save, 32701de81b42SRichard Henderson .fields = (const VMStateField[]) { 3271982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp), 3272982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3273982b78c5SDr. David Alan Gilbert }, 3274982b78c5SDr. David Alan Gilbert }; 3275982b78c5SDr. David Alan Gilbert 3276982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the 3277982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3278982b78c5SDr. David Alan Gilbert */ 3279982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id) 3280982b78c5SDr. David Alan Gilbert { 3281982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3282982b78c5SDr. David Alan Gilbert 3283982b78c5SDr. David Alan Gilbert if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) { 3284982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires vnet_hdr=on"); 3285982b78c5SDr. David Alan Gilbert return -EINVAL; 3286982b78c5SDr. David Alan Gilbert } 3287982b78c5SDr. David Alan Gilbert 3288982b78c5SDr. David Alan Gilbert return 0; 3289982b78c5SDr. David Alan Gilbert } 3290982b78c5SDr. David Alan Gilbert 329144b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque) 3292982b78c5SDr. David Alan Gilbert { 3293982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3294982b78c5SDr. David Alan Gilbert 3295982b78c5SDr. David Alan Gilbert tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr; 329644b1ff31SDr. David Alan Gilbert 329744b1ff31SDr. David Alan Gilbert return 0; 3298982b78c5SDr. David Alan Gilbert } 3299982b78c5SDr. David Alan Gilbert 3300982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = { 3301982b78c5SDr. David Alan Gilbert .name = "virtio-net-vnet", 3302982b78c5SDr. David Alan Gilbert .post_load = virtio_net_vnet_post_load, 3303982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_vnet_pre_save, 33041de81b42SRichard Henderson .fields = (const VMStateField[]) { 3305982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp), 3306982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3307982b78c5SDr. David Alan Gilbert }, 3308982b78c5SDr. David Alan Gilbert }; 3309982b78c5SDr. David Alan Gilbert 3310e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque) 3311e41b7114SYuri Benditovich { 3312e41b7114SYuri Benditovich return VIRTIO_NET(opaque)->rss_data.enabled; 3313e41b7114SYuri Benditovich } 3314e41b7114SYuri Benditovich 3315e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = { 3316e41b7114SYuri Benditovich .name = "virtio-net-device/rss", 3317e41b7114SYuri Benditovich .version_id = 1, 3318e41b7114SYuri Benditovich .minimum_version_id = 1, 3319e41b7114SYuri Benditovich .needed = virtio_net_rss_needed, 33201de81b42SRichard Henderson .fields = (const VMStateField[]) { 3321e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.enabled, VirtIONet), 3322e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.redirect, VirtIONet), 3323e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.populate_hash, VirtIONet), 3324e41b7114SYuri Benditovich VMSTATE_UINT32(rss_data.hash_types, VirtIONet), 3325e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.indirections_len, VirtIONet), 3326e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.default_queue, VirtIONet), 3327e41b7114SYuri Benditovich VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet, 3328e41b7114SYuri Benditovich VIRTIO_NET_RSS_MAX_KEY_SIZE), 3329e41b7114SYuri Benditovich VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet, 3330e41b7114SYuri Benditovich rss_data.indirections_len, 0, 3331e41b7114SYuri Benditovich vmstate_info_uint16, uint16_t), 3332e41b7114SYuri Benditovich VMSTATE_END_OF_LIST() 3333e41b7114SYuri Benditovich }, 3334e41b7114SYuri Benditovich }; 3335e41b7114SYuri Benditovich 3336982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = { 3337982b78c5SDr. David Alan Gilbert .name = "virtio-net-device", 3338982b78c5SDr. David Alan Gilbert .version_id = VIRTIO_NET_VM_VERSION, 3339982b78c5SDr. David Alan Gilbert .minimum_version_id = VIRTIO_NET_VM_VERSION, 3340982b78c5SDr. David Alan Gilbert .post_load = virtio_net_post_load_device, 33411de81b42SRichard Henderson .fields = (const VMStateField[]) { 3342982b78c5SDr. David Alan Gilbert VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN), 3343982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_POINTER(vqs, VirtIONet, 3344982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3345982b78c5SDr. David Alan Gilbert VirtIONetQueue), 3346982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet), 3347982b78c5SDr. David Alan Gilbert VMSTATE_UINT16(status, VirtIONet), 3348982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(promisc, VirtIONet), 3349982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(allmulti, VirtIONet), 3350982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mac_table.in_use, VirtIONet), 3351982b78c5SDr. David Alan Gilbert 3352982b78c5SDr. David Alan Gilbert /* Guarded pair: If it fits we load it, else we throw it away 3353982b78c5SDr. David Alan Gilbert * - can happen if source has a larger MAC table.; post-load 3354982b78c5SDr. David Alan Gilbert * sets flags in this case. 3355982b78c5SDr. David Alan Gilbert */ 3356982b78c5SDr. David Alan Gilbert VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet, 3357982b78c5SDr. David Alan Gilbert 0, mac_table_fits, mac_table.in_use, 3358982b78c5SDr. David Alan Gilbert ETH_ALEN), 3359982b78c5SDr. David Alan Gilbert VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0, 3360982b78c5SDr. David Alan Gilbert mac_table.in_use, ETH_ALEN), 3361982b78c5SDr. David Alan Gilbert 3362982b78c5SDr. David Alan Gilbert /* Note: This is an array of uint32's that's always been saved as a 3363982b78c5SDr. David Alan Gilbert * buffer; hold onto your endiannesses; it's actually used as a bitmap 3364982b78c5SDr. David Alan Gilbert * but based on the uint. 3365982b78c5SDr. David Alan Gilbert */ 3366982b78c5SDr. David Alan Gilbert VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3), 3367982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3368982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_vnet), 3369982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet), 3370982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet), 3371982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(alluni, VirtIONet), 3372982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nomulti, VirtIONet), 3373982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nouni, VirtIONet), 3374982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nobcast, VirtIONet), 3375982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3376982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_ufo), 3377441537f1SJason Wang VMSTATE_SINGLE_TEST(max_queue_pairs, VirtIONet, max_queue_pairs_gt_1, 0, 3378982b78c5SDr. David Alan Gilbert vmstate_info_uint16_equal, uint16_t), 3379441537f1SJason Wang VMSTATE_UINT16_TEST(curr_queue_pairs, VirtIONet, max_queue_pairs_gt_1), 3380982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3381982b78c5SDr. David Alan Gilbert vmstate_virtio_net_tx_waiting), 3382982b78c5SDr. David Alan Gilbert VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet, 3383982b78c5SDr. David Alan Gilbert has_ctrl_guest_offloads), 3384982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3385982b78c5SDr. David Alan Gilbert }, 33861de81b42SRichard Henderson .subsections = (const VMStateDescription * const []) { 3387e41b7114SYuri Benditovich &vmstate_virtio_net_rss, 3388e41b7114SYuri Benditovich NULL 3389e41b7114SYuri Benditovich } 3390982b78c5SDr. David Alan Gilbert }; 3391982b78c5SDr. David Alan Gilbert 33926e790746SPaolo Bonzini static NetClientInfo net_virtio_info = { 3393f394b2e2SEric Blake .type = NET_CLIENT_DRIVER_NIC, 33946e790746SPaolo Bonzini .size = sizeof(NICState), 33956e790746SPaolo Bonzini .can_receive = virtio_net_can_receive, 33966e790746SPaolo Bonzini .receive = virtio_net_receive, 33976e790746SPaolo Bonzini .link_status_changed = virtio_net_set_link_status, 3398b1be4280SAmos Kong .query_rx_filter = virtio_net_query_rxfilter, 3399b2c929f0SDr. David Alan Gilbert .announce = virtio_net_announce, 34006e790746SPaolo Bonzini }; 34016e790746SPaolo Bonzini 34026e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx) 34036e790746SPaolo Bonzini { 340417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 340568b0a639SSi-Wei Liu NetClientState *nc; 34066e790746SPaolo Bonzini assert(n->vhost_started); 34071c188fc8SAkihiko Odaki if (!n->multiqueue && idx == 2) { 340868b0a639SSi-Wei Liu /* Must guard against invalid features and bogus queue index 340968b0a639SSi-Wei Liu * from being set by malicious guest, or penetrated through 341068b0a639SSi-Wei Liu * buggy migration stream. 341168b0a639SSi-Wei Liu */ 341268b0a639SSi-Wei Liu if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 341368b0a639SSi-Wei Liu qemu_log_mask(LOG_GUEST_ERROR, 341468b0a639SSi-Wei Liu "%s: bogus vq index ignored\n", __func__); 341568b0a639SSi-Wei Liu return false; 341668b0a639SSi-Wei Liu } 341768b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, n->max_queue_pairs); 341868b0a639SSi-Wei Liu } else { 341968b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, vq2q(idx)); 342068b0a639SSi-Wei Liu } 3421544f0278SCindy Lu /* 3422544f0278SCindy Lu * Add the check for configure interrupt, Use VIRTIO_CONFIG_IRQ_IDX -1 34237e8094f0SAlex Bennée * as the macro of configure interrupt's IDX, If this driver does not 3424544f0278SCindy Lu * support, the function will return false 3425544f0278SCindy Lu */ 3426544f0278SCindy Lu 3427544f0278SCindy Lu if (idx == VIRTIO_CONFIG_IRQ_IDX) { 34288aab0d1dSCindy Lu return vhost_net_config_pending(get_vhost_net(nc->peer)); 3429544f0278SCindy Lu } 3430ed8b4afeSNikolay Nikolaev return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx); 34316e790746SPaolo Bonzini } 34326e790746SPaolo Bonzini 34336e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx, 34346e790746SPaolo Bonzini bool mask) 34356e790746SPaolo Bonzini { 343617a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 343768b0a639SSi-Wei Liu NetClientState *nc; 34386e790746SPaolo Bonzini assert(n->vhost_started); 34391c188fc8SAkihiko Odaki if (!n->multiqueue && idx == 2) { 344068b0a639SSi-Wei Liu /* Must guard against invalid features and bogus queue index 344168b0a639SSi-Wei Liu * from being set by malicious guest, or penetrated through 344268b0a639SSi-Wei Liu * buggy migration stream. 344368b0a639SSi-Wei Liu */ 344468b0a639SSi-Wei Liu if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 344568b0a639SSi-Wei Liu qemu_log_mask(LOG_GUEST_ERROR, 344668b0a639SSi-Wei Liu "%s: bogus vq index ignored\n", __func__); 344768b0a639SSi-Wei Liu return; 344868b0a639SSi-Wei Liu } 344968b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, n->max_queue_pairs); 345068b0a639SSi-Wei Liu } else { 345168b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, vq2q(idx)); 345268b0a639SSi-Wei Liu } 3453544f0278SCindy Lu /* 3454544f0278SCindy Lu *Add the check for configure interrupt, Use VIRTIO_CONFIG_IRQ_IDX -1 34557e8094f0SAlex Bennée * as the macro of configure interrupt's IDX, If this driver does not 3456544f0278SCindy Lu * support, the function will return 3457544f0278SCindy Lu */ 3458544f0278SCindy Lu 3459544f0278SCindy Lu if (idx == VIRTIO_CONFIG_IRQ_IDX) { 34608aab0d1dSCindy Lu vhost_net_config_mask(get_vhost_net(nc->peer), vdev, mask); 3461544f0278SCindy Lu return; 3462544f0278SCindy Lu } 3463544f0278SCindy Lu vhost_net_virtqueue_mask(get_vhost_net(nc->peer), vdev, idx, mask); 34646e790746SPaolo Bonzini } 34656e790746SPaolo Bonzini 3466019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features) 34676e790746SPaolo Bonzini { 34680cd09c3aSCornelia Huck virtio_add_feature(&host_features, VIRTIO_NET_F_MAC); 3469a93e599dSMaxime Coquelin 3470d74c30c8SDaniil Tatianin n->config_size = virtio_get_config_size(&cfg_size_params, host_features); 347117ec5a86SKONRAD Frederic } 34726e790746SPaolo Bonzini 34738a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name, 34748a253ec2SKONRAD Frederic const char *type) 34758a253ec2SKONRAD Frederic { 34768a253ec2SKONRAD Frederic /* 34778a253ec2SKONRAD Frederic * The name can be NULL, the netclient name will be type.x. 34788a253ec2SKONRAD Frederic */ 34798a253ec2SKONRAD Frederic assert(type != NULL); 34808a253ec2SKONRAD Frederic 34818a253ec2SKONRAD Frederic g_free(n->netclient_name); 34828a253ec2SKONRAD Frederic g_free(n->netclient_type); 34838a253ec2SKONRAD Frederic n->netclient_name = g_strdup(name); 34848a253ec2SKONRAD Frederic n->netclient_type = g_strdup(type); 34858a253ec2SKONRAD Frederic } 34868a253ec2SKONRAD Frederic 34870e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev) 34889711cd0dSJens Freimann { 34899711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 34909711cd0dSJens Freimann PCIDevice *pci_dev; 34919711cd0dSJens Freimann Error *err = NULL; 34929711cd0dSJens Freimann 34930e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 34949711cd0dSJens Freimann if (hotplug_ctrl) { 34950e9a65c5SJuan Quintela pci_dev = PCI_DEVICE(dev); 34969711cd0dSJens Freimann pci_dev->partially_hotplugged = true; 34970e9a65c5SJuan Quintela hotplug_handler_unplug_request(hotplug_ctrl, dev, &err); 34989711cd0dSJens Freimann if (err) { 34999711cd0dSJens Freimann error_report_err(err); 35009711cd0dSJens Freimann return false; 35019711cd0dSJens Freimann } 35029711cd0dSJens Freimann } else { 35039711cd0dSJens Freimann return false; 35049711cd0dSJens Freimann } 35059711cd0dSJens Freimann return true; 35069711cd0dSJens Freimann } 35079711cd0dSJens Freimann 35080e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev, 35090e9a65c5SJuan Quintela Error **errp) 35109711cd0dSJens Freimann { 35115a0948d3SMarkus Armbruster Error *err = NULL; 35129711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 35130e9a65c5SJuan Quintela PCIDevice *pdev = PCI_DEVICE(dev); 351478274682SJuan Quintela BusState *primary_bus; 35159711cd0dSJens Freimann 35169711cd0dSJens Freimann if (!pdev->partially_hotplugged) { 35179711cd0dSJens Freimann return true; 35189711cd0dSJens Freimann } 35190e9a65c5SJuan Quintela primary_bus = dev->parent_bus; 352078274682SJuan Quintela if (!primary_bus) { 3521150ab54aSJens Freimann error_setg(errp, "virtio_net: couldn't find primary bus"); 35225a0948d3SMarkus Armbruster return false; 35239711cd0dSJens Freimann } 35240e9a65c5SJuan Quintela qdev_set_parent_bus(dev, primary_bus, &error_abort); 3525e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 35260e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 35279711cd0dSJens Freimann if (hotplug_ctrl) { 35280e9a65c5SJuan Quintela hotplug_handler_pre_plug(hotplug_ctrl, dev, &err); 35295a0948d3SMarkus Armbruster if (err) { 35305a0948d3SMarkus Armbruster goto out; 35315a0948d3SMarkus Armbruster } 35320e9a65c5SJuan Quintela hotplug_handler_plug(hotplug_ctrl, dev, &err); 35339711cd0dSJens Freimann } 3534109c20eaSLaurent Vivier pdev->partially_hotplugged = false; 3535150ab54aSJens Freimann 3536150ab54aSJens Freimann out: 35375a0948d3SMarkus Armbruster error_propagate(errp, err); 35385a0948d3SMarkus Armbruster return !err; 35399711cd0dSJens Freimann } 35409711cd0dSJens Freimann 35419d9babf7SSteve Sistare static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationEvent *e) 35429711cd0dSJens Freimann { 35439711cd0dSJens Freimann bool should_be_hidden; 35449711cd0dSJens Freimann Error *err = NULL; 354507a5d816SJuan Quintela DeviceState *dev = failover_find_primary_device(n); 354607a5d816SJuan Quintela 354707a5d816SJuan Quintela if (!dev) { 354807a5d816SJuan Quintela return; 354907a5d816SJuan Quintela } 35509711cd0dSJens Freimann 3551e2bde83eSJuan Quintela should_be_hidden = qatomic_read(&n->failover_primary_hidden); 35529711cd0dSJens Freimann 35539d9babf7SSteve Sistare if (e->type == MIG_EVENT_PRECOPY_SETUP && !should_be_hidden) { 355407a5d816SJuan Quintela if (failover_unplug_primary(n, dev)) { 355507a5d816SJuan Quintela vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev); 355607a5d816SJuan Quintela qapi_event_send_unplug_primary(dev->id); 3557e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 35589711cd0dSJens Freimann } else { 35599711cd0dSJens Freimann warn_report("couldn't unplug primary device"); 35609711cd0dSJens Freimann } 35619d9babf7SSteve Sistare } else if (e->type == MIG_EVENT_PRECOPY_FAILED) { 3562150ab54aSJens Freimann /* We already unplugged the device let's plug it back */ 356307a5d816SJuan Quintela if (!failover_replug_primary(n, dev, &err)) { 35649711cd0dSJens Freimann if (err) { 35659711cd0dSJens Freimann error_report_err(err); 35669711cd0dSJens Freimann } 35679711cd0dSJens Freimann } 35689711cd0dSJens Freimann } 35699711cd0dSJens Freimann } 35709711cd0dSJens Freimann 35713e775730SSteve Sistare static int virtio_net_migration_state_notifier(NotifierWithReturn *notifier, 35725663dd3fSSteve Sistare MigrationEvent *e, Error **errp) 35739711cd0dSJens Freimann { 35749711cd0dSJens Freimann VirtIONet *n = container_of(notifier, VirtIONet, migration_state); 35759d9babf7SSteve Sistare virtio_net_handle_migration_primary(n, e); 35763e775730SSteve Sistare return 0; 35779711cd0dSJens Freimann } 35789711cd0dSJens Freimann 3579b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener, 3580f3558b1bSKevin Wolf const QDict *device_opts, 3581f3558b1bSKevin Wolf bool from_json, 3582f3558b1bSKevin Wolf Error **errp) 35839711cd0dSJens Freimann { 35849711cd0dSJens Freimann VirtIONet *n = container_of(listener, VirtIONet, primary_listener); 35854f0303aeSJuan Quintela const char *standby_id; 35869711cd0dSJens Freimann 35874d0e59acSJens Freimann if (!device_opts) { 358889631fedSJuan Quintela return false; 35894d0e59acSJens Freimann } 3590bcfc906bSLaurent Vivier 3591bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "failover_pair_id")) { 3592bcfc906bSLaurent Vivier return false; 3593bcfc906bSLaurent Vivier } 3594bcfc906bSLaurent Vivier 3595bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "id")) { 3596bcfc906bSLaurent Vivier error_setg(errp, "Device with failover_pair_id needs to have id"); 3597bcfc906bSLaurent Vivier return false; 3598bcfc906bSLaurent Vivier } 3599bcfc906bSLaurent Vivier 3600bcfc906bSLaurent Vivier standby_id = qdict_get_str(device_opts, "failover_pair_id"); 360189631fedSJuan Quintela if (g_strcmp0(standby_id, n->netclient_name) != 0) { 360289631fedSJuan Quintela return false; 36039711cd0dSJens Freimann } 36049711cd0dSJens Freimann 36057fe7791eSLaurent Vivier /* 36067fe7791eSLaurent Vivier * The hide helper can be called several times for a given device. 36077fe7791eSLaurent Vivier * Check there is only one primary for a virtio-net device but 36087fe7791eSLaurent Vivier * don't duplicate the qdict several times if it's called for the same 36097fe7791eSLaurent Vivier * device. 36107fe7791eSLaurent Vivier */ 3611259a10dbSKevin Wolf if (n->primary_opts) { 36127fe7791eSLaurent Vivier const char *old, *new; 36137fe7791eSLaurent Vivier /* devices with failover_pair_id always have an id */ 36147fe7791eSLaurent Vivier old = qdict_get_str(n->primary_opts, "id"); 36157fe7791eSLaurent Vivier new = qdict_get_str(device_opts, "id"); 36167fe7791eSLaurent Vivier if (strcmp(old, new) != 0) { 36177fe7791eSLaurent Vivier error_setg(errp, "Cannot attach more than one primary device to " 36187fe7791eSLaurent Vivier "'%s': '%s' and '%s'", n->netclient_name, old, new); 3619259a10dbSKevin Wolf return false; 3620259a10dbSKevin Wolf } 36217fe7791eSLaurent Vivier } else { 3622f3558b1bSKevin Wolf n->primary_opts = qdict_clone_shallow(device_opts); 3623f3558b1bSKevin Wolf n->primary_opts_from_json = from_json; 36247fe7791eSLaurent Vivier } 3625259a10dbSKevin Wolf 3626e2bde83eSJuan Quintela /* failover_primary_hidden is set during feature negotiation */ 36273abad4a2SJuan Quintela return qatomic_read(&n->failover_primary_hidden); 36289711cd0dSJens Freimann } 36299711cd0dSJens Freimann 3630e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp) 363117ec5a86SKONRAD Frederic { 3632e6f746b3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3633284a32f0SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3634284a32f0SAndreas Färber NetClientState *nc; 36351773d9eeSKONRAD Frederic int i; 363617ec5a86SKONRAD Frederic 3637a93e599dSMaxime Coquelin if (n->net_conf.mtu) { 3638127833eeSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_MTU); 3639a93e599dSMaxime Coquelin } 3640a93e599dSMaxime Coquelin 36419473939eSJason Baron if (n->net_conf.duplex_str) { 36429473939eSJason Baron if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) { 36439473939eSJason Baron n->net_conf.duplex = DUPLEX_HALF; 36449473939eSJason Baron } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) { 36459473939eSJason Baron n->net_conf.duplex = DUPLEX_FULL; 36469473939eSJason Baron } else { 36479473939eSJason Baron error_setg(errp, "'duplex' must be 'half' or 'full'"); 3648843c4cfcSMarkus Armbruster return; 36499473939eSJason Baron } 36509473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 36519473939eSJason Baron } else { 36529473939eSJason Baron n->net_conf.duplex = DUPLEX_UNKNOWN; 36539473939eSJason Baron } 36549473939eSJason Baron 36559473939eSJason Baron if (n->net_conf.speed < SPEED_UNKNOWN) { 36569473939eSJason Baron error_setg(errp, "'speed' must be between 0 and INT_MAX"); 3657843c4cfcSMarkus Armbruster return; 3658843c4cfcSMarkus Armbruster } 3659843c4cfcSMarkus Armbruster if (n->net_conf.speed >= 0) { 36609473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 36619473939eSJason Baron } 36629473939eSJason Baron 36639711cd0dSJens Freimann if (n->failover) { 3664b91ad981SJuan Quintela n->primary_listener.hide_device = failover_hide_primary_device; 3665e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 36669711cd0dSJens Freimann device_listener_register(&n->primary_listener); 3667d9cda213SSteve Sistare migration_add_notifier(&n->migration_state, 3668d9cda213SSteve Sistare virtio_net_migration_state_notifier); 36699711cd0dSJens Freimann n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY); 36709711cd0dSJens Freimann } 36719711cd0dSJens Freimann 3672da3e8a23SShannon Zhao virtio_net_set_config_size(n, n->host_features); 36733857cd5cSJonah Palmer virtio_init(vdev, VIRTIO_ID_NET, n->config_size); 367417ec5a86SKONRAD Frederic 36751c0fbfa3SMichael S. Tsirkin /* 36761c0fbfa3SMichael S. Tsirkin * We set a lower limit on RX queue size to what it always was. 36771c0fbfa3SMichael S. Tsirkin * Guests that want a smaller ring can always resize it without 36781c0fbfa3SMichael S. Tsirkin * help from us (using virtio 1 and up). 36791c0fbfa3SMichael S. Tsirkin */ 36801c0fbfa3SMichael S. Tsirkin if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE || 36811c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE || 36825f997fd1SMichal Privoznik !is_power_of_2(n->net_conf.rx_queue_size)) { 36831c0fbfa3SMichael S. Tsirkin error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), " 36841c0fbfa3SMichael S. Tsirkin "must be a power of 2 between %d and %d.", 36851c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE, 36861c0fbfa3SMichael S. Tsirkin VIRTQUEUE_MAX_SIZE); 36871c0fbfa3SMichael S. Tsirkin virtio_cleanup(vdev); 36881c0fbfa3SMichael S. Tsirkin return; 36891c0fbfa3SMichael S. Tsirkin } 36901c0fbfa3SMichael S. Tsirkin 36919b02e161SWei Wang if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE || 36924271f403SLaurent Vivier n->net_conf.tx_queue_size > virtio_net_max_tx_queue_size(n) || 36939b02e161SWei Wang !is_power_of_2(n->net_conf.tx_queue_size)) { 36949b02e161SWei Wang error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), " 36959b02e161SWei Wang "must be a power of 2 between %d and %d", 36969b02e161SWei Wang n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE, 36974271f403SLaurent Vivier virtio_net_max_tx_queue_size(n)); 36989b02e161SWei Wang virtio_cleanup(vdev); 36999b02e161SWei Wang return; 37009b02e161SWei Wang } 37019b02e161SWei Wang 370222288fe5SJason Wang n->max_ncs = MAX(n->nic_conf.peers.queues, 1); 370322288fe5SJason Wang 370422288fe5SJason Wang /* 370522288fe5SJason Wang * Figure out the datapath queue pairs since the backend could 370622288fe5SJason Wang * provide control queue via peers as well. 370722288fe5SJason Wang */ 370822288fe5SJason Wang if (n->nic_conf.peers.queues) { 370922288fe5SJason Wang for (i = 0; i < n->max_ncs; i++) { 371022288fe5SJason Wang if (n->nic_conf.peers.ncs[i]->is_datapath) { 371122288fe5SJason Wang ++n->max_queue_pairs; 371222288fe5SJason Wang } 371322288fe5SJason Wang } 371422288fe5SJason Wang } 371522288fe5SJason Wang n->max_queue_pairs = MAX(n->max_queue_pairs, 1); 371622288fe5SJason Wang 3717441537f1SJason Wang if (n->max_queue_pairs * 2 + 1 > VIRTIO_QUEUE_MAX) { 371822288fe5SJason Wang error_setg(errp, "Invalid number of queue pairs (= %" PRIu32 "), " 3719631b22eaSStefan Weil "must be a positive integer less than %d.", 3720441537f1SJason Wang n->max_queue_pairs, (VIRTIO_QUEUE_MAX - 1) / 2); 37217e0e736eSJason Wang virtio_cleanup(vdev); 37227e0e736eSJason Wang return; 37237e0e736eSJason Wang } 3724b21e2380SMarkus Armbruster n->vqs = g_new0(VirtIONetQueue, n->max_queue_pairs); 3725441537f1SJason Wang n->curr_queue_pairs = 1; 37261773d9eeSKONRAD Frederic n->tx_timeout = n->net_conf.txtimer; 37276e790746SPaolo Bonzini 37281773d9eeSKONRAD Frederic if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer") 37291773d9eeSKONRAD Frederic && strcmp(n->net_conf.tx, "bh")) { 37300765691eSMarkus Armbruster warn_report("virtio-net: " 37316e790746SPaolo Bonzini "Unknown option tx=%s, valid options: \"timer\" \"bh\"", 37321773d9eeSKONRAD Frederic n->net_conf.tx); 37330765691eSMarkus Armbruster error_printf("Defaulting to \"bh\""); 37346e790746SPaolo Bonzini } 37356e790746SPaolo Bonzini 37362eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n), 37372eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size); 37389b02e161SWei Wang 37398c497568SAkihiko Odaki virtio_net_add_queue(n, 0); 3740da51a335SJason Wang 374117a0ca55SKONRAD Frederic n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 37421773d9eeSKONRAD Frederic qemu_macaddr_default_if_unset(&n->nic_conf.macaddr); 37431773d9eeSKONRAD Frederic memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac)); 37446e790746SPaolo Bonzini n->status = VIRTIO_NET_S_LINK_UP; 37459d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 37469d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 3747f57fcf70SJason Wang virtio_net_announce_timer, n); 3748b2c929f0SDr. David Alan Gilbert n->announce_timer.round = 0; 37496e790746SPaolo Bonzini 37508a253ec2SKONRAD Frederic if (n->netclient_type) { 37518a253ec2SKONRAD Frederic /* 37528a253ec2SKONRAD Frederic * Happen when virtio_net_set_netclient_name has been called. 37538a253ec2SKONRAD Frederic */ 37548a253ec2SKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 37557d0fefdfSAkihiko Odaki n->netclient_type, n->netclient_name, 37567d0fefdfSAkihiko Odaki &dev->mem_reentrancy_guard, n); 37578a253ec2SKONRAD Frederic } else { 37581773d9eeSKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 37597d0fefdfSAkihiko Odaki object_get_typename(OBJECT(dev)), dev->id, 37607d0fefdfSAkihiko Odaki &dev->mem_reentrancy_guard, n); 37618a253ec2SKONRAD Frederic } 37628a253ec2SKONRAD Frederic 3763441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3764d4c62930SBin Meng n->nic->ncs[i].do_not_pad = true; 3765d4c62930SBin Meng } 3766d4c62930SBin Meng 37676e790746SPaolo Bonzini peer_test_vnet_hdr(n); 37686e790746SPaolo Bonzini if (peer_has_vnet_hdr(n)) { 37696e790746SPaolo Bonzini n->host_hdr_len = sizeof(struct virtio_net_hdr); 37706e790746SPaolo Bonzini } else { 37716e790746SPaolo Bonzini n->host_hdr_len = 0; 37726e790746SPaolo Bonzini } 37736e790746SPaolo Bonzini 37741773d9eeSKONRAD Frederic qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a); 37756e790746SPaolo Bonzini 37766e790746SPaolo Bonzini n->vqs[0].tx_waiting = 0; 37771773d9eeSKONRAD Frederic n->tx_burst = n->net_conf.txburst; 3778e22f0603SYuri Benditovich virtio_net_set_mrg_rx_bufs(n, 0, 0, 0); 37796e790746SPaolo Bonzini n->promisc = 1; /* for compatibility */ 37806e790746SPaolo Bonzini 37816e790746SPaolo Bonzini n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 37826e790746SPaolo Bonzini 37836e790746SPaolo Bonzini n->vlans = g_malloc0(MAX_VLAN >> 3); 37846e790746SPaolo Bonzini 3785b1be4280SAmos Kong nc = qemu_get_queue(n->nic); 3786b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 3787b1be4280SAmos Kong 3788e87936eaSCindy Lu if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 3789e87936eaSCindy Lu struct virtio_net_config netcfg = {}; 3790e87936eaSCindy Lu memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN); 3791e87936eaSCindy Lu vhost_net_set_config(get_vhost_net(nc->peer), 3792f8ed3648SManos Pitsidianakis (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_FRONTEND); 3793e87936eaSCindy Lu } 37942974e916SYuri Benditovich QTAILQ_INIT(&n->rsc_chains); 3795284a32f0SAndreas Färber n->qdev = dev; 37964474e37aSYuri Benditovich 3797aac8f89dSAkihiko Odaki net_rx_pkt_init(&n->rx_pkt); 37980145c393SAndrew Melnychenko 37990145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 3800283be596SAkihiko Odaki virtio_net_load_ebpf(n); 38010145c393SAndrew Melnychenko } 380217ec5a86SKONRAD Frederic } 380317ec5a86SKONRAD Frederic 3804b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev) 380517ec5a86SKONRAD Frederic { 3806306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3807306ec6c3SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3808441537f1SJason Wang int i, max_queue_pairs; 380917ec5a86SKONRAD Frederic 38100145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 38110145c393SAndrew Melnychenko virtio_net_unload_ebpf(n); 38120145c393SAndrew Melnychenko } 38130145c393SAndrew Melnychenko 381417ec5a86SKONRAD Frederic /* This will stop vhost backend if appropriate. */ 381517ec5a86SKONRAD Frederic virtio_net_set_status(vdev, 0); 381617ec5a86SKONRAD Frederic 38178a253ec2SKONRAD Frederic g_free(n->netclient_name); 38188a253ec2SKONRAD Frederic n->netclient_name = NULL; 38198a253ec2SKONRAD Frederic g_free(n->netclient_type); 38208a253ec2SKONRAD Frederic n->netclient_type = NULL; 38218a253ec2SKONRAD Frederic 382217ec5a86SKONRAD Frederic g_free(n->mac_table.macs); 382317ec5a86SKONRAD Frederic g_free(n->vlans); 382417ec5a86SKONRAD Frederic 38259711cd0dSJens Freimann if (n->failover) { 3826f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 382765018100SJuan Quintela device_listener_unregister(&n->primary_listener); 3828d9cda213SSteve Sistare migration_remove_notifier(&n->migration_state); 3829f3558b1bSKevin Wolf } else { 3830f3558b1bSKevin Wolf assert(n->primary_opts == NULL); 38319711cd0dSJens Freimann } 38329711cd0dSJens Freimann 3833441537f1SJason Wang max_queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3834441537f1SJason Wang for (i = 0; i < max_queue_pairs; i++) { 3835f9d6dbf0SWen Congyang virtio_net_del_queue(n, i); 383617ec5a86SKONRAD Frederic } 3837d945d9f1SYuri Benditovich /* delete also control vq */ 3838441537f1SJason Wang virtio_del_queue(vdev, max_queue_pairs * 2); 3839944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 384017ec5a86SKONRAD Frederic g_free(n->vqs); 384117ec5a86SKONRAD Frederic qemu_del_nic(n->nic); 38422974e916SYuri Benditovich virtio_net_rsc_cleanup(n); 384359079029SYuri Benditovich g_free(n->rss_data.indirections_table); 38444474e37aSYuri Benditovich net_rx_pkt_uninit(n->rx_pkt); 38456a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 384617ec5a86SKONRAD Frederic } 384717ec5a86SKONRAD Frederic 384817ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj) 384917ec5a86SKONRAD Frederic { 385017ec5a86SKONRAD Frederic VirtIONet *n = VIRTIO_NET(obj); 385117ec5a86SKONRAD Frederic 385217ec5a86SKONRAD Frederic /* 385317ec5a86SKONRAD Frederic * The default config_size is sizeof(struct virtio_net_config). 38542431f4f1SMichael Tokarev * Can be overridden with virtio_net_set_config_size. 385517ec5a86SKONRAD Frederic */ 385617ec5a86SKONRAD Frederic n->config_size = sizeof(struct virtio_net_config); 3857aa4197c3SGonglei device_add_bootindex_property(obj, &n->nic_conf.bootindex, 3858aa4197c3SGonglei "bootindex", "/ethernet-phy@0", 385940c2281cSMarkus Armbruster DEVICE(n)); 38600145c393SAndrew Melnychenko 38610145c393SAndrew Melnychenko ebpf_rss_init(&n->ebpf_rss); 386217ec5a86SKONRAD Frederic } 386317ec5a86SKONRAD Frederic 386444b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque) 38654d45dcfbSHalil Pasic { 38664d45dcfbSHalil Pasic VirtIONet *n = opaque; 38674d45dcfbSHalil Pasic 38684d45dcfbSHalil Pasic /* At this point, backend must be stopped, otherwise 38694d45dcfbSHalil Pasic * it might keep writing to memory. */ 38704d45dcfbSHalil Pasic assert(!n->vhost_started); 387144b1ff31SDr. David Alan Gilbert 387244b1ff31SDr. David Alan Gilbert return 0; 38734d45dcfbSHalil Pasic } 38744d45dcfbSHalil Pasic 38759711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque) 38769711cd0dSJens Freimann { 38779711cd0dSJens Freimann DeviceState *dev = opaque; 387821e8709bSJuan Quintela DeviceState *primary; 38799711cd0dSJens Freimann VirtIODevice *vdev = VIRTIO_DEVICE(dev); 38809711cd0dSJens Freimann VirtIONet *n = VIRTIO_NET(vdev); 38819711cd0dSJens Freimann 3882284f42a5SJens Freimann if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) { 3883284f42a5SJens Freimann return false; 3884284f42a5SJens Freimann } 388521e8709bSJuan Quintela primary = failover_find_primary_device(n); 388621e8709bSJuan Quintela return primary ? primary->pending_deleted_event : false; 38879711cd0dSJens Freimann } 38889711cd0dSJens Freimann 38899711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque) 38909711cd0dSJens Freimann { 38919711cd0dSJens Freimann DeviceState *dev = opaque; 38929711cd0dSJens Freimann VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev); 38939711cd0dSJens Freimann 38949711cd0dSJens Freimann return vdc->primary_unplug_pending(dev); 38959711cd0dSJens Freimann } 38969711cd0dSJens Freimann 3897c255488dSJonah Palmer static struct vhost_dev *virtio_net_get_vhost(VirtIODevice *vdev) 3898c255488dSJonah Palmer { 3899c255488dSJonah Palmer VirtIONet *n = VIRTIO_NET(vdev); 3900c255488dSJonah Palmer NetClientState *nc = qemu_get_queue(n->nic); 3901c255488dSJonah Palmer struct vhost_net *net = get_vhost_net(nc->peer); 3902c255488dSJonah Palmer return &net->dev; 3903c255488dSJonah Palmer } 3904c255488dSJonah Palmer 39054d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = { 39064d45dcfbSHalil Pasic .name = "virtio-net", 39074d45dcfbSHalil Pasic .minimum_version_id = VIRTIO_NET_VM_VERSION, 39084d45dcfbSHalil Pasic .version_id = VIRTIO_NET_VM_VERSION, 39091de81b42SRichard Henderson .fields = (const VMStateField[]) { 39104d45dcfbSHalil Pasic VMSTATE_VIRTIO_DEVICE, 39114d45dcfbSHalil Pasic VMSTATE_END_OF_LIST() 39124d45dcfbSHalil Pasic }, 39134d45dcfbSHalil Pasic .pre_save = virtio_net_pre_save, 39149711cd0dSJens Freimann .dev_unplug_pending = dev_unplug_pending, 39154d45dcfbSHalil Pasic }; 3916290c2428SDr. David Alan Gilbert 391717ec5a86SKONRAD Frederic static Property virtio_net_properties[] = { 3918127833eeSJason Baron DEFINE_PROP_BIT64("csum", VirtIONet, host_features, 3919127833eeSJason Baron VIRTIO_NET_F_CSUM, true), 3920127833eeSJason Baron DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features, 392187108bb2SShannon Zhao VIRTIO_NET_F_GUEST_CSUM, true), 3922127833eeSJason Baron DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true), 3923127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features, 392487108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO4, true), 3925127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features, 392687108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO6, true), 3927127833eeSJason Baron DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features, 392887108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ECN, true), 3929127833eeSJason Baron DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features, 393087108bb2SShannon Zhao VIRTIO_NET_F_GUEST_UFO, true), 3931127833eeSJason Baron DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features, 393287108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ANNOUNCE, true), 3933127833eeSJason Baron DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features, 393487108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO4, true), 3935127833eeSJason Baron DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features, 393687108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO6, true), 3937127833eeSJason Baron DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features, 393887108bb2SShannon Zhao VIRTIO_NET_F_HOST_ECN, true), 3939127833eeSJason Baron DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features, 394087108bb2SShannon Zhao VIRTIO_NET_F_HOST_UFO, true), 3941127833eeSJason Baron DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features, 394287108bb2SShannon Zhao VIRTIO_NET_F_MRG_RXBUF, true), 3943127833eeSJason Baron DEFINE_PROP_BIT64("status", VirtIONet, host_features, 394487108bb2SShannon Zhao VIRTIO_NET_F_STATUS, true), 3945127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features, 394687108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VQ, true), 3947127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features, 394887108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX, true), 3949127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features, 395087108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VLAN, true), 3951127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features, 395287108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX_EXTRA, true), 3953127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features, 395487108bb2SShannon Zhao VIRTIO_NET_F_CTRL_MAC_ADDR, true), 3955127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features, 395687108bb2SShannon Zhao VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true), 3957127833eeSJason Baron DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false), 395859079029SYuri Benditovich DEFINE_PROP_BIT64("rss", VirtIONet, host_features, 395959079029SYuri Benditovich VIRTIO_NET_F_RSS, false), 3960e22f0603SYuri Benditovich DEFINE_PROP_BIT64("hash", VirtIONet, host_features, 3961e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT, false), 39626b230b7dSAndrew Melnychenko DEFINE_PROP_ARRAY("ebpf-rss-fds", VirtIONet, nr_ebpf_rss_fds, 39636b230b7dSAndrew Melnychenko ebpf_rss_fds, qdev_prop_string, char*), 39642974e916SYuri Benditovich DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features, 39652974e916SYuri Benditovich VIRTIO_NET_F_RSC_EXT, false), 39662974e916SYuri Benditovich DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout, 39672974e916SYuri Benditovich VIRTIO_NET_RSC_DEFAULT_INTERVAL), 396817ec5a86SKONRAD Frederic DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf), 396917ec5a86SKONRAD Frederic DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer, 397017ec5a86SKONRAD Frederic TX_TIMER_INTERVAL), 397117ec5a86SKONRAD Frederic DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST), 397217ec5a86SKONRAD Frederic DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx), 39731c0fbfa3SMichael S. Tsirkin DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size, 39741c0fbfa3SMichael S. Tsirkin VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE), 39759b02e161SWei Wang DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size, 39769b02e161SWei Wang VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE), 3977a93e599dSMaxime Coquelin DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0), 397875ebec11SMaxime Coquelin DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend, 397975ebec11SMaxime Coquelin true), 39809473939eSJason Baron DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN), 39819473939eSJason Baron DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str), 39829711cd0dSJens Freimann DEFINE_PROP_BOOL("failover", VirtIONet, failover, false), 398353da8b5aSYuri Benditovich DEFINE_PROP_BIT64("guest_uso4", VirtIONet, host_features, 398453da8b5aSYuri Benditovich VIRTIO_NET_F_GUEST_USO4, true), 398553da8b5aSYuri Benditovich DEFINE_PROP_BIT64("guest_uso6", VirtIONet, host_features, 398653da8b5aSYuri Benditovich VIRTIO_NET_F_GUEST_USO6, true), 398753da8b5aSYuri Benditovich DEFINE_PROP_BIT64("host_uso", VirtIONet, host_features, 398853da8b5aSYuri Benditovich VIRTIO_NET_F_HOST_USO, true), 398917ec5a86SKONRAD Frederic DEFINE_PROP_END_OF_LIST(), 399017ec5a86SKONRAD Frederic }; 399117ec5a86SKONRAD Frederic 399217ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data) 399317ec5a86SKONRAD Frederic { 399417ec5a86SKONRAD Frederic DeviceClass *dc = DEVICE_CLASS(klass); 399517ec5a86SKONRAD Frederic VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 3996e6f746b3SAndreas Färber 39974f67d30bSMarc-André Lureau device_class_set_props(dc, virtio_net_properties); 3998290c2428SDr. David Alan Gilbert dc->vmsd = &vmstate_virtio_net; 3999125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_NETWORK, dc->categories); 4000e6f746b3SAndreas Färber vdc->realize = virtio_net_device_realize; 4001306ec6c3SAndreas Färber vdc->unrealize = virtio_net_device_unrealize; 400217ec5a86SKONRAD Frederic vdc->get_config = virtio_net_get_config; 400317ec5a86SKONRAD Frederic vdc->set_config = virtio_net_set_config; 400417ec5a86SKONRAD Frederic vdc->get_features = virtio_net_get_features; 400517ec5a86SKONRAD Frederic vdc->set_features = virtio_net_set_features; 400617ec5a86SKONRAD Frederic vdc->bad_features = virtio_net_bad_features; 400717ec5a86SKONRAD Frederic vdc->reset = virtio_net_reset; 40087dc6be52SXuan Zhuo vdc->queue_reset = virtio_net_queue_reset; 40097f863302SKangjie Xu vdc->queue_enable = virtio_net_queue_enable; 401017ec5a86SKONRAD Frederic vdc->set_status = virtio_net_set_status; 401117ec5a86SKONRAD Frederic vdc->guest_notifier_mask = virtio_net_guest_notifier_mask; 401217ec5a86SKONRAD Frederic vdc->guest_notifier_pending = virtio_net_guest_notifier_pending; 40132a083ffdSMichael S. Tsirkin vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO); 40147788c3f2SMikhail Sennikovsky vdc->post_load = virtio_net_post_load_virtio; 4015982b78c5SDr. David Alan Gilbert vdc->vmsd = &vmstate_virtio_net_device; 40169711cd0dSJens Freimann vdc->primary_unplug_pending = primary_unplug_pending; 4017c255488dSJonah Palmer vdc->get_vhost = virtio_net_get_vhost; 4018cd9b8346SViktor Prutyanov vdc->toggle_device_iotlb = vhost_toggle_device_iotlb; 401917ec5a86SKONRAD Frederic } 402017ec5a86SKONRAD Frederic 402117ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = { 402217ec5a86SKONRAD Frederic .name = TYPE_VIRTIO_NET, 402317ec5a86SKONRAD Frederic .parent = TYPE_VIRTIO_DEVICE, 402417ec5a86SKONRAD Frederic .instance_size = sizeof(VirtIONet), 402517ec5a86SKONRAD Frederic .instance_init = virtio_net_instance_init, 402617ec5a86SKONRAD Frederic .class_init = virtio_net_class_init, 402717ec5a86SKONRAD Frederic }; 402817ec5a86SKONRAD Frederic 402917ec5a86SKONRAD Frederic static void virtio_register_types(void) 403017ec5a86SKONRAD Frederic { 403117ec5a86SKONRAD Frederic type_register_static(&virtio_net_info); 403217ec5a86SKONRAD Frederic } 403317ec5a86SKONRAD Frederic 403417ec5a86SKONRAD Frederic type_init(virtio_register_types) 4035