16e790746SPaolo Bonzini /* 26e790746SPaolo Bonzini * Virtio Network Device 36e790746SPaolo Bonzini * 46e790746SPaolo Bonzini * Copyright IBM, Corp. 2007 56e790746SPaolo Bonzini * 66e790746SPaolo Bonzini * Authors: 76e790746SPaolo Bonzini * Anthony Liguori <aliguori@us.ibm.com> 86e790746SPaolo Bonzini * 96e790746SPaolo Bonzini * This work is licensed under the terms of the GNU GPL, version 2. See 106e790746SPaolo Bonzini * the COPYING file in the top-level directory. 116e790746SPaolo Bonzini * 126e790746SPaolo Bonzini */ 136e790746SPaolo Bonzini 149b8bfe21SPeter Maydell #include "qemu/osdep.h" 159711cd0dSJens Freimann #include "qemu/atomic.h" 166e790746SPaolo Bonzini #include "qemu/iov.h" 1768b0a639SSi-Wei Liu #include "qemu/log.h" 18db725815SMarkus Armbruster #include "qemu/main-loop.h" 190b8fa32fSMarkus Armbruster #include "qemu/module.h" 206e790746SPaolo Bonzini #include "hw/virtio/virtio.h" 216e790746SPaolo Bonzini #include "net/net.h" 226e790746SPaolo Bonzini #include "net/checksum.h" 236e790746SPaolo Bonzini #include "net/tap.h" 246e790746SPaolo Bonzini #include "qemu/error-report.h" 256e790746SPaolo Bonzini #include "qemu/timer.h" 269711cd0dSJens Freimann #include "qemu/option.h" 279711cd0dSJens Freimann #include "qemu/option_int.h" 289711cd0dSJens Freimann #include "qemu/config-file.h" 299711cd0dSJens Freimann #include "qapi/qmp/qdict.h" 306e790746SPaolo Bonzini #include "hw/virtio/virtio-net.h" 316e790746SPaolo Bonzini #include "net/vhost_net.h" 329d8c6a25SDr. David Alan Gilbert #include "net/announce.h" 3317ec5a86SKONRAD Frederic #include "hw/virtio/virtio-bus.h" 34e688df6bSMarkus Armbruster #include "qapi/error.h" 359af23989SMarkus Armbruster #include "qapi/qapi-events-net.h" 36a27bd6c7SMarkus Armbruster #include "hw/qdev-properties.h" 379711cd0dSJens Freimann #include "qapi/qapi-types-migration.h" 389711cd0dSJens Freimann #include "qapi/qapi-events-migration.h" 391399c60dSRusty Russell #include "hw/virtio/virtio-access.h" 40f8d806c9SJuan Quintela #include "migration/misc.h" 419473939eSJason Baron #include "standard-headers/linux/ethtool.h" 422f780b6aSMarkus Armbruster #include "sysemu/sysemu.h" 43a0bf401bSNicholas Piggin #include "sysemu/replay.h" 449d8c6a25SDr. David Alan Gilbert #include "trace.h" 459711cd0dSJens Freimann #include "monitor/qdev.h" 466b230b7dSAndrew Melnychenko #include "monitor/monitor.h" 47edf5ca5dSMarkus Armbruster #include "hw/pci/pci_device.h" 484474e37aSYuri Benditovich #include "net_rx_pkt.h" 49108a6481SCindy Lu #include "hw/virtio/vhost.h" 501b529d90SLaurent Vivier #include "sysemu/qtest.h" 516e790746SPaolo Bonzini 526e790746SPaolo Bonzini #define VIRTIO_NET_VM_VERSION 11 536e790746SPaolo Bonzini 541c0fbfa3SMichael S. Tsirkin /* previously fixed value */ 551c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256 569b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 256 579b02e161SWei Wang 58441537f1SJason Wang /* for now, only allow larger queue_pairs; with virtio-1, guest can downsize */ 591c0fbfa3SMichael S. Tsirkin #define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 609b02e161SWei Wang #define VIRTIO_NET_TX_QUEUE_MIN_SIZE VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE 611c0fbfa3SMichael S. Tsirkin 622974e916SYuri Benditovich #define VIRTIO_NET_IP4_ADDR_SIZE 8 /* ipv4 saddr + daddr */ 632974e916SYuri Benditovich 642974e916SYuri Benditovich #define VIRTIO_NET_TCP_FLAG 0x3F 652974e916SYuri Benditovich #define VIRTIO_NET_TCP_HDR_LENGTH 0xF000 662974e916SYuri Benditovich 672974e916SYuri Benditovich /* IPv4 max payload, 16 bits in the header */ 682974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP4_PAYLOAD (65535 - sizeof(struct ip_header)) 692974e916SYuri Benditovich #define VIRTIO_NET_MAX_TCP_PAYLOAD 65535 702974e916SYuri Benditovich 712974e916SYuri Benditovich /* header length value in ip header without option */ 722974e916SYuri Benditovich #define VIRTIO_NET_IP4_HEADER_LENGTH 5 732974e916SYuri Benditovich 742974e916SYuri Benditovich #define VIRTIO_NET_IP6_ADDR_SIZE 32 /* ipv6 saddr + daddr */ 752974e916SYuri Benditovich #define VIRTIO_NET_MAX_IP6_PAYLOAD VIRTIO_NET_MAX_TCP_PAYLOAD 762974e916SYuri Benditovich 772974e916SYuri Benditovich /* Purge coalesced packets timer interval, This value affects the performance 782974e916SYuri Benditovich a lot, and should be tuned carefully, '300000'(300us) is the recommended 792974e916SYuri Benditovich value to pass the WHQL test, '50000' can gain 2x netperf throughput with 802974e916SYuri Benditovich tso/gso/gro 'off'. */ 812974e916SYuri Benditovich #define VIRTIO_NET_RSC_DEFAULT_INTERVAL 300000 822974e916SYuri Benditovich 8359079029SYuri Benditovich #define VIRTIO_NET_RSS_SUPPORTED_HASHES (VIRTIO_NET_RSS_HASH_TYPE_IPv4 | \ 8459079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv4 | \ 8559079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv4 | \ 8659079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IPv6 | \ 8759079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCPv6 | \ 8859079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDPv6 | \ 8959079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_IP_EX | \ 9059079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_TCP_EX | \ 9159079029SYuri Benditovich VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) 9259079029SYuri Benditovich 93ad6461adSPhilippe Mathieu-Daudé static const VirtIOFeature feature_sizes[] = { 94127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MAC, 955d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mac)}, 96127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_STATUS, 975d5b33c0SMax Reitz .end = endof(struct virtio_net_config, status)}, 98127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MQ, 995d5b33c0SMax Reitz .end = endof(struct virtio_net_config, max_virtqueue_pairs)}, 100127833eeSJason Baron {.flags = 1ULL << VIRTIO_NET_F_MTU, 1015d5b33c0SMax Reitz .end = endof(struct virtio_net_config, mtu)}, 1029473939eSJason Baron {.flags = 1ULL << VIRTIO_NET_F_SPEED_DUPLEX, 1035d5b33c0SMax Reitz .end = endof(struct virtio_net_config, duplex)}, 104e22f0603SYuri Benditovich {.flags = (1ULL << VIRTIO_NET_F_RSS) | (1ULL << VIRTIO_NET_F_HASH_REPORT), 10559079029SYuri Benditovich .end = endof(struct virtio_net_config, supported_hash_types)}, 1066e790746SPaolo Bonzini {} 1076e790746SPaolo Bonzini }; 1086e790746SPaolo Bonzini 109d74c30c8SDaniil Tatianin static const VirtIOConfigSizeParams cfg_size_params = { 110d74c30c8SDaniil Tatianin .min_size = endof(struct virtio_net_config, mac), 111d74c30c8SDaniil Tatianin .max_size = sizeof(struct virtio_net_config), 112d74c30c8SDaniil Tatianin .feature_sizes = feature_sizes 113d74c30c8SDaniil Tatianin }; 114d74c30c8SDaniil Tatianin 1156e790746SPaolo Bonzini static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc) 1166e790746SPaolo Bonzini { 1176e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1186e790746SPaolo Bonzini 1196e790746SPaolo Bonzini return &n->vqs[nc->queue_index]; 1206e790746SPaolo Bonzini } 1216e790746SPaolo Bonzini 1226e790746SPaolo Bonzini static int vq2q(int queue_index) 1236e790746SPaolo Bonzini { 1246e790746SPaolo Bonzini return queue_index / 2; 1256e790746SPaolo Bonzini } 1266e790746SPaolo Bonzini 1274fdf69abSKangjie Xu static void flush_or_purge_queued_packets(NetClientState *nc) 1284fdf69abSKangjie Xu { 1294fdf69abSKangjie Xu if (!nc->peer) { 1304fdf69abSKangjie Xu return; 1314fdf69abSKangjie Xu } 1324fdf69abSKangjie Xu 1334fdf69abSKangjie Xu qemu_flush_or_purge_queued_packets(nc->peer, true); 1344fdf69abSKangjie Xu assert(!virtio_net_get_subqueue(nc)->async_tx.elem); 1354fdf69abSKangjie Xu } 1364fdf69abSKangjie Xu 1376e790746SPaolo Bonzini /* TODO 1386e790746SPaolo Bonzini * - we could suppress RX interrupt if we were so inclined. 1396e790746SPaolo Bonzini */ 1406e790746SPaolo Bonzini 1416e790746SPaolo Bonzini static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config) 1426e790746SPaolo Bonzini { 14317a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1446e790746SPaolo Bonzini struct virtio_net_config netcfg; 145c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 146fb592882SCindy Lu static const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } }; 1476e790746SPaolo Bonzini 148108a6481SCindy Lu int ret = 0; 149108a6481SCindy Lu memset(&netcfg, 0 , sizeof(struct virtio_net_config)); 1501399c60dSRusty Russell virtio_stw_p(vdev, &netcfg.status, n->status); 151441537f1SJason Wang virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queue_pairs); 152a93e599dSMaxime Coquelin virtio_stw_p(vdev, &netcfg.mtu, n->net_conf.mtu); 1536e790746SPaolo Bonzini memcpy(netcfg.mac, n->mac, ETH_ALEN); 1549473939eSJason Baron virtio_stl_p(vdev, &netcfg.speed, n->net_conf.speed); 1559473939eSJason Baron netcfg.duplex = n->net_conf.duplex; 15659079029SYuri Benditovich netcfg.rss_max_key_size = VIRTIO_NET_RSS_MAX_KEY_SIZE; 15759079029SYuri Benditovich virtio_stw_p(vdev, &netcfg.rss_max_indirection_table_length, 158e22f0603SYuri Benditovich virtio_host_has_feature(vdev, VIRTIO_NET_F_RSS) ? 159e22f0603SYuri Benditovich VIRTIO_NET_RSS_MAX_TABLE_LEN : 1); 16059079029SYuri Benditovich virtio_stl_p(vdev, &netcfg.supported_hash_types, 16159079029SYuri Benditovich VIRTIO_NET_RSS_SUPPORTED_HASHES); 1626e790746SPaolo Bonzini memcpy(config, &netcfg, n->config_size); 163108a6481SCindy Lu 164c546ecf2SJason Wang /* 165c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 166c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 167c546ecf2SJason Wang */ 168c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 169108a6481SCindy Lu ret = vhost_net_get_config(get_vhost_net(nc->peer), (uint8_t *)&netcfg, 170108a6481SCindy Lu n->config_size); 171ebc141a6SEugenio Pérez if (ret == -1) { 172ebc141a6SEugenio Pérez return; 173ebc141a6SEugenio Pérez } 174ebc141a6SEugenio Pérez 175fb592882SCindy Lu /* 176ebc141a6SEugenio Pérez * Some NIC/kernel combinations present 0 as the mac address. As that 177ebc141a6SEugenio Pérez * is not a legal address, try to proceed with the address from the 178ebc141a6SEugenio Pérez * QEMU command line in the hope that the address has been configured 179ebc141a6SEugenio Pérez * correctly elsewhere - just not reported by the device. 180fb592882SCindy Lu */ 181fb592882SCindy Lu if (memcmp(&netcfg.mac, &zero, sizeof(zero)) == 0) { 182fb592882SCindy Lu info_report("Zero hardware mac address detected. Ignoring."); 183fb592882SCindy Lu memcpy(netcfg.mac, n->mac, ETH_ALEN); 184fb592882SCindy Lu } 185ebc141a6SEugenio Pérez 1864f93aafcSEugenio Pérez netcfg.status |= virtio_tswap16(vdev, 1874f93aafcSEugenio Pérez n->status & VIRTIO_NET_S_ANNOUNCE); 188108a6481SCindy Lu memcpy(config, &netcfg, n->config_size); 189108a6481SCindy Lu } 190108a6481SCindy Lu } 1916e790746SPaolo Bonzini 1926e790746SPaolo Bonzini static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config) 1936e790746SPaolo Bonzini { 19417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 1956e790746SPaolo Bonzini struct virtio_net_config netcfg = {}; 196c546ecf2SJason Wang NetClientState *nc = qemu_get_queue(n->nic); 1976e790746SPaolo Bonzini 1986e790746SPaolo Bonzini memcpy(&netcfg, config, n->config_size); 1996e790746SPaolo Bonzini 20095129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) && 20195129d6fSCornelia Huck !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) && 2026e790746SPaolo Bonzini memcmp(netcfg.mac, n->mac, ETH_ALEN)) { 2036e790746SPaolo Bonzini memcpy(n->mac, netcfg.mac, ETH_ALEN); 2046e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 2056e790746SPaolo Bonzini } 206108a6481SCindy Lu 207c546ecf2SJason Wang /* 208c546ecf2SJason Wang * Is this VDPA? No peer means not VDPA: there's no way to 209c546ecf2SJason Wang * disconnect/reconnect a VDPA peer. 210c546ecf2SJason Wang */ 211c546ecf2SJason Wang if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 212c546ecf2SJason Wang vhost_net_set_config(get_vhost_net(nc->peer), 213c546ecf2SJason Wang (uint8_t *)&netcfg, 0, n->config_size, 214f8ed3648SManos Pitsidianakis VHOST_SET_CONFIG_TYPE_FRONTEND); 215108a6481SCindy Lu } 2166e790746SPaolo Bonzini } 2176e790746SPaolo Bonzini 2186e790746SPaolo Bonzini static bool virtio_net_started(VirtIONet *n, uint8_t status) 2196e790746SPaolo Bonzini { 22017a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2216e790746SPaolo Bonzini return (status & VIRTIO_CONFIG_S_DRIVER_OK) && 22217a0ca55SKONRAD Frederic (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running; 2236e790746SPaolo Bonzini } 2246e790746SPaolo Bonzini 225b2c929f0SDr. David Alan Gilbert static void virtio_net_announce_notify(VirtIONet *net) 226b2c929f0SDr. David Alan Gilbert { 227b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(net); 228b2c929f0SDr. David Alan Gilbert trace_virtio_net_announce_notify(); 229b2c929f0SDr. David Alan Gilbert 230b2c929f0SDr. David Alan Gilbert net->status |= VIRTIO_NET_S_ANNOUNCE; 231b2c929f0SDr. David Alan Gilbert virtio_notify_config(vdev); 232b2c929f0SDr. David Alan Gilbert } 233b2c929f0SDr. David Alan Gilbert 234f57fcf70SJason Wang static void virtio_net_announce_timer(void *opaque) 235f57fcf70SJason Wang { 236f57fcf70SJason Wang VirtIONet *n = opaque; 2379d8c6a25SDr. David Alan Gilbert trace_virtio_net_announce_timer(n->announce_timer.round); 238f57fcf70SJason Wang 2399d8c6a25SDr. David Alan Gilbert n->announce_timer.round--; 240b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 241b2c929f0SDr. David Alan Gilbert } 242b2c929f0SDr. David Alan Gilbert 243b2c929f0SDr. David Alan Gilbert static void virtio_net_announce(NetClientState *nc) 244b2c929f0SDr. David Alan Gilbert { 245b2c929f0SDr. David Alan Gilbert VirtIONet *n = qemu_get_nic_opaque(nc); 246b2c929f0SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 247b2c929f0SDr. David Alan Gilbert 248b2c929f0SDr. David Alan Gilbert /* 249b2c929f0SDr. David Alan Gilbert * Make sure the virtio migration announcement timer isn't running 250b2c929f0SDr. David Alan Gilbert * If it is, let it trigger announcement so that we do not cause 251b2c929f0SDr. David Alan Gilbert * confusion. 252b2c929f0SDr. David Alan Gilbert */ 253b2c929f0SDr. David Alan Gilbert if (n->announce_timer.round) { 254b2c929f0SDr. David Alan Gilbert return; 255b2c929f0SDr. David Alan Gilbert } 256b2c929f0SDr. David Alan Gilbert 257b2c929f0SDr. David Alan Gilbert if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 258b2c929f0SDr. David Alan Gilbert virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 259b2c929f0SDr. David Alan Gilbert virtio_net_announce_notify(n); 260b2c929f0SDr. David Alan Gilbert } 261f57fcf70SJason Wang } 262f57fcf70SJason Wang 2636e790746SPaolo Bonzini static void virtio_net_vhost_status(VirtIONet *n, uint8_t status) 2646e790746SPaolo Bonzini { 26517a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2666e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 267441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 268aa858194SSi-Wei Liu int cvq = virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ) ? 269aa858194SSi-Wei Liu n->max_ncs - n->max_queue_pairs : 0; 2706e790746SPaolo Bonzini 271ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 2726e790746SPaolo Bonzini return; 2736e790746SPaolo Bonzini } 2746e790746SPaolo Bonzini 2758c1ac475SRadim Krčmář if ((virtio_net_started(n, status) && !nc->peer->link_down) == 2768c1ac475SRadim Krčmář !!n->vhost_started) { 2776e790746SPaolo Bonzini return; 2786e790746SPaolo Bonzini } 2796e790746SPaolo Bonzini if (!n->vhost_started) { 280086abc1cSMichael S. Tsirkin int r, i; 281086abc1cSMichael S. Tsirkin 2821bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 2831bfa316cSGreg Kurz error_report("backend does not support %s vnet headers; " 2841bfa316cSGreg Kurz "falling back on userspace virtio", 2851bfa316cSGreg Kurz virtio_is_big_endian(vdev) ? "BE" : "LE"); 2861bfa316cSGreg Kurz return; 2871bfa316cSGreg Kurz } 2881bfa316cSGreg Kurz 289086abc1cSMichael S. Tsirkin /* Any packets outstanding? Purge them to avoid touching rings 290086abc1cSMichael S. Tsirkin * when vhost is running. 291086abc1cSMichael S. Tsirkin */ 292441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 293086abc1cSMichael S. Tsirkin NetClientState *qnc = qemu_get_subqueue(n->nic, i); 294086abc1cSMichael S. Tsirkin 295086abc1cSMichael S. Tsirkin /* Purge both directions: TX and RX. */ 296086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->peer->incoming_queue, qnc); 297086abc1cSMichael S. Tsirkin qemu_net_queue_purge(qnc->incoming_queue, qnc->peer); 298086abc1cSMichael S. Tsirkin } 299086abc1cSMichael S. Tsirkin 300a93e599dSMaxime Coquelin if (virtio_has_feature(vdev->guest_features, VIRTIO_NET_F_MTU)) { 301a93e599dSMaxime Coquelin r = vhost_net_set_mtu(get_vhost_net(nc->peer), n->net_conf.mtu); 302a93e599dSMaxime Coquelin if (r < 0) { 303a93e599dSMaxime Coquelin error_report("%uBytes MTU not supported by the backend", 304a93e599dSMaxime Coquelin n->net_conf.mtu); 305a93e599dSMaxime Coquelin 306a93e599dSMaxime Coquelin return; 307a93e599dSMaxime Coquelin } 308a93e599dSMaxime Coquelin } 309a93e599dSMaxime Coquelin 3106e790746SPaolo Bonzini n->vhost_started = 1; 31122288fe5SJason Wang r = vhost_net_start(vdev, n->nic->ncs, queue_pairs, cvq); 3126e790746SPaolo Bonzini if (r < 0) { 3136e790746SPaolo Bonzini error_report("unable to start vhost net: %d: " 3146e790746SPaolo Bonzini "falling back on userspace virtio", -r); 3156e790746SPaolo Bonzini n->vhost_started = 0; 3166e790746SPaolo Bonzini } 3176e790746SPaolo Bonzini } else { 31822288fe5SJason Wang vhost_net_stop(vdev, n->nic->ncs, queue_pairs, cvq); 3196e790746SPaolo Bonzini n->vhost_started = 0; 3206e790746SPaolo Bonzini } 3216e790746SPaolo Bonzini } 3226e790746SPaolo Bonzini 3231bfa316cSGreg Kurz static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev, 3241bfa316cSGreg Kurz NetClientState *peer, 3251bfa316cSGreg Kurz bool enable) 3261bfa316cSGreg Kurz { 3271bfa316cSGreg Kurz if (virtio_is_big_endian(vdev)) { 3281bfa316cSGreg Kurz return qemu_set_vnet_be(peer, enable); 3291bfa316cSGreg Kurz } else { 3301bfa316cSGreg Kurz return qemu_set_vnet_le(peer, enable); 3311bfa316cSGreg Kurz } 3321bfa316cSGreg Kurz } 3331bfa316cSGreg Kurz 3341bfa316cSGreg Kurz static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs, 335441537f1SJason Wang int queue_pairs, bool enable) 3361bfa316cSGreg Kurz { 3371bfa316cSGreg Kurz int i; 3381bfa316cSGreg Kurz 339441537f1SJason Wang for (i = 0; i < queue_pairs; i++) { 3401bfa316cSGreg Kurz if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 && 3411bfa316cSGreg Kurz enable) { 3421bfa316cSGreg Kurz while (--i >= 0) { 3431bfa316cSGreg Kurz virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false); 3441bfa316cSGreg Kurz } 3451bfa316cSGreg Kurz 3461bfa316cSGreg Kurz return true; 3471bfa316cSGreg Kurz } 3481bfa316cSGreg Kurz } 3491bfa316cSGreg Kurz 3501bfa316cSGreg Kurz return false; 3511bfa316cSGreg Kurz } 3521bfa316cSGreg Kurz 3531bfa316cSGreg Kurz static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status) 3541bfa316cSGreg Kurz { 3551bfa316cSGreg Kurz VirtIODevice *vdev = VIRTIO_DEVICE(n); 356441537f1SJason Wang int queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3571bfa316cSGreg Kurz 3581bfa316cSGreg Kurz if (virtio_net_started(n, status)) { 3591bfa316cSGreg Kurz /* Before using the device, we tell the network backend about the 3601bfa316cSGreg Kurz * endianness to use when parsing vnet headers. If the backend 3611bfa316cSGreg Kurz * can't do it, we fallback onto fixing the headers in the core 3621bfa316cSGreg Kurz * virtio-net code. 3631bfa316cSGreg Kurz */ 364ad57f700SAkihiko Odaki n->needs_vnet_hdr_swap = n->has_vnet_hdr && 365ad57f700SAkihiko Odaki virtio_net_set_vnet_endian(vdev, n->nic->ncs, 366441537f1SJason Wang queue_pairs, true); 3671bfa316cSGreg Kurz } else if (virtio_net_started(n, vdev->status)) { 3681bfa316cSGreg Kurz /* After using the device, we need to reset the network backend to 3691bfa316cSGreg Kurz * the default (guest native endianness), otherwise the guest may 3701bfa316cSGreg Kurz * lose network connectivity if it is rebooted into a different 3711bfa316cSGreg Kurz * endianness. 3721bfa316cSGreg Kurz */ 373441537f1SJason Wang virtio_net_set_vnet_endian(vdev, n->nic->ncs, queue_pairs, false); 3741bfa316cSGreg Kurz } 3751bfa316cSGreg Kurz } 3761bfa316cSGreg Kurz 377283e2c2aSYuri Benditovich static void virtio_net_drop_tx_queue_data(VirtIODevice *vdev, VirtQueue *vq) 378283e2c2aSYuri Benditovich { 379283e2c2aSYuri Benditovich unsigned int dropped = virtqueue_drop_all(vq); 380283e2c2aSYuri Benditovich if (dropped) { 381283e2c2aSYuri Benditovich virtio_notify(vdev, vq); 382283e2c2aSYuri Benditovich } 383283e2c2aSYuri Benditovich } 384283e2c2aSYuri Benditovich 3856e790746SPaolo Bonzini static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status) 3866e790746SPaolo Bonzini { 38717a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 3886e790746SPaolo Bonzini VirtIONetQueue *q; 3896e790746SPaolo Bonzini int i; 3906e790746SPaolo Bonzini uint8_t queue_status; 3916e790746SPaolo Bonzini 3921bfa316cSGreg Kurz virtio_net_vnet_endian_status(n, status); 3936e790746SPaolo Bonzini virtio_net_vhost_status(n, status); 3946e790746SPaolo Bonzini 395441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 39638705bb5SFam Zheng NetClientState *ncs = qemu_get_subqueue(n->nic, i); 39738705bb5SFam Zheng bool queue_started; 3986e790746SPaolo Bonzini q = &n->vqs[i]; 3996e790746SPaolo Bonzini 400441537f1SJason Wang if ((!n->multiqueue && i != 0) || i >= n->curr_queue_pairs) { 4016e790746SPaolo Bonzini queue_status = 0; 4026e790746SPaolo Bonzini } else { 4036e790746SPaolo Bonzini queue_status = status; 4046e790746SPaolo Bonzini } 40538705bb5SFam Zheng queue_started = 40638705bb5SFam Zheng virtio_net_started(n, queue_status) && !n->vhost_started; 40738705bb5SFam Zheng 40838705bb5SFam Zheng if (queue_started) { 40938705bb5SFam Zheng qemu_flush_queued_packets(ncs); 41038705bb5SFam Zheng } 4116e790746SPaolo Bonzini 4126e790746SPaolo Bonzini if (!q->tx_waiting) { 4136e790746SPaolo Bonzini continue; 4146e790746SPaolo Bonzini } 4156e790746SPaolo Bonzini 41638705bb5SFam Zheng if (queue_started) { 4176e790746SPaolo Bonzini if (q->tx_timer) { 418bc72ad67SAlex Bligh timer_mod(q->tx_timer, 419bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 4206e790746SPaolo Bonzini } else { 421a0bf401bSNicholas Piggin replay_bh_schedule_event(q->tx_bh); 4226e790746SPaolo Bonzini } 4236e790746SPaolo Bonzini } else { 4246e790746SPaolo Bonzini if (q->tx_timer) { 425bc72ad67SAlex Bligh timer_del(q->tx_timer); 4266e790746SPaolo Bonzini } else { 4276e790746SPaolo Bonzini qemu_bh_cancel(q->tx_bh); 4286e790746SPaolo Bonzini } 429283e2c2aSYuri Benditovich if ((n->status & VIRTIO_NET_S_LINK_UP) == 0 && 43070e53e6eSJason Wang (queue_status & VIRTIO_CONFIG_S_DRIVER_OK) && 43170e53e6eSJason Wang vdev->vm_running) { 432283e2c2aSYuri Benditovich /* if tx is waiting we are likely have some packets in tx queue 433283e2c2aSYuri Benditovich * and disabled notification */ 434283e2c2aSYuri Benditovich q->tx_waiting = 0; 435283e2c2aSYuri Benditovich virtio_queue_set_notification(q->tx_vq, 1); 436283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, q->tx_vq); 437283e2c2aSYuri Benditovich } 4386e790746SPaolo Bonzini } 4396e790746SPaolo Bonzini } 4406e790746SPaolo Bonzini } 4416e790746SPaolo Bonzini 4426e790746SPaolo Bonzini static void virtio_net_set_link_status(NetClientState *nc) 4436e790746SPaolo Bonzini { 4446e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 44517a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 4466e790746SPaolo Bonzini uint16_t old_status = n->status; 4476e790746SPaolo Bonzini 4486e790746SPaolo Bonzini if (nc->link_down) 4496e790746SPaolo Bonzini n->status &= ~VIRTIO_NET_S_LINK_UP; 4506e790746SPaolo Bonzini else 4516e790746SPaolo Bonzini n->status |= VIRTIO_NET_S_LINK_UP; 4526e790746SPaolo Bonzini 4536e790746SPaolo Bonzini if (n->status != old_status) 45417a0ca55SKONRAD Frederic virtio_notify_config(vdev); 4556e790746SPaolo Bonzini 45617a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 4576e790746SPaolo Bonzini } 4586e790746SPaolo Bonzini 459b1be4280SAmos Kong static void rxfilter_notify(NetClientState *nc) 460b1be4280SAmos Kong { 461b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 462b1be4280SAmos Kong 463b1be4280SAmos Kong if (nc->rxfilter_notify_enabled) { 464ddfb0baaSMarkus Armbruster char *path = object_get_canonical_path(OBJECT(n->qdev)); 4657480874aSMarkus Armbruster qapi_event_send_nic_rx_filter_changed(n->netclient_name, path); 46696e35046SAmos Kong g_free(path); 467b1be4280SAmos Kong 468b1be4280SAmos Kong /* disable event notification to avoid events flooding */ 469b1be4280SAmos Kong nc->rxfilter_notify_enabled = 0; 470b1be4280SAmos Kong } 471b1be4280SAmos Kong } 472b1be4280SAmos Kong 473f7bc8ef8SAmos Kong static intList *get_vlan_table(VirtIONet *n) 474f7bc8ef8SAmos Kong { 47554aa3de7SEric Blake intList *list; 476f7bc8ef8SAmos Kong int i, j; 477f7bc8ef8SAmos Kong 478f7bc8ef8SAmos Kong list = NULL; 479f7bc8ef8SAmos Kong for (i = 0; i < MAX_VLAN >> 5; i++) { 480f7bc8ef8SAmos Kong for (j = 0; n->vlans[i] && j <= 0x1f; j++) { 481f7bc8ef8SAmos Kong if (n->vlans[i] & (1U << j)) { 48254aa3de7SEric Blake QAPI_LIST_PREPEND(list, (i << 5) + j); 483f7bc8ef8SAmos Kong } 484f7bc8ef8SAmos Kong } 485f7bc8ef8SAmos Kong } 486f7bc8ef8SAmos Kong 487f7bc8ef8SAmos Kong return list; 488f7bc8ef8SAmos Kong } 489f7bc8ef8SAmos Kong 490b1be4280SAmos Kong static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc) 491b1be4280SAmos Kong { 492b1be4280SAmos Kong VirtIONet *n = qemu_get_nic_opaque(nc); 493f7bc8ef8SAmos Kong VirtIODevice *vdev = VIRTIO_DEVICE(n); 494b1be4280SAmos Kong RxFilterInfo *info; 49554aa3de7SEric Blake strList *str_list; 496f7bc8ef8SAmos Kong int i; 497b1be4280SAmos Kong 498b1be4280SAmos Kong info = g_malloc0(sizeof(*info)); 499b1be4280SAmos Kong info->name = g_strdup(nc->name); 500b1be4280SAmos Kong info->promiscuous = n->promisc; 501b1be4280SAmos Kong 502b1be4280SAmos Kong if (n->nouni) { 503b1be4280SAmos Kong info->unicast = RX_STATE_NONE; 504b1be4280SAmos Kong } else if (n->alluni) { 505b1be4280SAmos Kong info->unicast = RX_STATE_ALL; 506b1be4280SAmos Kong } else { 507b1be4280SAmos Kong info->unicast = RX_STATE_NORMAL; 508b1be4280SAmos Kong } 509b1be4280SAmos Kong 510b1be4280SAmos Kong if (n->nomulti) { 511b1be4280SAmos Kong info->multicast = RX_STATE_NONE; 512b1be4280SAmos Kong } else if (n->allmulti) { 513b1be4280SAmos Kong info->multicast = RX_STATE_ALL; 514b1be4280SAmos Kong } else { 515b1be4280SAmos Kong info->multicast = RX_STATE_NORMAL; 516b1be4280SAmos Kong } 517b1be4280SAmos Kong 518b1be4280SAmos Kong info->broadcast_allowed = n->nobcast; 519b1be4280SAmos Kong info->multicast_overflow = n->mac_table.multi_overflow; 520b1be4280SAmos Kong info->unicast_overflow = n->mac_table.uni_overflow; 521b1be4280SAmos Kong 522b0575ba4SScott Feldman info->main_mac = qemu_mac_strdup_printf(n->mac); 523b1be4280SAmos Kong 524b1be4280SAmos Kong str_list = NULL; 525b1be4280SAmos Kong for (i = 0; i < n->mac_table.first_multi; i++) { 52654aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 52754aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 528b1be4280SAmos Kong } 529b1be4280SAmos Kong info->unicast_table = str_list; 530b1be4280SAmos Kong 531b1be4280SAmos Kong str_list = NULL; 532b1be4280SAmos Kong for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 53354aa3de7SEric Blake QAPI_LIST_PREPEND(str_list, 53454aa3de7SEric Blake qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN)); 535b1be4280SAmos Kong } 536b1be4280SAmos Kong info->multicast_table = str_list; 537f7bc8ef8SAmos Kong info->vlan_table = get_vlan_table(n); 538b1be4280SAmos Kong 53995129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) { 540f7bc8ef8SAmos Kong info->vlan = RX_STATE_ALL; 541f7bc8ef8SAmos Kong } else if (!info->vlan_table) { 542f7bc8ef8SAmos Kong info->vlan = RX_STATE_NONE; 543f7bc8ef8SAmos Kong } else { 544f7bc8ef8SAmos Kong info->vlan = RX_STATE_NORMAL; 545b1be4280SAmos Kong } 546b1be4280SAmos Kong 547b1be4280SAmos Kong /* enable event notification after query */ 548b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 549b1be4280SAmos Kong 550b1be4280SAmos Kong return info; 551b1be4280SAmos Kong } 552b1be4280SAmos Kong 5537dc6be52SXuan Zhuo static void virtio_net_queue_reset(VirtIODevice *vdev, uint32_t queue_index) 5547dc6be52SXuan Zhuo { 5557dc6be52SXuan Zhuo VirtIONet *n = VIRTIO_NET(vdev); 556f47af0afSXuan Zhuo NetClientState *nc; 557f47af0afSXuan Zhuo 558f47af0afSXuan Zhuo /* validate queue_index and skip for cvq */ 559f47af0afSXuan Zhuo if (queue_index >= n->max_queue_pairs * 2) { 560f47af0afSXuan Zhuo return; 561f47af0afSXuan Zhuo } 562f47af0afSXuan Zhuo 563f47af0afSXuan Zhuo nc = qemu_get_subqueue(n->nic, vq2q(queue_index)); 5647dc6be52SXuan Zhuo 5657dc6be52SXuan Zhuo if (!nc->peer) { 5667dc6be52SXuan Zhuo return; 5677dc6be52SXuan Zhuo } 5687dc6be52SXuan Zhuo 5697dc6be52SXuan Zhuo if (get_vhost_net(nc->peer) && 5707dc6be52SXuan Zhuo nc->peer->info->type == NET_CLIENT_DRIVER_TAP) { 5717dc6be52SXuan Zhuo vhost_net_virtqueue_reset(vdev, nc, queue_index); 5727dc6be52SXuan Zhuo } 5737dc6be52SXuan Zhuo 5747dc6be52SXuan Zhuo flush_or_purge_queued_packets(nc); 5757dc6be52SXuan Zhuo } 5767dc6be52SXuan Zhuo 5777f863302SKangjie Xu static void virtio_net_queue_enable(VirtIODevice *vdev, uint32_t queue_index) 5787f863302SKangjie Xu { 5797f863302SKangjie Xu VirtIONet *n = VIRTIO_NET(vdev); 580f47af0afSXuan Zhuo NetClientState *nc; 5817f863302SKangjie Xu int r; 5827f863302SKangjie Xu 583f47af0afSXuan Zhuo /* validate queue_index and skip for cvq */ 584f47af0afSXuan Zhuo if (queue_index >= n->max_queue_pairs * 2) { 585f47af0afSXuan Zhuo return; 586f47af0afSXuan Zhuo } 587f47af0afSXuan Zhuo 588f47af0afSXuan Zhuo nc = qemu_get_subqueue(n->nic, vq2q(queue_index)); 589f47af0afSXuan Zhuo 5907f863302SKangjie Xu if (!nc->peer || !vdev->vhost_started) { 5917f863302SKangjie Xu return; 5927f863302SKangjie Xu } 5937f863302SKangjie Xu 5947f863302SKangjie Xu if (get_vhost_net(nc->peer) && 5957f863302SKangjie Xu nc->peer->info->type == NET_CLIENT_DRIVER_TAP) { 5967f863302SKangjie Xu r = vhost_net_virtqueue_restart(vdev, nc, queue_index); 5977f863302SKangjie Xu if (r < 0) { 5987f863302SKangjie Xu error_report("unable to restart vhost net virtqueue: %d, " 5997f863302SKangjie Xu "when resetting the queue", queue_index); 6007f863302SKangjie Xu } 6017f863302SKangjie Xu } 6027f863302SKangjie Xu } 6037f863302SKangjie Xu 6046e790746SPaolo Bonzini static void peer_test_vnet_hdr(VirtIONet *n) 6056e790746SPaolo Bonzini { 6066e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 6076e790746SPaolo Bonzini if (!nc->peer) { 6086e790746SPaolo Bonzini return; 6096e790746SPaolo Bonzini } 6106e790746SPaolo Bonzini 611d6085e3aSStefan Hajnoczi n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer); 6126e790746SPaolo Bonzini } 6136e790746SPaolo Bonzini 6146e790746SPaolo Bonzini static int peer_has_vnet_hdr(VirtIONet *n) 6156e790746SPaolo Bonzini { 6166e790746SPaolo Bonzini return n->has_vnet_hdr; 6176e790746SPaolo Bonzini } 6186e790746SPaolo Bonzini 6196e790746SPaolo Bonzini static int peer_has_ufo(VirtIONet *n) 6206e790746SPaolo Bonzini { 6216e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) 6226e790746SPaolo Bonzini return 0; 6236e790746SPaolo Bonzini 624d6085e3aSStefan Hajnoczi n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer); 6256e790746SPaolo Bonzini 6266e790746SPaolo Bonzini return n->has_ufo; 6276e790746SPaolo Bonzini } 6286e790746SPaolo Bonzini 62953da8b5aSYuri Benditovich static int peer_has_uso(VirtIONet *n) 63053da8b5aSYuri Benditovich { 63153da8b5aSYuri Benditovich if (!peer_has_vnet_hdr(n)) { 63253da8b5aSYuri Benditovich return 0; 63353da8b5aSYuri Benditovich } 63453da8b5aSYuri Benditovich 63553da8b5aSYuri Benditovich return qemu_has_uso(qemu_get_queue(n->nic)->peer); 63653da8b5aSYuri Benditovich } 63753da8b5aSYuri Benditovich 638bb9d17f8SCornelia Huck static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs, 639e22f0603SYuri Benditovich int version_1, int hash_report) 6406e790746SPaolo Bonzini { 6416e790746SPaolo Bonzini int i; 6426e790746SPaolo Bonzini NetClientState *nc; 6436e790746SPaolo Bonzini 6446e790746SPaolo Bonzini n->mergeable_rx_bufs = mergeable_rx_bufs; 6456e790746SPaolo Bonzini 646bb9d17f8SCornelia Huck if (version_1) { 647e22f0603SYuri Benditovich n->guest_hdr_len = hash_report ? 648e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_v1_hash) : 649e22f0603SYuri Benditovich sizeof(struct virtio_net_hdr_mrg_rxbuf); 650e22f0603SYuri Benditovich n->rss_data.populate_hash = !!hash_report; 651bb9d17f8SCornelia Huck } else { 6526e790746SPaolo Bonzini n->guest_hdr_len = n->mergeable_rx_bufs ? 653bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr_mrg_rxbuf) : 654bb9d17f8SCornelia Huck sizeof(struct virtio_net_hdr); 65513d40aa8SAkihiko Odaki n->rss_data.populate_hash = false; 656bb9d17f8SCornelia Huck } 6576e790746SPaolo Bonzini 658441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 6596e790746SPaolo Bonzini nc = qemu_get_subqueue(n->nic, i); 6606e790746SPaolo Bonzini 6616e790746SPaolo Bonzini if (peer_has_vnet_hdr(n) && 662d6085e3aSStefan Hajnoczi qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) { 663d6085e3aSStefan Hajnoczi qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len); 6646e790746SPaolo Bonzini n->host_hdr_len = n->guest_hdr_len; 6656e790746SPaolo Bonzini } 6666e790746SPaolo Bonzini } 6676e790746SPaolo Bonzini } 6686e790746SPaolo Bonzini 6692eef278bSMichael S. Tsirkin static int virtio_net_max_tx_queue_size(VirtIONet *n) 6702eef278bSMichael S. Tsirkin { 6712eef278bSMichael S. Tsirkin NetClientState *peer = n->nic_conf.peers.ncs[0]; 6722eef278bSMichael S. Tsirkin 6732eef278bSMichael S. Tsirkin /* 6740ea5778fSEugenio Pérez * Backends other than vhost-user or vhost-vdpa don't support max queue 6750ea5778fSEugenio Pérez * size. 6762eef278bSMichael S. Tsirkin */ 6772eef278bSMichael S. Tsirkin if (!peer) { 6782eef278bSMichael S. Tsirkin return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 6792eef278bSMichael S. Tsirkin } 6802eef278bSMichael S. Tsirkin 6810ea5778fSEugenio Pérez switch(peer->info->type) { 6820ea5778fSEugenio Pérez case NET_CLIENT_DRIVER_VHOST_USER: 6830ea5778fSEugenio Pérez case NET_CLIENT_DRIVER_VHOST_VDPA: 6842eef278bSMichael S. Tsirkin return VIRTQUEUE_MAX_SIZE; 6850ea5778fSEugenio Pérez default: 6860ea5778fSEugenio Pérez return VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE; 6870ea5778fSEugenio Pérez }; 6882eef278bSMichael S. Tsirkin } 6892eef278bSMichael S. Tsirkin 6906e790746SPaolo Bonzini static int peer_attach(VirtIONet *n, int index) 6916e790746SPaolo Bonzini { 6926e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 6936e790746SPaolo Bonzini 6946e790746SPaolo Bonzini if (!nc->peer) { 6956e790746SPaolo Bonzini return 0; 6966e790746SPaolo Bonzini } 6976e790746SPaolo Bonzini 698f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 6997263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 1); 7007263a0adSChangchun Ouyang } 7017263a0adSChangchun Ouyang 702f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 7036e790746SPaolo Bonzini return 0; 7046e790746SPaolo Bonzini } 7056e790746SPaolo Bonzini 706441537f1SJason Wang if (n->max_queue_pairs == 1) { 7071074b879SJason Wang return 0; 7081074b879SJason Wang } 7091074b879SJason Wang 7106e790746SPaolo Bonzini return tap_enable(nc->peer); 7116e790746SPaolo Bonzini } 7126e790746SPaolo Bonzini 7136e790746SPaolo Bonzini static int peer_detach(VirtIONet *n, int index) 7146e790746SPaolo Bonzini { 7156e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, index); 7166e790746SPaolo Bonzini 7176e790746SPaolo Bonzini if (!nc->peer) { 7186e790746SPaolo Bonzini return 0; 7196e790746SPaolo Bonzini } 7206e790746SPaolo Bonzini 721f394b2e2SEric Blake if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) { 7227263a0adSChangchun Ouyang vhost_set_vring_enable(nc->peer, 0); 7237263a0adSChangchun Ouyang } 7247263a0adSChangchun Ouyang 725f394b2e2SEric Blake if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) { 7266e790746SPaolo Bonzini return 0; 7276e790746SPaolo Bonzini } 7286e790746SPaolo Bonzini 7296e790746SPaolo Bonzini return tap_disable(nc->peer); 7306e790746SPaolo Bonzini } 7316e790746SPaolo Bonzini 732441537f1SJason Wang static void virtio_net_set_queue_pairs(VirtIONet *n) 7336e790746SPaolo Bonzini { 7346e790746SPaolo Bonzini int i; 735ddfa83eaSJoel Stanley int r; 7366e790746SPaolo Bonzini 73768b5f314SYuri Benditovich if (n->nic->peer_deleted) { 73868b5f314SYuri Benditovich return; 73968b5f314SYuri Benditovich } 74068b5f314SYuri Benditovich 741441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 742441537f1SJason Wang if (i < n->curr_queue_pairs) { 743ddfa83eaSJoel Stanley r = peer_attach(n, i); 744ddfa83eaSJoel Stanley assert(!r); 7456e790746SPaolo Bonzini } else { 746ddfa83eaSJoel Stanley r = peer_detach(n, i); 747ddfa83eaSJoel Stanley assert(!r); 7486e790746SPaolo Bonzini } 7496e790746SPaolo Bonzini } 7506e790746SPaolo Bonzini } 7516e790746SPaolo Bonzini 752ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue); 7536e790746SPaolo Bonzini 7549d5b731dSJason Wang static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features, 7559d5b731dSJason Wang Error **errp) 7566e790746SPaolo Bonzini { 75717a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 7586e790746SPaolo Bonzini NetClientState *nc = qemu_get_queue(n->nic); 7596e790746SPaolo Bonzini 760da3e8a23SShannon Zhao /* Firstly sync all virtio-net possible supported features */ 761da3e8a23SShannon Zhao features |= n->host_features; 762da3e8a23SShannon Zhao 7630cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 7646e790746SPaolo Bonzini 7656e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n)) { 7660cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_CSUM); 7670cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4); 7680cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6); 7690cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN); 7706e790746SPaolo Bonzini 7710cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM); 7720cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4); 7730cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6); 7740cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN); 775e22f0603SYuri Benditovich 77653da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HOST_USO); 77753da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO4); 77853da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO6); 77953da8b5aSYuri Benditovich 780e22f0603SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HASH_REPORT); 7816e790746SPaolo Bonzini } 7826e790746SPaolo Bonzini 7836e790746SPaolo Bonzini if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) { 7840cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO); 7850cd09c3aSCornelia Huck virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO); 7866e790746SPaolo Bonzini } 7876e790746SPaolo Bonzini 78853da8b5aSYuri Benditovich if (!peer_has_uso(n)) { 78953da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_HOST_USO); 79053da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO4); 79153da8b5aSYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_USO6); 79253da8b5aSYuri Benditovich } 79353da8b5aSYuri Benditovich 794ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 7956e790746SPaolo Bonzini return features; 7966e790746SPaolo Bonzini } 7972974e916SYuri Benditovich 7980145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 79959079029SYuri Benditovich virtio_clear_feature(&features, VIRTIO_NET_F_RSS); 8000145c393SAndrew Melnychenko } 80175ebec11SMaxime Coquelin features = vhost_net_get_features(get_vhost_net(nc->peer), features); 80275ebec11SMaxime Coquelin vdev->backend_features = features; 80375ebec11SMaxime Coquelin 80475ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 80575ebec11SMaxime Coquelin (n->host_features & 1ULL << VIRTIO_NET_F_MTU)) { 80675ebec11SMaxime Coquelin features |= (1ULL << VIRTIO_NET_F_MTU); 80775ebec11SMaxime Coquelin } 80875ebec11SMaxime Coquelin 809cd69d47cSEugenio Pérez /* 810cd69d47cSEugenio Pérez * Since GUEST_ANNOUNCE is emulated the feature bit could be set without 811cd69d47cSEugenio Pérez * enabled. This happens in the vDPA case. 812cd69d47cSEugenio Pérez * 813cd69d47cSEugenio Pérez * Make sure the feature set is not incoherent, as the driver could refuse 814cd69d47cSEugenio Pérez * to start. 815cd69d47cSEugenio Pérez * 816cd69d47cSEugenio Pérez * TODO: QEMU is able to emulate a CVQ just for guest_announce purposes, 817cd69d47cSEugenio Pérez * helping guest to notify the new location with vDPA devices that does not 818cd69d47cSEugenio Pérez * support it. 819cd69d47cSEugenio Pérez */ 820cd69d47cSEugenio Pérez if (!virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_CTRL_VQ)) { 821cd69d47cSEugenio Pérez virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ANNOUNCE); 822cd69d47cSEugenio Pérez } 823cd69d47cSEugenio Pérez 82475ebec11SMaxime Coquelin return features; 8256e790746SPaolo Bonzini } 8266e790746SPaolo Bonzini 827019a3edbSGerd Hoffmann static uint64_t virtio_net_bad_features(VirtIODevice *vdev) 8286e790746SPaolo Bonzini { 829019a3edbSGerd Hoffmann uint64_t features = 0; 8306e790746SPaolo Bonzini 8316e790746SPaolo Bonzini /* Linux kernel 2.6.25. It understood MAC (as everyone must), 8326e790746SPaolo Bonzini * but also these: */ 8330cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_MAC); 8340cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_CSUM); 8350cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4); 8360cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6); 8370cd09c3aSCornelia Huck virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN); 8386e790746SPaolo Bonzini 8396e790746SPaolo Bonzini return features; 8406e790746SPaolo Bonzini } 8416e790746SPaolo Bonzini 842644c9858SDmitry Fleytman static void virtio_net_apply_guest_offloads(VirtIONet *n) 843644c9858SDmitry Fleytman { 844ad37bb3bSStefan Hajnoczi qemu_set_offload(qemu_get_queue(n->nic)->peer, 845644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)), 846644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)), 847644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)), 848644c9858SDmitry Fleytman !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)), 8492ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)), 8502ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_USO4)), 8512ab0ec31SAndrew Melnychenko !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_USO6))); 852644c9858SDmitry Fleytman } 853644c9858SDmitry Fleytman 85453da8b5aSYuri Benditovich static uint64_t virtio_net_guest_offloads_by_features(uint64_t features) 855644c9858SDmitry Fleytman { 856644c9858SDmitry Fleytman static const uint64_t guest_offloads_mask = 857644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_CSUM) | 858644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO4) | 859644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_TSO6) | 860644c9858SDmitry Fleytman (1ULL << VIRTIO_NET_F_GUEST_ECN) | 86153da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_UFO) | 86253da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_USO4) | 86353da8b5aSYuri Benditovich (1ULL << VIRTIO_NET_F_GUEST_USO6); 864644c9858SDmitry Fleytman 865644c9858SDmitry Fleytman return guest_offloads_mask & features; 866644c9858SDmitry Fleytman } 867644c9858SDmitry Fleytman 8680b545b1eSHawkins Jiawei uint64_t virtio_net_supported_guest_offloads(const VirtIONet *n) 869644c9858SDmitry Fleytman { 870644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 871644c9858SDmitry Fleytman return virtio_net_guest_offloads_by_features(vdev->guest_features); 872644c9858SDmitry Fleytman } 873644c9858SDmitry Fleytman 874f5e1847bSJuan Quintela typedef struct { 875f5e1847bSJuan Quintela VirtIONet *n; 87612b2fad7SKevin Wolf DeviceState *dev; 87712b2fad7SKevin Wolf } FailoverDevice; 878f5e1847bSJuan Quintela 879f5e1847bSJuan Quintela /** 88012b2fad7SKevin Wolf * Set the failover primary device 881f5e1847bSJuan Quintela * 882f5e1847bSJuan Quintela * @opaque: FailoverId to setup 883f5e1847bSJuan Quintela * @opts: opts for device we are handling 884f5e1847bSJuan Quintela * @errp: returns an error if this function fails 885f5e1847bSJuan Quintela */ 88612b2fad7SKevin Wolf static int failover_set_primary(DeviceState *dev, void *opaque) 887f5e1847bSJuan Quintela { 88812b2fad7SKevin Wolf FailoverDevice *fdev = opaque; 88912b2fad7SKevin Wolf PCIDevice *pci_dev = (PCIDevice *) 89012b2fad7SKevin Wolf object_dynamic_cast(OBJECT(dev), TYPE_PCI_DEVICE); 891f5e1847bSJuan Quintela 89212b2fad7SKevin Wolf if (!pci_dev) { 89312b2fad7SKevin Wolf return 0; 89412b2fad7SKevin Wolf } 89512b2fad7SKevin Wolf 89612b2fad7SKevin Wolf if (!g_strcmp0(pci_dev->failover_pair_id, fdev->n->netclient_name)) { 89712b2fad7SKevin Wolf fdev->dev = dev; 898f5e1847bSJuan Quintela return 1; 899f5e1847bSJuan Quintela } 900f5e1847bSJuan Quintela 901f5e1847bSJuan Quintela return 0; 902f5e1847bSJuan Quintela } 903f5e1847bSJuan Quintela 904f5e1847bSJuan Quintela /** 90585d3b931SJuan Quintela * Find the primary device for this failover virtio-net 90685d3b931SJuan Quintela * 90785d3b931SJuan Quintela * @n: VirtIONet device 90885d3b931SJuan Quintela * @errp: returns an error if this function fails 90985d3b931SJuan Quintela */ 9100a0a27d6SJuan Quintela static DeviceState *failover_find_primary_device(VirtIONet *n) 9119711cd0dSJens Freimann { 91212b2fad7SKevin Wolf FailoverDevice fdev = { 91312b2fad7SKevin Wolf .n = n, 91412b2fad7SKevin Wolf }; 9159711cd0dSJens Freimann 91612b2fad7SKevin Wolf qbus_walk_children(sysbus_get_default(), failover_set_primary, NULL, 91712b2fad7SKevin Wolf NULL, NULL, &fdev); 91812b2fad7SKevin Wolf return fdev.dev; 9199711cd0dSJens Freimann } 9209711cd0dSJens Freimann 92121e8709bSJuan Quintela static void failover_add_primary(VirtIONet *n, Error **errp) 92221e8709bSJuan Quintela { 92321e8709bSJuan Quintela Error *err = NULL; 92421e8709bSJuan Quintela DeviceState *dev = failover_find_primary_device(n); 92521e8709bSJuan Quintela 92621e8709bSJuan Quintela if (dev) { 92721e8709bSJuan Quintela return; 92821e8709bSJuan Quintela } 92921e8709bSJuan Quintela 930259a10dbSKevin Wolf if (!n->primary_opts) { 93197ca9c59SLaurent Vivier error_setg(errp, "Primary device not found"); 93297ca9c59SLaurent Vivier error_append_hint(errp, "Virtio-net failover will not work. Make " 93397ca9c59SLaurent Vivier "sure primary device has parameter" 93497ca9c59SLaurent Vivier " failover_pair_id=%s\n", n->netclient_name); 93521e8709bSJuan Quintela return; 93621e8709bSJuan Quintela } 937259a10dbSKevin Wolf 938f3558b1bSKevin Wolf dev = qdev_device_add_from_qdict(n->primary_opts, 939f3558b1bSKevin Wolf n->primary_opts_from_json, 940f3558b1bSKevin Wolf &err); 94121e8709bSJuan Quintela if (err) { 942f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 943259a10dbSKevin Wolf n->primary_opts = NULL; 94400e7b129SLaurent Vivier } else { 94500e7b129SLaurent Vivier object_unref(OBJECT(dev)); 94621e8709bSJuan Quintela } 94721e8709bSJuan Quintela error_propagate(errp, err); 94821e8709bSJuan Quintela } 94921e8709bSJuan Quintela 950d5aaa1b0SGerd Hoffmann static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features) 9516e790746SPaolo Bonzini { 95217a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 9539711cd0dSJens Freimann Error *err = NULL; 9546e790746SPaolo Bonzini int i; 9556e790746SPaolo Bonzini 95675ebec11SMaxime Coquelin if (n->mtu_bypass_backend && 95775ebec11SMaxime Coquelin !virtio_has_feature(vdev->backend_features, VIRTIO_NET_F_MTU)) { 95875ebec11SMaxime Coquelin features &= ~(1ULL << VIRTIO_NET_F_MTU); 95975ebec11SMaxime Coquelin } 96075ebec11SMaxime Coquelin 961ef546f12SCornelia Huck virtio_net_set_multiqueue(n, 96259079029SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_RSS) || 96395129d6fSCornelia Huck virtio_has_feature(features, VIRTIO_NET_F_MQ)); 9646e790746SPaolo Bonzini 965ef546f12SCornelia Huck virtio_net_set_mrg_rx_bufs(n, 96695129d6fSCornelia Huck virtio_has_feature(features, 967bb9d17f8SCornelia Huck VIRTIO_NET_F_MRG_RXBUF), 96895129d6fSCornelia Huck virtio_has_feature(features, 969e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 970e22f0603SYuri Benditovich virtio_has_feature(features, 971e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 9726e790746SPaolo Bonzini 9732974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 9742974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO4); 9752974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(features, VIRTIO_NET_F_RSC_EXT) && 9762974e916SYuri Benditovich virtio_has_feature(features, VIRTIO_NET_F_GUEST_TSO6); 977e22f0603SYuri Benditovich n->rss_data.redirect = virtio_has_feature(features, VIRTIO_NET_F_RSS); 9782974e916SYuri Benditovich 9796e790746SPaolo Bonzini if (n->has_vnet_hdr) { 980644c9858SDmitry Fleytman n->curr_guest_offloads = 981644c9858SDmitry Fleytman virtio_net_guest_offloads_by_features(features); 982644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 9836e790746SPaolo Bonzini } 9846e790746SPaolo Bonzini 985441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 9866e790746SPaolo Bonzini NetClientState *nc = qemu_get_subqueue(n->nic, i); 9876e790746SPaolo Bonzini 988ed8b4afeSNikolay Nikolaev if (!get_vhost_net(nc->peer)) { 9896e790746SPaolo Bonzini continue; 9906e790746SPaolo Bonzini } 991ed8b4afeSNikolay Nikolaev vhost_net_ack_features(get_vhost_net(nc->peer), features); 992c9bdc449SHyman Huang(黄勇) 993c9bdc449SHyman Huang(黄勇) /* 994c9bdc449SHyman Huang(黄勇) * keep acked_features in NetVhostUserState up-to-date so it 995c9bdc449SHyman Huang(黄勇) * can't miss any features configured by guest virtio driver. 996c9bdc449SHyman Huang(黄勇) */ 997c9bdc449SHyman Huang(黄勇) vhost_net_save_acked_features(nc->peer); 9986e790746SPaolo Bonzini } 9990b1eaa88SStefan Fritsch 100006b636a1SHawkins Jiawei if (!virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) { 10010b1eaa88SStefan Fritsch memset(n->vlans, 0xff, MAX_VLAN >> 3); 10020b1eaa88SStefan Fritsch } 10039711cd0dSJens Freimann 10049711cd0dSJens Freimann if (virtio_has_feature(features, VIRTIO_NET_F_STANDBY)) { 10059711cd0dSJens Freimann qapi_event_send_failover_negotiated(n->netclient_name); 1006e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 10079711cd0dSJens Freimann failover_add_primary(n, &err); 10089711cd0dSJens Freimann if (err) { 10091b529d90SLaurent Vivier if (!qtest_enabled()) { 10109711cd0dSJens Freimann warn_report_err(err); 10111b529d90SLaurent Vivier } else { 10121b529d90SLaurent Vivier error_free(err); 10131b529d90SLaurent Vivier } 10149711cd0dSJens Freimann } 10156e790746SPaolo Bonzini } 101621e8709bSJuan Quintela } 10176e790746SPaolo Bonzini 10186e790746SPaolo Bonzini static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd, 10196e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 10206e790746SPaolo Bonzini { 10216e790746SPaolo Bonzini uint8_t on; 10226e790746SPaolo Bonzini size_t s; 1023b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 10246e790746SPaolo Bonzini 10256e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on)); 10266e790746SPaolo Bonzini if (s != sizeof(on)) { 10276e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10286e790746SPaolo Bonzini } 10296e790746SPaolo Bonzini 10306e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) { 10316e790746SPaolo Bonzini n->promisc = on; 10326e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) { 10336e790746SPaolo Bonzini n->allmulti = on; 10346e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) { 10356e790746SPaolo Bonzini n->alluni = on; 10366e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) { 10376e790746SPaolo Bonzini n->nomulti = on; 10386e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) { 10396e790746SPaolo Bonzini n->nouni = on; 10406e790746SPaolo Bonzini } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) { 10416e790746SPaolo Bonzini n->nobcast = on; 10426e790746SPaolo Bonzini } else { 10436e790746SPaolo Bonzini return VIRTIO_NET_ERR; 10446e790746SPaolo Bonzini } 10456e790746SPaolo Bonzini 1046b1be4280SAmos Kong rxfilter_notify(nc); 1047b1be4280SAmos Kong 10486e790746SPaolo Bonzini return VIRTIO_NET_OK; 10496e790746SPaolo Bonzini } 10506e790746SPaolo Bonzini 1051644c9858SDmitry Fleytman static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd, 1052644c9858SDmitry Fleytman struct iovec *iov, unsigned int iov_cnt) 1053644c9858SDmitry Fleytman { 1054644c9858SDmitry Fleytman VirtIODevice *vdev = VIRTIO_DEVICE(n); 1055644c9858SDmitry Fleytman uint64_t offloads; 1056644c9858SDmitry Fleytman size_t s; 1057644c9858SDmitry Fleytman 105895129d6fSCornelia Huck if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 1059644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1060644c9858SDmitry Fleytman } 1061644c9858SDmitry Fleytman 1062644c9858SDmitry Fleytman s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads)); 1063644c9858SDmitry Fleytman if (s != sizeof(offloads)) { 1064644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1065644c9858SDmitry Fleytman } 1066644c9858SDmitry Fleytman 1067644c9858SDmitry Fleytman if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) { 1068644c9858SDmitry Fleytman uint64_t supported_offloads; 1069644c9858SDmitry Fleytman 1070189ae6bbSJason Wang offloads = virtio_ldq_p(vdev, &offloads); 1071189ae6bbSJason Wang 1072644c9858SDmitry Fleytman if (!n->has_vnet_hdr) { 1073644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1074644c9858SDmitry Fleytman } 1075644c9858SDmitry Fleytman 10762974e916SYuri Benditovich n->rsc4_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 10772974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO4); 10782974e916SYuri Benditovich n->rsc6_enabled = virtio_has_feature(offloads, VIRTIO_NET_F_RSC_EXT) && 10792974e916SYuri Benditovich virtio_has_feature(offloads, VIRTIO_NET_F_GUEST_TSO6); 10802974e916SYuri Benditovich virtio_clear_feature(&offloads, VIRTIO_NET_F_RSC_EXT); 10812974e916SYuri Benditovich 1082644c9858SDmitry Fleytman supported_offloads = virtio_net_supported_guest_offloads(n); 1083644c9858SDmitry Fleytman if (offloads & ~supported_offloads) { 1084644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1085644c9858SDmitry Fleytman } 1086644c9858SDmitry Fleytman 1087644c9858SDmitry Fleytman n->curr_guest_offloads = offloads; 1088644c9858SDmitry Fleytman virtio_net_apply_guest_offloads(n); 1089644c9858SDmitry Fleytman 1090644c9858SDmitry Fleytman return VIRTIO_NET_OK; 1091644c9858SDmitry Fleytman } else { 1092644c9858SDmitry Fleytman return VIRTIO_NET_ERR; 1093644c9858SDmitry Fleytman } 1094644c9858SDmitry Fleytman } 1095644c9858SDmitry Fleytman 10966e790746SPaolo Bonzini static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd, 10976e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 10986e790746SPaolo Bonzini { 10991399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 11006e790746SPaolo Bonzini struct virtio_net_ctrl_mac mac_data; 11016e790746SPaolo Bonzini size_t s; 1102b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 11036e790746SPaolo Bonzini 11046e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) { 11056e790746SPaolo Bonzini if (iov_size(iov, iov_cnt) != sizeof(n->mac)) { 11066e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11076e790746SPaolo Bonzini } 11086e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac)); 11096e790746SPaolo Bonzini assert(s == sizeof(n->mac)); 11106e790746SPaolo Bonzini qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 1111b1be4280SAmos Kong rxfilter_notify(nc); 1112b1be4280SAmos Kong 11136e790746SPaolo Bonzini return VIRTIO_NET_OK; 11146e790746SPaolo Bonzini } 11156e790746SPaolo Bonzini 11166e790746SPaolo Bonzini if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) { 11176e790746SPaolo Bonzini return VIRTIO_NET_ERR; 11186e790746SPaolo Bonzini } 11196e790746SPaolo Bonzini 1120cae2e556SAmos Kong int in_use = 0; 1121cae2e556SAmos Kong int first_multi = 0; 1122cae2e556SAmos Kong uint8_t uni_overflow = 0; 1123cae2e556SAmos Kong uint8_t multi_overflow = 0; 1124cae2e556SAmos Kong uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 11256e790746SPaolo Bonzini 11266e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 11276e790746SPaolo Bonzini sizeof(mac_data.entries)); 11281399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 11296e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1130b1be4280SAmos Kong goto error; 11316e790746SPaolo Bonzini } 11326e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 11336e790746SPaolo Bonzini 11346e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) { 1135b1be4280SAmos Kong goto error; 11366e790746SPaolo Bonzini } 11376e790746SPaolo Bonzini 11386e790746SPaolo Bonzini if (mac_data.entries <= MAC_TABLE_ENTRIES) { 1139cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, macs, 11406e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 11416e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1142b1be4280SAmos Kong goto error; 11436e790746SPaolo Bonzini } 1144cae2e556SAmos Kong in_use += mac_data.entries; 11456e790746SPaolo Bonzini } else { 1146cae2e556SAmos Kong uni_overflow = 1; 11476e790746SPaolo Bonzini } 11486e790746SPaolo Bonzini 11496e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN); 11506e790746SPaolo Bonzini 1151cae2e556SAmos Kong first_multi = in_use; 11526e790746SPaolo Bonzini 11536e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries, 11546e790746SPaolo Bonzini sizeof(mac_data.entries)); 11551399c60dSRusty Russell mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries); 11566e790746SPaolo Bonzini if (s != sizeof(mac_data.entries)) { 1157b1be4280SAmos Kong goto error; 11586e790746SPaolo Bonzini } 11596e790746SPaolo Bonzini 11606e790746SPaolo Bonzini iov_discard_front(&iov, &iov_cnt, s); 11616e790746SPaolo Bonzini 11626e790746SPaolo Bonzini if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) { 1163b1be4280SAmos Kong goto error; 11646e790746SPaolo Bonzini } 11656e790746SPaolo Bonzini 1166edc24385SMichael S. Tsirkin if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) { 1167cae2e556SAmos Kong s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN], 11686e790746SPaolo Bonzini mac_data.entries * ETH_ALEN); 11696e790746SPaolo Bonzini if (s != mac_data.entries * ETH_ALEN) { 1170b1be4280SAmos Kong goto error; 11716e790746SPaolo Bonzini } 1172cae2e556SAmos Kong in_use += mac_data.entries; 11736e790746SPaolo Bonzini } else { 1174cae2e556SAmos Kong multi_overflow = 1; 11756e790746SPaolo Bonzini } 11766e790746SPaolo Bonzini 1177cae2e556SAmos Kong n->mac_table.in_use = in_use; 1178cae2e556SAmos Kong n->mac_table.first_multi = first_multi; 1179cae2e556SAmos Kong n->mac_table.uni_overflow = uni_overflow; 1180cae2e556SAmos Kong n->mac_table.multi_overflow = multi_overflow; 1181cae2e556SAmos Kong memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN); 1182cae2e556SAmos Kong g_free(macs); 1183b1be4280SAmos Kong rxfilter_notify(nc); 1184b1be4280SAmos Kong 11856e790746SPaolo Bonzini return VIRTIO_NET_OK; 1186b1be4280SAmos Kong 1187b1be4280SAmos Kong error: 1188cae2e556SAmos Kong g_free(macs); 1189b1be4280SAmos Kong return VIRTIO_NET_ERR; 11906e790746SPaolo Bonzini } 11916e790746SPaolo Bonzini 11926e790746SPaolo Bonzini static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd, 11936e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 11946e790746SPaolo Bonzini { 11951399c60dSRusty Russell VirtIODevice *vdev = VIRTIO_DEVICE(n); 11966e790746SPaolo Bonzini uint16_t vid; 11976e790746SPaolo Bonzini size_t s; 1198b1be4280SAmos Kong NetClientState *nc = qemu_get_queue(n->nic); 11996e790746SPaolo Bonzini 12006e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid)); 12011399c60dSRusty Russell vid = virtio_lduw_p(vdev, &vid); 12026e790746SPaolo Bonzini if (s != sizeof(vid)) { 12036e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12046e790746SPaolo Bonzini } 12056e790746SPaolo Bonzini 12066e790746SPaolo Bonzini if (vid >= MAX_VLAN) 12076e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12086e790746SPaolo Bonzini 12096e790746SPaolo Bonzini if (cmd == VIRTIO_NET_CTRL_VLAN_ADD) 12106e790746SPaolo Bonzini n->vlans[vid >> 5] |= (1U << (vid & 0x1f)); 12116e790746SPaolo Bonzini else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL) 12126e790746SPaolo Bonzini n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f)); 12136e790746SPaolo Bonzini else 12146e790746SPaolo Bonzini return VIRTIO_NET_ERR; 12156e790746SPaolo Bonzini 1216b1be4280SAmos Kong rxfilter_notify(nc); 1217b1be4280SAmos Kong 12186e790746SPaolo Bonzini return VIRTIO_NET_OK; 12196e790746SPaolo Bonzini } 12206e790746SPaolo Bonzini 1221f57fcf70SJason Wang static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd, 1222f57fcf70SJason Wang struct iovec *iov, unsigned int iov_cnt) 1223f57fcf70SJason Wang { 12249d8c6a25SDr. David Alan Gilbert trace_virtio_net_handle_announce(n->announce_timer.round); 1225f57fcf70SJason Wang if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK && 1226f57fcf70SJason Wang n->status & VIRTIO_NET_S_ANNOUNCE) { 1227f57fcf70SJason Wang n->status &= ~VIRTIO_NET_S_ANNOUNCE; 12289d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 12299d8c6a25SDr. David Alan Gilbert qemu_announce_timer_step(&n->announce_timer); 1230f57fcf70SJason Wang } 1231f57fcf70SJason Wang return VIRTIO_NET_OK; 1232f57fcf70SJason Wang } else { 1233f57fcf70SJason Wang return VIRTIO_NET_ERR; 1234f57fcf70SJason Wang } 1235f57fcf70SJason Wang } 1236f57fcf70SJason Wang 12370145c393SAndrew Melnychenko static bool virtio_net_attach_ebpf_to_backend(NICState *nic, int prog_fd) 12380145c393SAndrew Melnychenko { 12390145c393SAndrew Melnychenko NetClientState *nc = qemu_get_peer(qemu_get_queue(nic), 0); 12400145c393SAndrew Melnychenko if (nc == NULL || nc->info->set_steering_ebpf == NULL) { 12410145c393SAndrew Melnychenko return false; 12420145c393SAndrew Melnychenko } 12430145c393SAndrew Melnychenko 1244*ae311fb3SDaniel P. Berrangé trace_virtio_net_rss_attach_ebpf(nic, prog_fd); 12450145c393SAndrew Melnychenko return nc->info->set_steering_ebpf(nc, prog_fd); 12460145c393SAndrew Melnychenko } 12470145c393SAndrew Melnychenko 12480145c393SAndrew Melnychenko static void rss_data_to_rss_config(struct VirtioNetRssData *data, 12490145c393SAndrew Melnychenko struct EBPFRSSConfig *config) 12500145c393SAndrew Melnychenko { 12510145c393SAndrew Melnychenko config->redirect = data->redirect; 12520145c393SAndrew Melnychenko config->populate_hash = data->populate_hash; 12530145c393SAndrew Melnychenko config->hash_types = data->hash_types; 12540145c393SAndrew Melnychenko config->indirections_len = data->indirections_len; 12550145c393SAndrew Melnychenko config->default_queue = data->default_queue; 12560145c393SAndrew Melnychenko } 12570145c393SAndrew Melnychenko 1258493a2403SDaniel P. Berrangé static bool virtio_net_attach_ebpf_rss(VirtIONet *n) 12590145c393SAndrew Melnychenko { 12600145c393SAndrew Melnychenko struct EBPFRSSConfig config = {}; 12610145c393SAndrew Melnychenko 12620145c393SAndrew Melnychenko if (!ebpf_rss_is_loaded(&n->ebpf_rss)) { 12630145c393SAndrew Melnychenko return false; 12640145c393SAndrew Melnychenko } 12650145c393SAndrew Melnychenko 12660145c393SAndrew Melnychenko rss_data_to_rss_config(&n->rss_data, &config); 12670145c393SAndrew Melnychenko 12680145c393SAndrew Melnychenko if (!ebpf_rss_set_all(&n->ebpf_rss, &config, 126900b69f1dSDaniel P. Berrangé n->rss_data.indirections_table, n->rss_data.key, 127000b69f1dSDaniel P. Berrangé NULL)) { 12710145c393SAndrew Melnychenko return false; 12720145c393SAndrew Melnychenko } 12730145c393SAndrew Melnychenko 12740145c393SAndrew Melnychenko if (!virtio_net_attach_ebpf_to_backend(n->nic, n->ebpf_rss.program_fd)) { 12750145c393SAndrew Melnychenko return false; 12760145c393SAndrew Melnychenko } 12770145c393SAndrew Melnychenko 12780145c393SAndrew Melnychenko return true; 12790145c393SAndrew Melnychenko } 12800145c393SAndrew Melnychenko 1281493a2403SDaniel P. Berrangé static void virtio_net_detach_ebpf_rss(VirtIONet *n) 12820145c393SAndrew Melnychenko { 12830145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 12840145c393SAndrew Melnychenko } 12850145c393SAndrew Melnychenko 12860e07198eSAkihiko Odaki static void virtio_net_commit_rss_config(VirtIONet *n) 12870e07198eSAkihiko Odaki { 12880e07198eSAkihiko Odaki if (n->rss_data.enabled) { 12890e07198eSAkihiko Odaki n->rss_data.enabled_software_rss = n->rss_data.populate_hash; 12900e07198eSAkihiko Odaki if (n->rss_data.populate_hash) { 1291493a2403SDaniel P. Berrangé virtio_net_detach_ebpf_rss(n); 1292493a2403SDaniel P. Berrangé } else if (!virtio_net_attach_ebpf_rss(n)) { 12930e07198eSAkihiko Odaki if (get_vhost_net(qemu_get_queue(n->nic)->peer)) { 12940e07198eSAkihiko Odaki warn_report("Can't load eBPF RSS for vhost"); 12950e07198eSAkihiko Odaki } else { 12960e07198eSAkihiko Odaki warn_report("Can't load eBPF RSS - fallback to software RSS"); 12970e07198eSAkihiko Odaki n->rss_data.enabled_software_rss = true; 12980e07198eSAkihiko Odaki } 12990e07198eSAkihiko Odaki } 13000e07198eSAkihiko Odaki 1301*ae311fb3SDaniel P. Berrangé trace_virtio_net_rss_enable(n, 1302*ae311fb3SDaniel P. Berrangé n->rss_data.hash_types, 13030e07198eSAkihiko Odaki n->rss_data.indirections_len, 13040e07198eSAkihiko Odaki sizeof(n->rss_data.key)); 13050e07198eSAkihiko Odaki } else { 1306493a2403SDaniel P. Berrangé virtio_net_detach_ebpf_rss(n); 1307*ae311fb3SDaniel P. Berrangé trace_virtio_net_rss_disable(n); 13080e07198eSAkihiko Odaki } 13090e07198eSAkihiko Odaki } 13100e07198eSAkihiko Odaki 13110e07198eSAkihiko Odaki static void virtio_net_disable_rss(VirtIONet *n) 13120e07198eSAkihiko Odaki { 13130e07198eSAkihiko Odaki if (!n->rss_data.enabled) { 13140e07198eSAkihiko Odaki return; 13150e07198eSAkihiko Odaki } 13160e07198eSAkihiko Odaki 13170e07198eSAkihiko Odaki n->rss_data.enabled = false; 13180e07198eSAkihiko Odaki virtio_net_commit_rss_config(n); 13190e07198eSAkihiko Odaki } 13200e07198eSAkihiko Odaki 1321b5900dffSDaniel P. Berrangé static bool virtio_net_load_ebpf_fds(VirtIONet *n, Error **errp) 13220145c393SAndrew Melnychenko { 13236b230b7dSAndrew Melnychenko int fds[EBPF_RSS_MAX_FDS] = { [0 ... EBPF_RSS_MAX_FDS - 1] = -1}; 13246b230b7dSAndrew Melnychenko int ret = true; 13256b230b7dSAndrew Melnychenko int i = 0; 13266b230b7dSAndrew Melnychenko 13276b230b7dSAndrew Melnychenko if (n->nr_ebpf_rss_fds != EBPF_RSS_MAX_FDS) { 1328b5900dffSDaniel P. Berrangé error_setg(errp, "Expected %d file descriptors but got %d", 13296b230b7dSAndrew Melnychenko EBPF_RSS_MAX_FDS, n->nr_ebpf_rss_fds); 13300145c393SAndrew Melnychenko return false; 13310145c393SAndrew Melnychenko } 13320145c393SAndrew Melnychenko 13336b230b7dSAndrew Melnychenko for (i = 0; i < n->nr_ebpf_rss_fds; i++) { 1334b5900dffSDaniel P. Berrangé fds[i] = monitor_fd_param(monitor_cur(), n->ebpf_rss_fds[i], errp); 1335283be596SAkihiko Odaki if (fds[i] < 0) { 13366b230b7dSAndrew Melnychenko ret = false; 13376b230b7dSAndrew Melnychenko goto exit; 13386b230b7dSAndrew Melnychenko } 13396b230b7dSAndrew Melnychenko } 13406b230b7dSAndrew Melnychenko 1341b5900dffSDaniel P. Berrangé ret = ebpf_rss_load_fds(&n->ebpf_rss, fds[0], fds[1], fds[2], fds[3], errp); 13426b230b7dSAndrew Melnychenko 13436b230b7dSAndrew Melnychenko exit: 1344283be596SAkihiko Odaki if (!ret) { 13456b230b7dSAndrew Melnychenko for (i = 0; i < n->nr_ebpf_rss_fds && fds[i] != -1; i++) { 13466b230b7dSAndrew Melnychenko close(fds[i]); 13476b230b7dSAndrew Melnychenko } 13486b230b7dSAndrew Melnychenko } 13496b230b7dSAndrew Melnychenko 13506b230b7dSAndrew Melnychenko return ret; 13516b230b7dSAndrew Melnychenko } 13526b230b7dSAndrew Melnychenko 1353b5900dffSDaniel P. Berrangé static bool virtio_net_load_ebpf(VirtIONet *n, Error **errp) 13546b230b7dSAndrew Melnychenko { 13556b230b7dSAndrew Melnychenko bool ret = false; 13566b230b7dSAndrew Melnychenko 13576b230b7dSAndrew Melnychenko if (virtio_net_attach_ebpf_to_backend(n->nic, -1)) { 1358*ae311fb3SDaniel P. Berrangé trace_virtio_net_rss_load(n, n->nr_ebpf_rss_fds, n->ebpf_rss_fds); 1359b5900dffSDaniel P. Berrangé if (n->ebpf_rss_fds) { 1360b5900dffSDaniel P. Berrangé ret = virtio_net_load_ebpf_fds(n, errp); 1361b5900dffSDaniel P. Berrangé } else { 1362b5900dffSDaniel P. Berrangé ret = ebpf_rss_load(&n->ebpf_rss, errp); 13636b230b7dSAndrew Melnychenko } 13646b230b7dSAndrew Melnychenko } 13656b230b7dSAndrew Melnychenko 13666b230b7dSAndrew Melnychenko return ret; 13670145c393SAndrew Melnychenko } 13680145c393SAndrew Melnychenko 13690145c393SAndrew Melnychenko static void virtio_net_unload_ebpf(VirtIONet *n) 13700145c393SAndrew Melnychenko { 13710145c393SAndrew Melnychenko virtio_net_attach_ebpf_to_backend(n->nic, -1); 13720145c393SAndrew Melnychenko ebpf_rss_unload(&n->ebpf_rss); 137359079029SYuri Benditovich } 137459079029SYuri Benditovich 137559079029SYuri Benditovich static uint16_t virtio_net_handle_rss(VirtIONet *n, 1376e22f0603SYuri Benditovich struct iovec *iov, 1377e22f0603SYuri Benditovich unsigned int iov_cnt, 1378e22f0603SYuri Benditovich bool do_rss) 137959079029SYuri Benditovich { 138059079029SYuri Benditovich VirtIODevice *vdev = VIRTIO_DEVICE(n); 138159079029SYuri Benditovich struct virtio_net_rss_config cfg; 138259079029SYuri Benditovich size_t s, offset = 0, size_get; 1383441537f1SJason Wang uint16_t queue_pairs, i; 138459079029SYuri Benditovich struct { 138559079029SYuri Benditovich uint16_t us; 138659079029SYuri Benditovich uint8_t b; 138759079029SYuri Benditovich } QEMU_PACKED temp; 138859079029SYuri Benditovich const char *err_msg = ""; 138959079029SYuri Benditovich uint32_t err_value = 0; 139059079029SYuri Benditovich 1391e22f0603SYuri Benditovich if (do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_RSS)) { 139259079029SYuri Benditovich err_msg = "RSS is not negotiated"; 139359079029SYuri Benditovich goto error; 139459079029SYuri Benditovich } 1395e22f0603SYuri Benditovich if (!do_rss && !virtio_vdev_has_feature(vdev, VIRTIO_NET_F_HASH_REPORT)) { 1396e22f0603SYuri Benditovich err_msg = "Hash report is not negotiated"; 1397e22f0603SYuri Benditovich goto error; 1398e22f0603SYuri Benditovich } 139959079029SYuri Benditovich size_get = offsetof(struct virtio_net_rss_config, indirection_table); 140059079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &cfg, size_get); 140159079029SYuri Benditovich if (s != size_get) { 140259079029SYuri Benditovich err_msg = "Short command buffer"; 140359079029SYuri Benditovich err_value = (uint32_t)s; 140459079029SYuri Benditovich goto error; 140559079029SYuri Benditovich } 140659079029SYuri Benditovich n->rss_data.hash_types = virtio_ldl_p(vdev, &cfg.hash_types); 140759079029SYuri Benditovich n->rss_data.indirections_len = 140859079029SYuri Benditovich virtio_lduw_p(vdev, &cfg.indirection_table_mask); 140959079029SYuri Benditovich n->rss_data.indirections_len++; 1410e22f0603SYuri Benditovich if (!do_rss) { 1411e22f0603SYuri Benditovich n->rss_data.indirections_len = 1; 1412e22f0603SYuri Benditovich } 141359079029SYuri Benditovich if (!is_power_of_2(n->rss_data.indirections_len)) { 141459079029SYuri Benditovich err_msg = "Invalid size of indirection table"; 141559079029SYuri Benditovich err_value = n->rss_data.indirections_len; 141659079029SYuri Benditovich goto error; 141759079029SYuri Benditovich } 141859079029SYuri Benditovich if (n->rss_data.indirections_len > VIRTIO_NET_RSS_MAX_TABLE_LEN) { 141959079029SYuri Benditovich err_msg = "Too large indirection table"; 142059079029SYuri Benditovich err_value = n->rss_data.indirections_len; 142159079029SYuri Benditovich goto error; 142259079029SYuri Benditovich } 1423e22f0603SYuri Benditovich n->rss_data.default_queue = do_rss ? 1424e22f0603SYuri Benditovich virtio_lduw_p(vdev, &cfg.unclassified_queue) : 0; 1425441537f1SJason Wang if (n->rss_data.default_queue >= n->max_queue_pairs) { 142659079029SYuri Benditovich err_msg = "Invalid default queue"; 142759079029SYuri Benditovich err_value = n->rss_data.default_queue; 142859079029SYuri Benditovich goto error; 142959079029SYuri Benditovich } 143059079029SYuri Benditovich offset += size_get; 143159079029SYuri Benditovich size_get = sizeof(uint16_t) * n->rss_data.indirections_len; 143259079029SYuri Benditovich g_free(n->rss_data.indirections_table); 143359079029SYuri Benditovich n->rss_data.indirections_table = g_malloc(size_get); 143459079029SYuri Benditovich if (!n->rss_data.indirections_table) { 143559079029SYuri Benditovich err_msg = "Can't allocate indirections table"; 143659079029SYuri Benditovich err_value = n->rss_data.indirections_len; 143759079029SYuri Benditovich goto error; 143859079029SYuri Benditovich } 143959079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, 144059079029SYuri Benditovich n->rss_data.indirections_table, size_get); 144159079029SYuri Benditovich if (s != size_get) { 144259079029SYuri Benditovich err_msg = "Short indirection table buffer"; 144359079029SYuri Benditovich err_value = (uint32_t)s; 144459079029SYuri Benditovich goto error; 144559079029SYuri Benditovich } 144659079029SYuri Benditovich for (i = 0; i < n->rss_data.indirections_len; ++i) { 144759079029SYuri Benditovich uint16_t val = n->rss_data.indirections_table[i]; 144859079029SYuri Benditovich n->rss_data.indirections_table[i] = virtio_lduw_p(vdev, &val); 144959079029SYuri Benditovich } 145059079029SYuri Benditovich offset += size_get; 145159079029SYuri Benditovich size_get = sizeof(temp); 145259079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, &temp, size_get); 145359079029SYuri Benditovich if (s != size_get) { 1454441537f1SJason Wang err_msg = "Can't get queue_pairs"; 145559079029SYuri Benditovich err_value = (uint32_t)s; 145659079029SYuri Benditovich goto error; 145759079029SYuri Benditovich } 1458441537f1SJason Wang queue_pairs = do_rss ? virtio_lduw_p(vdev, &temp.us) : n->curr_queue_pairs; 1459441537f1SJason Wang if (queue_pairs == 0 || queue_pairs > n->max_queue_pairs) { 1460441537f1SJason Wang err_msg = "Invalid number of queue_pairs"; 1461441537f1SJason Wang err_value = queue_pairs; 146259079029SYuri Benditovich goto error; 146359079029SYuri Benditovich } 146459079029SYuri Benditovich if (temp.b > VIRTIO_NET_RSS_MAX_KEY_SIZE) { 146559079029SYuri Benditovich err_msg = "Invalid key size"; 146659079029SYuri Benditovich err_value = temp.b; 146759079029SYuri Benditovich goto error; 146859079029SYuri Benditovich } 146959079029SYuri Benditovich if (!temp.b && n->rss_data.hash_types) { 147059079029SYuri Benditovich err_msg = "No key provided"; 147159079029SYuri Benditovich err_value = 0; 147259079029SYuri Benditovich goto error; 147359079029SYuri Benditovich } 147459079029SYuri Benditovich if (!temp.b && !n->rss_data.hash_types) { 147559079029SYuri Benditovich virtio_net_disable_rss(n); 1476441537f1SJason Wang return queue_pairs; 147759079029SYuri Benditovich } 147859079029SYuri Benditovich offset += size_get; 147959079029SYuri Benditovich size_get = temp.b; 148059079029SYuri Benditovich s = iov_to_buf(iov, iov_cnt, offset, n->rss_data.key, size_get); 148159079029SYuri Benditovich if (s != size_get) { 148259079029SYuri Benditovich err_msg = "Can get key buffer"; 148359079029SYuri Benditovich err_value = (uint32_t)s; 148459079029SYuri Benditovich goto error; 148559079029SYuri Benditovich } 148659079029SYuri Benditovich n->rss_data.enabled = true; 14870e07198eSAkihiko Odaki virtio_net_commit_rss_config(n); 1488441537f1SJason Wang return queue_pairs; 148959079029SYuri Benditovich error: 1490*ae311fb3SDaniel P. Berrangé trace_virtio_net_rss_error(n, err_msg, err_value); 149159079029SYuri Benditovich virtio_net_disable_rss(n); 149259079029SYuri Benditovich return 0; 149359079029SYuri Benditovich } 149459079029SYuri Benditovich 14956e790746SPaolo Bonzini static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd, 14966e790746SPaolo Bonzini struct iovec *iov, unsigned int iov_cnt) 14976e790746SPaolo Bonzini { 149817a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1499441537f1SJason Wang uint16_t queue_pairs; 15002a7888ccSSi-Wei Liu NetClientState *nc = qemu_get_queue(n->nic); 15016e790746SPaolo Bonzini 150259079029SYuri Benditovich virtio_net_disable_rss(n); 1503e22f0603SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_HASH_CONFIG) { 1504441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, false); 1505441537f1SJason Wang return queue_pairs ? VIRTIO_NET_OK : VIRTIO_NET_ERR; 1506e22f0603SYuri Benditovich } 150759079029SYuri Benditovich if (cmd == VIRTIO_NET_CTRL_MQ_RSS_CONFIG) { 1508441537f1SJason Wang queue_pairs = virtio_net_handle_rss(n, iov, iov_cnt, true); 150959079029SYuri Benditovich } else if (cmd == VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) { 151059079029SYuri Benditovich struct virtio_net_ctrl_mq mq; 151159079029SYuri Benditovich size_t s; 151259079029SYuri Benditovich if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_MQ)) { 151359079029SYuri Benditovich return VIRTIO_NET_ERR; 151459079029SYuri Benditovich } 15156e790746SPaolo Bonzini s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq)); 15166e790746SPaolo Bonzini if (s != sizeof(mq)) { 15176e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15186e790746SPaolo Bonzini } 1519441537f1SJason Wang queue_pairs = virtio_lduw_p(vdev, &mq.virtqueue_pairs); 15206e790746SPaolo Bonzini 152159079029SYuri Benditovich } else { 15226e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15236e790746SPaolo Bonzini } 15246e790746SPaolo Bonzini 1525441537f1SJason Wang if (queue_pairs < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN || 1526441537f1SJason Wang queue_pairs > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX || 1527441537f1SJason Wang queue_pairs > n->max_queue_pairs || 15286e790746SPaolo Bonzini !n->multiqueue) { 15296e790746SPaolo Bonzini return VIRTIO_NET_ERR; 15306e790746SPaolo Bonzini } 15316e790746SPaolo Bonzini 1532441537f1SJason Wang n->curr_queue_pairs = queue_pairs; 1533ca8717f9SEugenio Pérez if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 1534ca8717f9SEugenio Pérez /* 1535ca8717f9SEugenio Pérez * Avoid updating the backend for a vdpa device: We're only interested 1536ca8717f9SEugenio Pérez * in updating the device model queues. 1537ca8717f9SEugenio Pérez */ 1538ca8717f9SEugenio Pérez return VIRTIO_NET_OK; 1539ca8717f9SEugenio Pérez } 1540441537f1SJason Wang /* stop the backend before changing the number of queue_pairs to avoid handling a 15416e790746SPaolo Bonzini * disabled queue */ 154217a0ca55SKONRAD Frederic virtio_net_set_status(vdev, vdev->status); 1543441537f1SJason Wang virtio_net_set_queue_pairs(n); 15446e790746SPaolo Bonzini 15456e790746SPaolo Bonzini return VIRTIO_NET_OK; 15466e790746SPaolo Bonzini } 1547ba7eadb5SGreg Kurz 1548640b8a1cSEugenio Pérez size_t virtio_net_handle_ctrl_iov(VirtIODevice *vdev, 1549640b8a1cSEugenio Pérez const struct iovec *in_sg, unsigned in_num, 1550640b8a1cSEugenio Pérez const struct iovec *out_sg, 1551640b8a1cSEugenio Pérez unsigned out_num) 15526e790746SPaolo Bonzini { 155317a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 15546e790746SPaolo Bonzini struct virtio_net_ctrl_hdr ctrl; 15556e790746SPaolo Bonzini virtio_net_ctrl_ack status = VIRTIO_NET_ERR; 15566e790746SPaolo Bonzini size_t s; 1557771b6ed3SJason Wang struct iovec *iov, *iov2; 1558640b8a1cSEugenio Pérez 1559640b8a1cSEugenio Pérez if (iov_size(in_sg, in_num) < sizeof(status) || 1560640b8a1cSEugenio Pérez iov_size(out_sg, out_num) < sizeof(ctrl)) { 1561640b8a1cSEugenio Pérez virtio_error(vdev, "virtio-net ctrl missing headers"); 1562640b8a1cSEugenio Pérez return 0; 1563640b8a1cSEugenio Pérez } 1564640b8a1cSEugenio Pérez 1565640b8a1cSEugenio Pérez iov2 = iov = g_memdup2(out_sg, sizeof(struct iovec) * out_num); 1566640b8a1cSEugenio Pérez s = iov_to_buf(iov, out_num, 0, &ctrl, sizeof(ctrl)); 1567640b8a1cSEugenio Pérez iov_discard_front(&iov, &out_num, sizeof(ctrl)); 1568640b8a1cSEugenio Pérez if (s != sizeof(ctrl)) { 1569640b8a1cSEugenio Pérez status = VIRTIO_NET_ERR; 1570640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_RX) { 1571640b8a1cSEugenio Pérez status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, out_num); 1572640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) { 1573640b8a1cSEugenio Pérez status = virtio_net_handle_mac(n, ctrl.cmd, iov, out_num); 1574640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) { 1575640b8a1cSEugenio Pérez status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, out_num); 1576640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) { 1577640b8a1cSEugenio Pérez status = virtio_net_handle_announce(n, ctrl.cmd, iov, out_num); 1578640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) { 1579640b8a1cSEugenio Pérez status = virtio_net_handle_mq(n, ctrl.cmd, iov, out_num); 1580640b8a1cSEugenio Pérez } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) { 1581640b8a1cSEugenio Pérez status = virtio_net_handle_offloads(n, ctrl.cmd, iov, out_num); 1582640b8a1cSEugenio Pérez } 1583640b8a1cSEugenio Pérez 1584640b8a1cSEugenio Pérez s = iov_from_buf(in_sg, in_num, 0, &status, sizeof(status)); 1585640b8a1cSEugenio Pérez assert(s == sizeof(status)); 1586640b8a1cSEugenio Pérez 1587640b8a1cSEugenio Pérez g_free(iov2); 1588640b8a1cSEugenio Pérez return sizeof(status); 1589640b8a1cSEugenio Pérez } 1590640b8a1cSEugenio Pérez 1591640b8a1cSEugenio Pérez static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq) 1592640b8a1cSEugenio Pérez { 1593640b8a1cSEugenio Pérez VirtQueueElement *elem; 15946e790746SPaolo Bonzini 159551b19ebeSPaolo Bonzini for (;;) { 1596640b8a1cSEugenio Pérez size_t written; 159751b19ebeSPaolo Bonzini elem = virtqueue_pop(vq, sizeof(VirtQueueElement)); 159851b19ebeSPaolo Bonzini if (!elem) { 159951b19ebeSPaolo Bonzini break; 160051b19ebeSPaolo Bonzini } 1601640b8a1cSEugenio Pérez 1602640b8a1cSEugenio Pérez written = virtio_net_handle_ctrl_iov(vdev, elem->in_sg, elem->in_num, 1603640b8a1cSEugenio Pérez elem->out_sg, elem->out_num); 1604640b8a1cSEugenio Pérez if (written > 0) { 1605640b8a1cSEugenio Pérez virtqueue_push(vq, elem, written); 1606640b8a1cSEugenio Pérez virtio_notify(vdev, vq); 1607640b8a1cSEugenio Pérez g_free(elem); 1608640b8a1cSEugenio Pérez } else { 1609ba7eadb5SGreg Kurz virtqueue_detach_element(vq, elem, 0); 1610ba7eadb5SGreg Kurz g_free(elem); 1611ba7eadb5SGreg Kurz break; 16126e790746SPaolo Bonzini } 16136e790746SPaolo Bonzini } 16146e790746SPaolo Bonzini } 16156e790746SPaolo Bonzini 16166e790746SPaolo Bonzini /* RX */ 16176e790746SPaolo Bonzini 16186e790746SPaolo Bonzini static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq) 16196e790746SPaolo Bonzini { 162017a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 16216e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(vq)); 16226e790746SPaolo Bonzini 16236e790746SPaolo Bonzini qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index)); 16246e790746SPaolo Bonzini } 16256e790746SPaolo Bonzini 1626b8c4b67eSPhilippe Mathieu-Daudé static bool virtio_net_can_receive(NetClientState *nc) 16276e790746SPaolo Bonzini { 16286e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 162917a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 16306e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 16316e790746SPaolo Bonzini 163217a0ca55SKONRAD Frederic if (!vdev->vm_running) { 1633b8c4b67eSPhilippe Mathieu-Daudé return false; 16346e790746SPaolo Bonzini } 16356e790746SPaolo Bonzini 1636441537f1SJason Wang if (nc->queue_index >= n->curr_queue_pairs) { 1637b8c4b67eSPhilippe Mathieu-Daudé return false; 16386e790746SPaolo Bonzini } 16396e790746SPaolo Bonzini 16406e790746SPaolo Bonzini if (!virtio_queue_ready(q->rx_vq) || 164117a0ca55SKONRAD Frederic !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 1642b8c4b67eSPhilippe Mathieu-Daudé return false; 16436e790746SPaolo Bonzini } 16446e790746SPaolo Bonzini 1645b8c4b67eSPhilippe Mathieu-Daudé return true; 16466e790746SPaolo Bonzini } 16476e790746SPaolo Bonzini 16486e790746SPaolo Bonzini static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize) 16496e790746SPaolo Bonzini { 1650f937309fSthomas int opaque; 1651f937309fSthomas unsigned int in_bytes; 16526e790746SPaolo Bonzini VirtIONet *n = q->n; 16536e790746SPaolo Bonzini 1654f937309fSthomas while (virtio_queue_empty(q->rx_vq) || n->mergeable_rx_bufs) { 1655f937309fSthomas opaque = virtqueue_get_avail_bytes(q->rx_vq, &in_bytes, NULL, 1656f937309fSthomas bufsize, 0); 1657f937309fSthomas /* Buffer is enough, disable notifiaction */ 1658f937309fSthomas if (bufsize <= in_bytes) { 1659f937309fSthomas break; 1660f937309fSthomas } 1661f937309fSthomas 1662f937309fSthomas if (virtio_queue_enable_notification_and_check(q->rx_vq, opaque)) { 1663f937309fSthomas /* Guest has added some buffers, try again */ 1664f937309fSthomas continue; 1665f937309fSthomas } else { 16666e790746SPaolo Bonzini return 0; 16676e790746SPaolo Bonzini } 16686e790746SPaolo Bonzini } 16696e790746SPaolo Bonzini 16706e790746SPaolo Bonzini virtio_queue_set_notification(q->rx_vq, 0); 1671f937309fSthomas 16726e790746SPaolo Bonzini return 1; 16736e790746SPaolo Bonzini } 16746e790746SPaolo Bonzini 16751399c60dSRusty Russell static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr) 1676032a74a1SCédric Le Goater { 16771399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->hdr_len); 16781399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->gso_size); 16791399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_start); 16801399c60dSRusty Russell virtio_tswap16s(vdev, &hdr->csum_offset); 1681032a74a1SCédric Le Goater } 1682032a74a1SCédric Le Goater 16836e790746SPaolo Bonzini /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so 16846e790746SPaolo Bonzini * it never finds out that the packets don't have valid checksums. This 16856e790746SPaolo Bonzini * causes dhclient to get upset. Fedora's carried a patch for ages to 16866e790746SPaolo Bonzini * fix this with Xen but it hasn't appeared in an upstream release of 16876e790746SPaolo Bonzini * dhclient yet. 16886e790746SPaolo Bonzini * 16896e790746SPaolo Bonzini * To avoid breaking existing guests, we catch udp packets and add 16906e790746SPaolo Bonzini * checksums. This is terrible but it's better than hacking the guest 16916e790746SPaolo Bonzini * kernels. 16926e790746SPaolo Bonzini * 16936e790746SPaolo Bonzini * N.B. if we introduce a zero-copy API, this operation is no longer free so 16946e790746SPaolo Bonzini * we should provide a mechanism to disable it to avoid polluting the host 16956e790746SPaolo Bonzini * cache. 16966e790746SPaolo Bonzini */ 16976e790746SPaolo Bonzini static void work_around_broken_dhclient(struct virtio_net_hdr *hdr, 16986e790746SPaolo Bonzini uint8_t *buf, size_t size) 16996e790746SPaolo Bonzini { 17006e790746SPaolo Bonzini if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */ 17016e790746SPaolo Bonzini (size > 27 && size < 1500) && /* normal sized MTU */ 17026e790746SPaolo Bonzini (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */ 17036e790746SPaolo Bonzini (buf[23] == 17) && /* ip.protocol == UDP */ 17046e790746SPaolo Bonzini (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */ 1705f5746335SBin Meng net_checksum_calculate(buf, size, CSUM_UDP); 17066e790746SPaolo Bonzini hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM; 17076e790746SPaolo Bonzini } 17086e790746SPaolo Bonzini } 17096e790746SPaolo Bonzini 17106e790746SPaolo Bonzini static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt, 17116e790746SPaolo Bonzini const void *buf, size_t size) 17126e790746SPaolo Bonzini { 17136e790746SPaolo Bonzini if (n->has_vnet_hdr) { 17146e790746SPaolo Bonzini /* FIXME this cast is evil */ 17156e790746SPaolo Bonzini void *wbuf = (void *)buf; 17166e790746SPaolo Bonzini work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len, 17176e790746SPaolo Bonzini size - n->host_hdr_len); 17181bfa316cSGreg Kurz 17191bfa316cSGreg Kurz if (n->needs_vnet_hdr_swap) { 17201399c60dSRusty Russell virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf); 17211bfa316cSGreg Kurz } 17226e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr)); 17236e790746SPaolo Bonzini } else { 17246e790746SPaolo Bonzini struct virtio_net_hdr hdr = { 17256e790746SPaolo Bonzini .flags = 0, 17266e790746SPaolo Bonzini .gso_type = VIRTIO_NET_HDR_GSO_NONE 17276e790746SPaolo Bonzini }; 17286e790746SPaolo Bonzini iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr); 17296e790746SPaolo Bonzini } 17306e790746SPaolo Bonzini } 17316e790746SPaolo Bonzini 17326e790746SPaolo Bonzini static int receive_filter(VirtIONet *n, const uint8_t *buf, int size) 17336e790746SPaolo Bonzini { 17346e790746SPaolo Bonzini static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff}; 17356e790746SPaolo Bonzini static const uint8_t vlan[] = {0x81, 0x00}; 17366e790746SPaolo Bonzini uint8_t *ptr = (uint8_t *)buf; 17376e790746SPaolo Bonzini int i; 17386e790746SPaolo Bonzini 17396e790746SPaolo Bonzini if (n->promisc) 17406e790746SPaolo Bonzini return 1; 17416e790746SPaolo Bonzini 17426e790746SPaolo Bonzini ptr += n->host_hdr_len; 17436e790746SPaolo Bonzini 17446e790746SPaolo Bonzini if (!memcmp(&ptr[12], vlan, sizeof(vlan))) { 17457542d3e7SPeter Maydell int vid = lduw_be_p(ptr + 14) & 0xfff; 17466e790746SPaolo Bonzini if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f)))) 17476e790746SPaolo Bonzini return 0; 17486e790746SPaolo Bonzini } 17496e790746SPaolo Bonzini 17506e790746SPaolo Bonzini if (ptr[0] & 1) { // multicast 17516e790746SPaolo Bonzini if (!memcmp(ptr, bcast, sizeof(bcast))) { 17526e790746SPaolo Bonzini return !n->nobcast; 17536e790746SPaolo Bonzini } else if (n->nomulti) { 17546e790746SPaolo Bonzini return 0; 17556e790746SPaolo Bonzini } else if (n->allmulti || n->mac_table.multi_overflow) { 17566e790746SPaolo Bonzini return 1; 17576e790746SPaolo Bonzini } 17586e790746SPaolo Bonzini 17596e790746SPaolo Bonzini for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) { 17606e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 17616e790746SPaolo Bonzini return 1; 17626e790746SPaolo Bonzini } 17636e790746SPaolo Bonzini } 17646e790746SPaolo Bonzini } else { // unicast 17656e790746SPaolo Bonzini if (n->nouni) { 17666e790746SPaolo Bonzini return 0; 17676e790746SPaolo Bonzini } else if (n->alluni || n->mac_table.uni_overflow) { 17686e790746SPaolo Bonzini return 1; 17696e790746SPaolo Bonzini } else if (!memcmp(ptr, n->mac, ETH_ALEN)) { 17706e790746SPaolo Bonzini return 1; 17716e790746SPaolo Bonzini } 17726e790746SPaolo Bonzini 17736e790746SPaolo Bonzini for (i = 0; i < n->mac_table.first_multi; i++) { 17746e790746SPaolo Bonzini if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) { 17756e790746SPaolo Bonzini return 1; 17766e790746SPaolo Bonzini } 17776e790746SPaolo Bonzini } 17786e790746SPaolo Bonzini } 17796e790746SPaolo Bonzini 17806e790746SPaolo Bonzini return 0; 17816e790746SPaolo Bonzini } 17826e790746SPaolo Bonzini 178369ff5ef8SAkihiko Odaki static uint8_t virtio_net_get_hash_type(bool hasip4, 178469ff5ef8SAkihiko Odaki bool hasip6, 178565f474bbSAkihiko Odaki EthL4HdrProto l4hdr_proto, 17864474e37aSYuri Benditovich uint32_t types) 17874474e37aSYuri Benditovich { 178869ff5ef8SAkihiko Odaki if (hasip4) { 178965f474bbSAkihiko Odaki switch (l4hdr_proto) { 179065f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_TCP: 179165f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv4) { 17924474e37aSYuri Benditovich return NetPktRssIpV4Tcp; 17934474e37aSYuri Benditovich } 179465f474bbSAkihiko Odaki break; 179565f474bbSAkihiko Odaki 179665f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_UDP: 179765f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv4) { 17984474e37aSYuri Benditovich return NetPktRssIpV4Udp; 17994474e37aSYuri Benditovich } 180065f474bbSAkihiko Odaki break; 180165f474bbSAkihiko Odaki 180265f474bbSAkihiko Odaki default: 180365f474bbSAkihiko Odaki break; 180465f474bbSAkihiko Odaki } 180565f474bbSAkihiko Odaki 18064474e37aSYuri Benditovich if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv4) { 18074474e37aSYuri Benditovich return NetPktRssIpV4; 18084474e37aSYuri Benditovich } 180969ff5ef8SAkihiko Odaki } else if (hasip6) { 181065f474bbSAkihiko Odaki switch (l4hdr_proto) { 181165f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_TCP: 181265f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCP_EX) { 181365f474bbSAkihiko Odaki return NetPktRssIpV6TcpEx; 181465f474bbSAkihiko Odaki } 181565f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_TCPv6) { 181665f474bbSAkihiko Odaki return NetPktRssIpV6Tcp; 181765f474bbSAkihiko Odaki } 181865f474bbSAkihiko Odaki break; 18194474e37aSYuri Benditovich 182065f474bbSAkihiko Odaki case ETH_L4_HDR_PROTO_UDP: 182165f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDP_EX) { 182265f474bbSAkihiko Odaki return NetPktRssIpV6UdpEx; 18234474e37aSYuri Benditovich } 182465f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_UDPv6) { 182565f474bbSAkihiko Odaki return NetPktRssIpV6Udp; 18264474e37aSYuri Benditovich } 182765f474bbSAkihiko Odaki break; 182865f474bbSAkihiko Odaki 182965f474bbSAkihiko Odaki default: 183065f474bbSAkihiko Odaki break; 183165f474bbSAkihiko Odaki } 183265f474bbSAkihiko Odaki 183365f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_IP_EX) { 183465f474bbSAkihiko Odaki return NetPktRssIpV6Ex; 183565f474bbSAkihiko Odaki } 183665f474bbSAkihiko Odaki if (types & VIRTIO_NET_RSS_HASH_TYPE_IPv6) { 183765f474bbSAkihiko Odaki return NetPktRssIpV6; 18384474e37aSYuri Benditovich } 18394474e37aSYuri Benditovich } 18404474e37aSYuri Benditovich return 0xff; 18414474e37aSYuri Benditovich } 18424474e37aSYuri Benditovich 18434474e37aSYuri Benditovich static int virtio_net_process_rss(NetClientState *nc, const uint8_t *buf, 1844a4c960eeSAkihiko Odaki size_t size, 1845a4c960eeSAkihiko Odaki struct virtio_net_hdr_v1_hash *hdr) 18466e790746SPaolo Bonzini { 18476e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 1848e22f0603SYuri Benditovich unsigned int index = nc->queue_index, new_index = index; 18494474e37aSYuri Benditovich struct NetRxPkt *pkt = n->rx_pkt; 18504474e37aSYuri Benditovich uint8_t net_hash_type; 18514474e37aSYuri Benditovich uint32_t hash; 185265f474bbSAkihiko Odaki bool hasip4, hasip6; 185365f474bbSAkihiko Odaki EthL4HdrProto l4hdr_proto; 1854e22f0603SYuri Benditovich static const uint8_t reports[NetPktRssIpV6UdpEx + 1] = { 1855e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv4, 1856e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv4, 1857e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6, 1858e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6, 1859e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_IPv6_EX, 1860e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_TCPv6_EX, 1861e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv4, 1862e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6, 1863e22f0603SYuri Benditovich VIRTIO_NET_HASH_REPORT_UDPv6_EX 1864e22f0603SYuri Benditovich }; 18652f0fa232SAkihiko Odaki struct iovec iov = { 18662f0fa232SAkihiko Odaki .iov_base = (void *)buf, 18672f0fa232SAkihiko Odaki .iov_len = size 18682f0fa232SAkihiko Odaki }; 18694474e37aSYuri Benditovich 18702f0fa232SAkihiko Odaki net_rx_pkt_set_protocols(pkt, &iov, 1, n->host_hdr_len); 187165f474bbSAkihiko Odaki net_rx_pkt_get_protocols(pkt, &hasip4, &hasip6, &l4hdr_proto); 187265f474bbSAkihiko Odaki net_hash_type = virtio_net_get_hash_type(hasip4, hasip6, l4hdr_proto, 18734474e37aSYuri Benditovich n->rss_data.hash_types); 18744474e37aSYuri Benditovich if (net_hash_type > NetPktRssIpV6UdpEx) { 1875e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1876a4c960eeSAkihiko Odaki hdr->hash_value = VIRTIO_NET_HASH_REPORT_NONE; 1877a4c960eeSAkihiko Odaki hdr->hash_report = 0; 1878e22f0603SYuri Benditovich } 1879e22f0603SYuri Benditovich return n->rss_data.redirect ? n->rss_data.default_queue : -1; 18804474e37aSYuri Benditovich } 18814474e37aSYuri Benditovich 18824474e37aSYuri Benditovich hash = net_rx_pkt_calc_rss_hash(pkt, net_hash_type, n->rss_data.key); 1883e22f0603SYuri Benditovich 1884e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1885a4c960eeSAkihiko Odaki hdr->hash_value = hash; 1886a4c960eeSAkihiko Odaki hdr->hash_report = reports[net_hash_type]; 1887e22f0603SYuri Benditovich } 1888e22f0603SYuri Benditovich 1889e22f0603SYuri Benditovich if (n->rss_data.redirect) { 18904474e37aSYuri Benditovich new_index = hash & (n->rss_data.indirections_len - 1); 18914474e37aSYuri Benditovich new_index = n->rss_data.indirections_table[new_index]; 18924474e37aSYuri Benditovich } 1893e22f0603SYuri Benditovich 1894e22f0603SYuri Benditovich return (index == new_index) ? -1 : new_index; 18954474e37aSYuri Benditovich } 18964474e37aSYuri Benditovich 18974474e37aSYuri Benditovich static ssize_t virtio_net_receive_rcu(NetClientState *nc, const uint8_t *buf, 18984474e37aSYuri Benditovich size_t size, bool no_rss) 18994474e37aSYuri Benditovich { 19004474e37aSYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 19016e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 190217a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 1903bedd7e93SJason Wang VirtQueueElement *elems[VIRTQUEUE_MAX_SIZE]; 1904bedd7e93SJason Wang size_t lens[VIRTQUEUE_MAX_SIZE]; 19056e790746SPaolo Bonzini struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE]; 1906a4c960eeSAkihiko Odaki struct virtio_net_hdr_v1_hash extra_hdr; 19076e790746SPaolo Bonzini unsigned mhdr_cnt = 0; 1908bedd7e93SJason Wang size_t offset, i, guest_offset, j; 1909bedd7e93SJason Wang ssize_t err; 19106e790746SPaolo Bonzini 19116e790746SPaolo Bonzini if (!virtio_net_can_receive(nc)) { 19126e790746SPaolo Bonzini return -1; 19136e790746SPaolo Bonzini } 19146e790746SPaolo Bonzini 19150145c393SAndrew Melnychenko if (!no_rss && n->rss_data.enabled && n->rss_data.enabled_software_rss) { 1916a4c960eeSAkihiko Odaki int index = virtio_net_process_rss(nc, buf, size, &extra_hdr); 19174474e37aSYuri Benditovich if (index >= 0) { 1918f1595cebSAkihiko Odaki NetClientState *nc2 = 1919f1595cebSAkihiko Odaki qemu_get_subqueue(n->nic, index % n->curr_queue_pairs); 19204474e37aSYuri Benditovich return virtio_net_receive_rcu(nc2, buf, size, true); 19214474e37aSYuri Benditovich } 19224474e37aSYuri Benditovich } 19234474e37aSYuri Benditovich 19246e790746SPaolo Bonzini /* hdr_len refers to the header we supply to the guest */ 19256e790746SPaolo Bonzini if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) { 19266e790746SPaolo Bonzini return 0; 19276e790746SPaolo Bonzini } 19286e790746SPaolo Bonzini 19296e790746SPaolo Bonzini if (!receive_filter(n, buf, size)) 19306e790746SPaolo Bonzini return size; 19316e790746SPaolo Bonzini 19326e790746SPaolo Bonzini offset = i = 0; 19336e790746SPaolo Bonzini 19346e790746SPaolo Bonzini while (offset < size) { 193551b19ebeSPaolo Bonzini VirtQueueElement *elem; 19366e790746SPaolo Bonzini int len, total; 193751b19ebeSPaolo Bonzini const struct iovec *sg; 19386e790746SPaolo Bonzini 19396e790746SPaolo Bonzini total = 0; 19406e790746SPaolo Bonzini 1941bedd7e93SJason Wang if (i == VIRTQUEUE_MAX_SIZE) { 1942bedd7e93SJason Wang virtio_error(vdev, "virtio-net unexpected long buffer chain"); 1943bedd7e93SJason Wang err = size; 1944bedd7e93SJason Wang goto err; 1945bedd7e93SJason Wang } 1946bedd7e93SJason Wang 194751b19ebeSPaolo Bonzini elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement)); 194851b19ebeSPaolo Bonzini if (!elem) { 1949ba10b9c0SGreg Kurz if (i) { 1950ba10b9c0SGreg Kurz virtio_error(vdev, "virtio-net unexpected empty queue: " 19516e790746SPaolo Bonzini "i %zd mergeable %d offset %zd, size %zd, " 1952019a3edbSGerd Hoffmann "guest hdr len %zd, host hdr len %zd " 1953019a3edbSGerd Hoffmann "guest features 0x%" PRIx64, 19546e790746SPaolo Bonzini i, n->mergeable_rx_bufs, offset, size, 1955019a3edbSGerd Hoffmann n->guest_hdr_len, n->host_hdr_len, 1956019a3edbSGerd Hoffmann vdev->guest_features); 1957ba10b9c0SGreg Kurz } 1958bedd7e93SJason Wang err = -1; 1959bedd7e93SJason Wang goto err; 19606e790746SPaolo Bonzini } 19616e790746SPaolo Bonzini 196251b19ebeSPaolo Bonzini if (elem->in_num < 1) { 1963ba10b9c0SGreg Kurz virtio_error(vdev, 1964ba10b9c0SGreg Kurz "virtio-net receive queue contains no in buffers"); 1965ba10b9c0SGreg Kurz virtqueue_detach_element(q->rx_vq, elem, 0); 1966ba10b9c0SGreg Kurz g_free(elem); 1967bedd7e93SJason Wang err = -1; 1968bedd7e93SJason Wang goto err; 19696e790746SPaolo Bonzini } 19706e790746SPaolo Bonzini 197151b19ebeSPaolo Bonzini sg = elem->in_sg; 19726e790746SPaolo Bonzini if (i == 0) { 19736e790746SPaolo Bonzini assert(offset == 0); 19746e790746SPaolo Bonzini if (n->mergeable_rx_bufs) { 19756e790746SPaolo Bonzini mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg), 197651b19ebeSPaolo Bonzini sg, elem->in_num, 1977a4c960eeSAkihiko Odaki offsetof(typeof(extra_hdr), hdr.num_buffers), 1978a4c960eeSAkihiko Odaki sizeof(extra_hdr.hdr.num_buffers)); 19796e790746SPaolo Bonzini } 19806e790746SPaolo Bonzini 198151b19ebeSPaolo Bonzini receive_header(n, sg, elem->in_num, buf, size); 1982e22f0603SYuri Benditovich if (n->rss_data.populate_hash) { 1983a4c960eeSAkihiko Odaki offset = offsetof(typeof(extra_hdr), hash_value); 1984e22f0603SYuri Benditovich iov_from_buf(sg, elem->in_num, offset, 1985a4c960eeSAkihiko Odaki (char *)&extra_hdr + offset, 1986a4c960eeSAkihiko Odaki sizeof(extra_hdr.hash_value) + 1987a4c960eeSAkihiko Odaki sizeof(extra_hdr.hash_report)); 1988e22f0603SYuri Benditovich } 19896e790746SPaolo Bonzini offset = n->host_hdr_len; 19906e790746SPaolo Bonzini total += n->guest_hdr_len; 19916e790746SPaolo Bonzini guest_offset = n->guest_hdr_len; 19926e790746SPaolo Bonzini } else { 19936e790746SPaolo Bonzini guest_offset = 0; 19946e790746SPaolo Bonzini } 19956e790746SPaolo Bonzini 19966e790746SPaolo Bonzini /* copy in packet. ugh */ 199751b19ebeSPaolo Bonzini len = iov_from_buf(sg, elem->in_num, guest_offset, 19986e790746SPaolo Bonzini buf + offset, size - offset); 19996e790746SPaolo Bonzini total += len; 20006e790746SPaolo Bonzini offset += len; 20016e790746SPaolo Bonzini /* If buffers can't be merged, at this point we 20026e790746SPaolo Bonzini * must have consumed the complete packet. 20036e790746SPaolo Bonzini * Otherwise, drop it. */ 20046e790746SPaolo Bonzini if (!n->mergeable_rx_bufs && offset < size) { 200527e57efeSLadi Prosek virtqueue_unpop(q->rx_vq, elem, total); 200651b19ebeSPaolo Bonzini g_free(elem); 2007bedd7e93SJason Wang err = size; 2008bedd7e93SJason Wang goto err; 20096e790746SPaolo Bonzini } 20106e790746SPaolo Bonzini 2011bedd7e93SJason Wang elems[i] = elem; 2012bedd7e93SJason Wang lens[i] = total; 2013bedd7e93SJason Wang i++; 20146e790746SPaolo Bonzini } 20156e790746SPaolo Bonzini 20166e790746SPaolo Bonzini if (mhdr_cnt) { 2017a4c960eeSAkihiko Odaki virtio_stw_p(vdev, &extra_hdr.hdr.num_buffers, i); 20186e790746SPaolo Bonzini iov_from_buf(mhdr_sg, mhdr_cnt, 20196e790746SPaolo Bonzini 0, 2020a4c960eeSAkihiko Odaki &extra_hdr.hdr.num_buffers, 2021a4c960eeSAkihiko Odaki sizeof extra_hdr.hdr.num_buffers); 20226e790746SPaolo Bonzini } 20236e790746SPaolo Bonzini 2024bedd7e93SJason Wang for (j = 0; j < i; j++) { 2025bedd7e93SJason Wang /* signal other side */ 2026bedd7e93SJason Wang virtqueue_fill(q->rx_vq, elems[j], lens[j], j); 2027bedd7e93SJason Wang g_free(elems[j]); 2028bedd7e93SJason Wang } 2029bedd7e93SJason Wang 20306e790746SPaolo Bonzini virtqueue_flush(q->rx_vq, i); 203117a0ca55SKONRAD Frederic virtio_notify(vdev, q->rx_vq); 20326e790746SPaolo Bonzini 20336e790746SPaolo Bonzini return size; 2034bedd7e93SJason Wang 2035bedd7e93SJason Wang err: 2036bedd7e93SJason Wang for (j = 0; j < i; j++) { 2037abe300d9SJason Wang virtqueue_detach_element(q->rx_vq, elems[j], lens[j]); 2038bedd7e93SJason Wang g_free(elems[j]); 2039bedd7e93SJason Wang } 2040bedd7e93SJason Wang 2041bedd7e93SJason Wang return err; 20426e790746SPaolo Bonzini } 20436e790746SPaolo Bonzini 20442974e916SYuri Benditovich static ssize_t virtio_net_do_receive(NetClientState *nc, const uint8_t *buf, 204597cd965cSPaolo Bonzini size_t size) 204697cd965cSPaolo Bonzini { 2047068ddfa9SDr. David Alan Gilbert RCU_READ_LOCK_GUARD(); 204897cd965cSPaolo Bonzini 20494474e37aSYuri Benditovich return virtio_net_receive_rcu(nc, buf, size, false); 205097cd965cSPaolo Bonzini } 205197cd965cSPaolo Bonzini 20522974e916SYuri Benditovich static void virtio_net_rsc_extract_unit4(VirtioNetRscChain *chain, 20532974e916SYuri Benditovich const uint8_t *buf, 20542974e916SYuri Benditovich VirtioNetRscUnit *unit) 20552974e916SYuri Benditovich { 20562974e916SYuri Benditovich uint16_t ip_hdrlen; 20572974e916SYuri Benditovich struct ip_header *ip; 20582974e916SYuri Benditovich 20592974e916SYuri Benditovich ip = (struct ip_header *)(buf + chain->n->guest_hdr_len 20602974e916SYuri Benditovich + sizeof(struct eth_header)); 20612974e916SYuri Benditovich unit->ip = (void *)ip; 20622974e916SYuri Benditovich ip_hdrlen = (ip->ip_ver_len & 0xF) << 2; 20632974e916SYuri Benditovich unit->ip_plen = &ip->ip_len; 20642974e916SYuri Benditovich unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) + ip_hdrlen); 20652974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 20662974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - ip_hdrlen - unit->tcp_hdrlen; 20672974e916SYuri Benditovich } 20682974e916SYuri Benditovich 20692974e916SYuri Benditovich static void virtio_net_rsc_extract_unit6(VirtioNetRscChain *chain, 20702974e916SYuri Benditovich const uint8_t *buf, 20712974e916SYuri Benditovich VirtioNetRscUnit *unit) 20722974e916SYuri Benditovich { 20732974e916SYuri Benditovich struct ip6_header *ip6; 20742974e916SYuri Benditovich 20752974e916SYuri Benditovich ip6 = (struct ip6_header *)(buf + chain->n->guest_hdr_len 20762974e916SYuri Benditovich + sizeof(struct eth_header)); 20772974e916SYuri Benditovich unit->ip = ip6; 20782974e916SYuri Benditovich unit->ip_plen = &(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 207978ee6bd0SPhilippe Mathieu-Daudé unit->tcp = (struct tcp_header *)(((uint8_t *)unit->ip) 20802974e916SYuri Benditovich + sizeof(struct ip6_header)); 20812974e916SYuri Benditovich unit->tcp_hdrlen = (htons(unit->tcp->th_offset_flags) & 0xF000) >> 10; 20822974e916SYuri Benditovich 20832431f4f1SMichael Tokarev /* There is a difference between payload length in ipv4 and v6, 20842974e916SYuri Benditovich ip header is excluded in ipv6 */ 20852974e916SYuri Benditovich unit->payload = htons(*unit->ip_plen) - unit->tcp_hdrlen; 20862974e916SYuri Benditovich } 20872974e916SYuri Benditovich 20882974e916SYuri Benditovich static size_t virtio_net_rsc_drain_seg(VirtioNetRscChain *chain, 20892974e916SYuri Benditovich VirtioNetRscSeg *seg) 20902974e916SYuri Benditovich { 20912974e916SYuri Benditovich int ret; 2092dd3d85e8SYuri Benditovich struct virtio_net_hdr_v1 *h; 20932974e916SYuri Benditovich 2094dd3d85e8SYuri Benditovich h = (struct virtio_net_hdr_v1 *)seg->buf; 20952974e916SYuri Benditovich h->flags = 0; 20962974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_NONE; 20972974e916SYuri Benditovich 20982974e916SYuri Benditovich if (seg->is_coalesced) { 2099dd3d85e8SYuri Benditovich h->rsc.segments = seg->packets; 2100dd3d85e8SYuri Benditovich h->rsc.dup_acks = seg->dup_ack; 21012974e916SYuri Benditovich h->flags = VIRTIO_NET_HDR_F_RSC_INFO; 21022974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 21032974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 21042974e916SYuri Benditovich } else { 21052974e916SYuri Benditovich h->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 21062974e916SYuri Benditovich } 21072974e916SYuri Benditovich } 21082974e916SYuri Benditovich 21092974e916SYuri Benditovich ret = virtio_net_do_receive(seg->nc, seg->buf, seg->size); 21102974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 21112974e916SYuri Benditovich g_free(seg->buf); 21122974e916SYuri Benditovich g_free(seg); 21132974e916SYuri Benditovich 21142974e916SYuri Benditovich return ret; 21152974e916SYuri Benditovich } 21162974e916SYuri Benditovich 21172974e916SYuri Benditovich static void virtio_net_rsc_purge(void *opq) 21182974e916SYuri Benditovich { 21192974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn; 21202974e916SYuri Benditovich VirtioNetRscChain *chain = (VirtioNetRscChain *)opq; 21212974e916SYuri Benditovich 21222974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn) { 21232974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 21242974e916SYuri Benditovich chain->stat.purge_failed++; 21252974e916SYuri Benditovich continue; 21262974e916SYuri Benditovich } 21272974e916SYuri Benditovich } 21282974e916SYuri Benditovich 21292974e916SYuri Benditovich chain->stat.timer++; 21302974e916SYuri Benditovich if (!QTAILQ_EMPTY(&chain->buffers)) { 21312974e916SYuri Benditovich timer_mod(chain->drain_timer, 213244bc14faSNicholas Piggin qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + chain->n->rsc_timeout); 21332974e916SYuri Benditovich } 21342974e916SYuri Benditovich } 21352974e916SYuri Benditovich 21362974e916SYuri Benditovich static void virtio_net_rsc_cleanup(VirtIONet *n) 21372974e916SYuri Benditovich { 21382974e916SYuri Benditovich VirtioNetRscChain *chain, *rn_chain; 21392974e916SYuri Benditovich VirtioNetRscSeg *seg, *rn_seg; 21402974e916SYuri Benditovich 21412974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(chain, &n->rsc_chains, next, rn_chain) { 21422974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, rn_seg) { 21432974e916SYuri Benditovich QTAILQ_REMOVE(&chain->buffers, seg, next); 21442974e916SYuri Benditovich g_free(seg->buf); 21452974e916SYuri Benditovich g_free(seg); 21462974e916SYuri Benditovich } 21472974e916SYuri Benditovich 21482974e916SYuri Benditovich timer_free(chain->drain_timer); 21492974e916SYuri Benditovich QTAILQ_REMOVE(&n->rsc_chains, chain, next); 21502974e916SYuri Benditovich g_free(chain); 21512974e916SYuri Benditovich } 21522974e916SYuri Benditovich } 21532974e916SYuri Benditovich 21542974e916SYuri Benditovich static void virtio_net_rsc_cache_buf(VirtioNetRscChain *chain, 21552974e916SYuri Benditovich NetClientState *nc, 21562974e916SYuri Benditovich const uint8_t *buf, size_t size) 21572974e916SYuri Benditovich { 21582974e916SYuri Benditovich uint16_t hdr_len; 21592974e916SYuri Benditovich VirtioNetRscSeg *seg; 21602974e916SYuri Benditovich 21612974e916SYuri Benditovich hdr_len = chain->n->guest_hdr_len; 2162b21e2380SMarkus Armbruster seg = g_new(VirtioNetRscSeg, 1); 21632974e916SYuri Benditovich seg->buf = g_malloc(hdr_len + sizeof(struct eth_header) 21642974e916SYuri Benditovich + sizeof(struct ip6_header) + VIRTIO_NET_MAX_TCP_PAYLOAD); 21652974e916SYuri Benditovich memcpy(seg->buf, buf, size); 21662974e916SYuri Benditovich seg->size = size; 21672974e916SYuri Benditovich seg->packets = 1; 21682974e916SYuri Benditovich seg->dup_ack = 0; 21692974e916SYuri Benditovich seg->is_coalesced = 0; 21702974e916SYuri Benditovich seg->nc = nc; 21712974e916SYuri Benditovich 21722974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&chain->buffers, seg, next); 21732974e916SYuri Benditovich chain->stat.cache++; 21742974e916SYuri Benditovich 21752974e916SYuri Benditovich switch (chain->proto) { 21762974e916SYuri Benditovich case ETH_P_IP: 21772974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, seg->buf, &seg->unit); 21782974e916SYuri Benditovich break; 21792974e916SYuri Benditovich case ETH_P_IPV6: 21802974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, seg->buf, &seg->unit); 21812974e916SYuri Benditovich break; 21822974e916SYuri Benditovich default: 21832974e916SYuri Benditovich g_assert_not_reached(); 21842974e916SYuri Benditovich } 21852974e916SYuri Benditovich } 21862974e916SYuri Benditovich 21872974e916SYuri Benditovich static int32_t virtio_net_rsc_handle_ack(VirtioNetRscChain *chain, 21882974e916SYuri Benditovich VirtioNetRscSeg *seg, 21892974e916SYuri Benditovich const uint8_t *buf, 21902974e916SYuri Benditovich struct tcp_header *n_tcp, 21912974e916SYuri Benditovich struct tcp_header *o_tcp) 21922974e916SYuri Benditovich { 21932974e916SYuri Benditovich uint32_t nack, oack; 21942974e916SYuri Benditovich uint16_t nwin, owin; 21952974e916SYuri Benditovich 21962974e916SYuri Benditovich nack = htonl(n_tcp->th_ack); 21972974e916SYuri Benditovich nwin = htons(n_tcp->th_win); 21982974e916SYuri Benditovich oack = htonl(o_tcp->th_ack); 21992974e916SYuri Benditovich owin = htons(o_tcp->th_win); 22002974e916SYuri Benditovich 22012974e916SYuri Benditovich if ((nack - oack) >= VIRTIO_NET_MAX_TCP_PAYLOAD) { 22022974e916SYuri Benditovich chain->stat.ack_out_of_win++; 22032974e916SYuri Benditovich return RSC_FINAL; 22042974e916SYuri Benditovich } else if (nack == oack) { 22052974e916SYuri Benditovich /* duplicated ack or window probe */ 22062974e916SYuri Benditovich if (nwin == owin) { 22072974e916SYuri Benditovich /* duplicated ack, add dup ack count due to whql test up to 1 */ 22082974e916SYuri Benditovich chain->stat.dup_ack++; 22092974e916SYuri Benditovich return RSC_FINAL; 22102974e916SYuri Benditovich } else { 22112974e916SYuri Benditovich /* Coalesce window update */ 22122974e916SYuri Benditovich o_tcp->th_win = n_tcp->th_win; 22132974e916SYuri Benditovich chain->stat.win_update++; 22142974e916SYuri Benditovich return RSC_COALESCE; 22152974e916SYuri Benditovich } 22162974e916SYuri Benditovich } else { 22172974e916SYuri Benditovich /* pure ack, go to 'C', finalize*/ 22182974e916SYuri Benditovich chain->stat.pure_ack++; 22192974e916SYuri Benditovich return RSC_FINAL; 22202974e916SYuri Benditovich } 22212974e916SYuri Benditovich } 22222974e916SYuri Benditovich 22232974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce_data(VirtioNetRscChain *chain, 22242974e916SYuri Benditovich VirtioNetRscSeg *seg, 22252974e916SYuri Benditovich const uint8_t *buf, 22262974e916SYuri Benditovich VirtioNetRscUnit *n_unit) 22272974e916SYuri Benditovich { 22282974e916SYuri Benditovich void *data; 22292974e916SYuri Benditovich uint16_t o_ip_len; 22302974e916SYuri Benditovich uint32_t nseq, oseq; 22312974e916SYuri Benditovich VirtioNetRscUnit *o_unit; 22322974e916SYuri Benditovich 22332974e916SYuri Benditovich o_unit = &seg->unit; 22342974e916SYuri Benditovich o_ip_len = htons(*o_unit->ip_plen); 22352974e916SYuri Benditovich nseq = htonl(n_unit->tcp->th_seq); 22362974e916SYuri Benditovich oseq = htonl(o_unit->tcp->th_seq); 22372974e916SYuri Benditovich 22382974e916SYuri Benditovich /* out of order or retransmitted. */ 22392974e916SYuri Benditovich if ((nseq - oseq) > VIRTIO_NET_MAX_TCP_PAYLOAD) { 22402974e916SYuri Benditovich chain->stat.data_out_of_win++; 22412974e916SYuri Benditovich return RSC_FINAL; 22422974e916SYuri Benditovich } 22432974e916SYuri Benditovich 22442974e916SYuri Benditovich data = ((uint8_t *)n_unit->tcp) + n_unit->tcp_hdrlen; 22452974e916SYuri Benditovich if (nseq == oseq) { 22462974e916SYuri Benditovich if ((o_unit->payload == 0) && n_unit->payload) { 22472974e916SYuri Benditovich /* From no payload to payload, normal case, not a dup ack or etc */ 22482974e916SYuri Benditovich chain->stat.data_after_pure_ack++; 22492974e916SYuri Benditovich goto coalesce; 22502974e916SYuri Benditovich } else { 22512974e916SYuri Benditovich return virtio_net_rsc_handle_ack(chain, seg, buf, 22522974e916SYuri Benditovich n_unit->tcp, o_unit->tcp); 22532974e916SYuri Benditovich } 22542974e916SYuri Benditovich } else if ((nseq - oseq) != o_unit->payload) { 22552974e916SYuri Benditovich /* Not a consistent packet, out of order */ 22562974e916SYuri Benditovich chain->stat.data_out_of_order++; 22572974e916SYuri Benditovich return RSC_FINAL; 22582974e916SYuri Benditovich } else { 22592974e916SYuri Benditovich coalesce: 22602974e916SYuri Benditovich if ((o_ip_len + n_unit->payload) > chain->max_payload) { 22612974e916SYuri Benditovich chain->stat.over_size++; 22622974e916SYuri Benditovich return RSC_FINAL; 22632974e916SYuri Benditovich } 22642974e916SYuri Benditovich 22652974e916SYuri Benditovich /* Here comes the right data, the payload length in v4/v6 is different, 22662974e916SYuri Benditovich so use the field value to update and record the new data len */ 22672974e916SYuri Benditovich o_unit->payload += n_unit->payload; /* update new data len */ 22682974e916SYuri Benditovich 22692974e916SYuri Benditovich /* update field in ip header */ 22702974e916SYuri Benditovich *o_unit->ip_plen = htons(o_ip_len + n_unit->payload); 22712974e916SYuri Benditovich 22722974e916SYuri Benditovich /* Bring 'PUSH' big, the whql test guide says 'PUSH' can be coalesced 22732974e916SYuri Benditovich for windows guest, while this may change the behavior for linux 22742974e916SYuri Benditovich guest (only if it uses RSC feature). */ 22752974e916SYuri Benditovich o_unit->tcp->th_offset_flags = n_unit->tcp->th_offset_flags; 22762974e916SYuri Benditovich 22772974e916SYuri Benditovich o_unit->tcp->th_ack = n_unit->tcp->th_ack; 22782974e916SYuri Benditovich o_unit->tcp->th_win = n_unit->tcp->th_win; 22792974e916SYuri Benditovich 22802974e916SYuri Benditovich memmove(seg->buf + seg->size, data, n_unit->payload); 22812974e916SYuri Benditovich seg->size += n_unit->payload; 22822974e916SYuri Benditovich seg->packets++; 22832974e916SYuri Benditovich chain->stat.coalesced++; 22842974e916SYuri Benditovich return RSC_COALESCE; 22852974e916SYuri Benditovich } 22862974e916SYuri Benditovich } 22872974e916SYuri Benditovich 22882974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce4(VirtioNetRscChain *chain, 22892974e916SYuri Benditovich VirtioNetRscSeg *seg, 22902974e916SYuri Benditovich const uint8_t *buf, size_t size, 22912974e916SYuri Benditovich VirtioNetRscUnit *unit) 22922974e916SYuri Benditovich { 22932974e916SYuri Benditovich struct ip_header *ip1, *ip2; 22942974e916SYuri Benditovich 22952974e916SYuri Benditovich ip1 = (struct ip_header *)(unit->ip); 22962974e916SYuri Benditovich ip2 = (struct ip_header *)(seg->unit.ip); 22972974e916SYuri Benditovich if ((ip1->ip_src ^ ip2->ip_src) || (ip1->ip_dst ^ ip2->ip_dst) 22982974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 22992974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 23002974e916SYuri Benditovich chain->stat.no_match++; 23012974e916SYuri Benditovich return RSC_NO_MATCH; 23022974e916SYuri Benditovich } 23032974e916SYuri Benditovich 23042974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 23052974e916SYuri Benditovich } 23062974e916SYuri Benditovich 23072974e916SYuri Benditovich static int32_t virtio_net_rsc_coalesce6(VirtioNetRscChain *chain, 23082974e916SYuri Benditovich VirtioNetRscSeg *seg, 23092974e916SYuri Benditovich const uint8_t *buf, size_t size, 23102974e916SYuri Benditovich VirtioNetRscUnit *unit) 23112974e916SYuri Benditovich { 23122974e916SYuri Benditovich struct ip6_header *ip1, *ip2; 23132974e916SYuri Benditovich 23142974e916SYuri Benditovich ip1 = (struct ip6_header *)(unit->ip); 23152974e916SYuri Benditovich ip2 = (struct ip6_header *)(seg->unit.ip); 23162974e916SYuri Benditovich if (memcmp(&ip1->ip6_src, &ip2->ip6_src, sizeof(struct in6_address)) 23172974e916SYuri Benditovich || memcmp(&ip1->ip6_dst, &ip2->ip6_dst, sizeof(struct in6_address)) 23182974e916SYuri Benditovich || (unit->tcp->th_sport ^ seg->unit.tcp->th_sport) 23192974e916SYuri Benditovich || (unit->tcp->th_dport ^ seg->unit.tcp->th_dport)) { 23202974e916SYuri Benditovich chain->stat.no_match++; 23212974e916SYuri Benditovich return RSC_NO_MATCH; 23222974e916SYuri Benditovich } 23232974e916SYuri Benditovich 23242974e916SYuri Benditovich return virtio_net_rsc_coalesce_data(chain, seg, buf, unit); 23252974e916SYuri Benditovich } 23262974e916SYuri Benditovich 23272974e916SYuri Benditovich /* Packets with 'SYN' should bypass, other flag should be sent after drain 23282974e916SYuri Benditovich * to prevent out of order */ 23292974e916SYuri Benditovich static int virtio_net_rsc_tcp_ctrl_check(VirtioNetRscChain *chain, 23302974e916SYuri Benditovich struct tcp_header *tcp) 23312974e916SYuri Benditovich { 23322974e916SYuri Benditovich uint16_t tcp_hdr; 23332974e916SYuri Benditovich uint16_t tcp_flag; 23342974e916SYuri Benditovich 23352974e916SYuri Benditovich tcp_flag = htons(tcp->th_offset_flags); 23362974e916SYuri Benditovich tcp_hdr = (tcp_flag & VIRTIO_NET_TCP_HDR_LENGTH) >> 10; 23372974e916SYuri Benditovich tcp_flag &= VIRTIO_NET_TCP_FLAG; 23382974e916SYuri Benditovich if (tcp_flag & TH_SYN) { 23392974e916SYuri Benditovich chain->stat.tcp_syn++; 23402974e916SYuri Benditovich return RSC_BYPASS; 23412974e916SYuri Benditovich } 23422974e916SYuri Benditovich 23432974e916SYuri Benditovich if (tcp_flag & (TH_FIN | TH_URG | TH_RST | TH_ECE | TH_CWR)) { 23442974e916SYuri Benditovich chain->stat.tcp_ctrl_drain++; 23452974e916SYuri Benditovich return RSC_FINAL; 23462974e916SYuri Benditovich } 23472974e916SYuri Benditovich 23482974e916SYuri Benditovich if (tcp_hdr > sizeof(struct tcp_header)) { 23492974e916SYuri Benditovich chain->stat.tcp_all_opt++; 23502974e916SYuri Benditovich return RSC_FINAL; 23512974e916SYuri Benditovich } 23522974e916SYuri Benditovich 23532974e916SYuri Benditovich return RSC_CANDIDATE; 23542974e916SYuri Benditovich } 23552974e916SYuri Benditovich 23562974e916SYuri Benditovich static size_t virtio_net_rsc_do_coalesce(VirtioNetRscChain *chain, 23572974e916SYuri Benditovich NetClientState *nc, 23582974e916SYuri Benditovich const uint8_t *buf, size_t size, 23592974e916SYuri Benditovich VirtioNetRscUnit *unit) 23602974e916SYuri Benditovich { 23612974e916SYuri Benditovich int ret; 23622974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 23632974e916SYuri Benditovich 23642974e916SYuri Benditovich if (QTAILQ_EMPTY(&chain->buffers)) { 23652974e916SYuri Benditovich chain->stat.empty_cache++; 23662974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 23672974e916SYuri Benditovich timer_mod(chain->drain_timer, 236844bc14faSNicholas Piggin qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + chain->n->rsc_timeout); 23692974e916SYuri Benditovich return size; 23702974e916SYuri Benditovich } 23712974e916SYuri Benditovich 23722974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 23732974e916SYuri Benditovich if (chain->proto == ETH_P_IP) { 23742974e916SYuri Benditovich ret = virtio_net_rsc_coalesce4(chain, seg, buf, size, unit); 23752974e916SYuri Benditovich } else { 23762974e916SYuri Benditovich ret = virtio_net_rsc_coalesce6(chain, seg, buf, size, unit); 23772974e916SYuri Benditovich } 23782974e916SYuri Benditovich 23792974e916SYuri Benditovich if (ret == RSC_FINAL) { 23802974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 23812974e916SYuri Benditovich /* Send failed */ 23822974e916SYuri Benditovich chain->stat.final_failed++; 23832974e916SYuri Benditovich return 0; 23842974e916SYuri Benditovich } 23852974e916SYuri Benditovich 23862974e916SYuri Benditovich /* Send current packet */ 23872974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 23882974e916SYuri Benditovich } else if (ret == RSC_NO_MATCH) { 23892974e916SYuri Benditovich continue; 23902974e916SYuri Benditovich } else { 23912974e916SYuri Benditovich /* Coalesced, mark coalesced flag to tell calc cksum for ipv4 */ 23922974e916SYuri Benditovich seg->is_coalesced = 1; 23932974e916SYuri Benditovich return size; 23942974e916SYuri Benditovich } 23952974e916SYuri Benditovich } 23962974e916SYuri Benditovich 23972974e916SYuri Benditovich chain->stat.no_match_cache++; 23982974e916SYuri Benditovich virtio_net_rsc_cache_buf(chain, nc, buf, size); 23992974e916SYuri Benditovich return size; 24002974e916SYuri Benditovich } 24012974e916SYuri Benditovich 24022974e916SYuri Benditovich /* Drain a connection data, this is to avoid out of order segments */ 24032974e916SYuri Benditovich static size_t virtio_net_rsc_drain_flow(VirtioNetRscChain *chain, 24042974e916SYuri Benditovich NetClientState *nc, 24052974e916SYuri Benditovich const uint8_t *buf, size_t size, 24062974e916SYuri Benditovich uint16_t ip_start, uint16_t ip_size, 24072974e916SYuri Benditovich uint16_t tcp_port) 24082974e916SYuri Benditovich { 24092974e916SYuri Benditovich VirtioNetRscSeg *seg, *nseg; 24102974e916SYuri Benditovich uint32_t ppair1, ppair2; 24112974e916SYuri Benditovich 24122974e916SYuri Benditovich ppair1 = *(uint32_t *)(buf + tcp_port); 24132974e916SYuri Benditovich QTAILQ_FOREACH_SAFE(seg, &chain->buffers, next, nseg) { 24142974e916SYuri Benditovich ppair2 = *(uint32_t *)(seg->buf + tcp_port); 24152974e916SYuri Benditovich if (memcmp(buf + ip_start, seg->buf + ip_start, ip_size) 24162974e916SYuri Benditovich || (ppair1 != ppair2)) { 24172974e916SYuri Benditovich continue; 24182974e916SYuri Benditovich } 24192974e916SYuri Benditovich if (virtio_net_rsc_drain_seg(chain, seg) == 0) { 24202974e916SYuri Benditovich chain->stat.drain_failed++; 24212974e916SYuri Benditovich } 24222974e916SYuri Benditovich 24232974e916SYuri Benditovich break; 24242974e916SYuri Benditovich } 24252974e916SYuri Benditovich 24262974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24272974e916SYuri Benditovich } 24282974e916SYuri Benditovich 24292974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check4(VirtioNetRscChain *chain, 24302974e916SYuri Benditovich struct ip_header *ip, 24312974e916SYuri Benditovich const uint8_t *buf, size_t size) 24322974e916SYuri Benditovich { 24332974e916SYuri Benditovich uint16_t ip_len; 24342974e916SYuri Benditovich 24352974e916SYuri Benditovich /* Not an ipv4 packet */ 24362974e916SYuri Benditovich if (((ip->ip_ver_len & 0xF0) >> 4) != IP_HEADER_VERSION_4) { 24372974e916SYuri Benditovich chain->stat.ip_option++; 24382974e916SYuri Benditovich return RSC_BYPASS; 24392974e916SYuri Benditovich } 24402974e916SYuri Benditovich 24412974e916SYuri Benditovich /* Don't handle packets with ip option */ 24422974e916SYuri Benditovich if ((ip->ip_ver_len & 0xF) != VIRTIO_NET_IP4_HEADER_LENGTH) { 24432974e916SYuri Benditovich chain->stat.ip_option++; 24442974e916SYuri Benditovich return RSC_BYPASS; 24452974e916SYuri Benditovich } 24462974e916SYuri Benditovich 24472974e916SYuri Benditovich if (ip->ip_p != IPPROTO_TCP) { 24482974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 24492974e916SYuri Benditovich return RSC_BYPASS; 24502974e916SYuri Benditovich } 24512974e916SYuri Benditovich 24522974e916SYuri Benditovich /* Don't handle packets with ip fragment */ 24532974e916SYuri Benditovich if (!(htons(ip->ip_off) & IP_DF)) { 24542974e916SYuri Benditovich chain->stat.ip_frag++; 24552974e916SYuri Benditovich return RSC_BYPASS; 24562974e916SYuri Benditovich } 24572974e916SYuri Benditovich 24582974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 24592974e916SYuri Benditovich if (IPTOS_ECN(ip->ip_tos)) { 24602974e916SYuri Benditovich chain->stat.ip_ecn++; 24612974e916SYuri Benditovich return RSC_BYPASS; 24622974e916SYuri Benditovich } 24632974e916SYuri Benditovich 24642974e916SYuri Benditovich ip_len = htons(ip->ip_len); 24652974e916SYuri Benditovich if (ip_len < (sizeof(struct ip_header) + sizeof(struct tcp_header)) 24662974e916SYuri Benditovich || ip_len > (size - chain->n->guest_hdr_len - 24672974e916SYuri Benditovich sizeof(struct eth_header))) { 24682974e916SYuri Benditovich chain->stat.ip_hacked++; 24692974e916SYuri Benditovich return RSC_BYPASS; 24702974e916SYuri Benditovich } 24712974e916SYuri Benditovich 24722974e916SYuri Benditovich return RSC_CANDIDATE; 24732974e916SYuri Benditovich } 24742974e916SYuri Benditovich 24752974e916SYuri Benditovich static size_t virtio_net_rsc_receive4(VirtioNetRscChain *chain, 24762974e916SYuri Benditovich NetClientState *nc, 24772974e916SYuri Benditovich const uint8_t *buf, size_t size) 24782974e916SYuri Benditovich { 24792974e916SYuri Benditovich int32_t ret; 24802974e916SYuri Benditovich uint16_t hdr_len; 24812974e916SYuri Benditovich VirtioNetRscUnit unit; 24822974e916SYuri Benditovich 24832974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 24842974e916SYuri Benditovich 24852974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header) 24862974e916SYuri Benditovich + sizeof(struct tcp_header))) { 24872974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 24882974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24892974e916SYuri Benditovich } 24902974e916SYuri Benditovich 24912974e916SYuri Benditovich virtio_net_rsc_extract_unit4(chain, buf, &unit); 24922974e916SYuri Benditovich if (virtio_net_rsc_sanity_check4(chain, unit.ip, buf, size) 24932974e916SYuri Benditovich != RSC_CANDIDATE) { 24942974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 24952974e916SYuri Benditovich } 24962974e916SYuri Benditovich 24972974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 24982974e916SYuri Benditovich if (ret == RSC_BYPASS) { 24992974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25002974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 25012974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 25022974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 12), 25032974e916SYuri Benditovich VIRTIO_NET_IP4_ADDR_SIZE, 25042974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) + sizeof(struct ip_header)); 25052974e916SYuri Benditovich } 25062974e916SYuri Benditovich 25072974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 25082974e916SYuri Benditovich } 25092974e916SYuri Benditovich 25102974e916SYuri Benditovich static int32_t virtio_net_rsc_sanity_check6(VirtioNetRscChain *chain, 25112974e916SYuri Benditovich struct ip6_header *ip6, 25122974e916SYuri Benditovich const uint8_t *buf, size_t size) 25132974e916SYuri Benditovich { 25142974e916SYuri Benditovich uint16_t ip_len; 25152974e916SYuri Benditovich 25162974e916SYuri Benditovich if (((ip6->ip6_ctlun.ip6_un1.ip6_un1_flow & 0xF0) >> 4) 25172974e916SYuri Benditovich != IP_HEADER_VERSION_6) { 25182974e916SYuri Benditovich return RSC_BYPASS; 25192974e916SYuri Benditovich } 25202974e916SYuri Benditovich 25212974e916SYuri Benditovich /* Both option and protocol is checked in this */ 25222974e916SYuri Benditovich if (ip6->ip6_ctlun.ip6_un1.ip6_un1_nxt != IPPROTO_TCP) { 25232974e916SYuri Benditovich chain->stat.bypass_not_tcp++; 25242974e916SYuri Benditovich return RSC_BYPASS; 25252974e916SYuri Benditovich } 25262974e916SYuri Benditovich 25272974e916SYuri Benditovich ip_len = htons(ip6->ip6_ctlun.ip6_un1.ip6_un1_plen); 25282974e916SYuri Benditovich if (ip_len < sizeof(struct tcp_header) || 25292974e916SYuri Benditovich ip_len > (size - chain->n->guest_hdr_len - sizeof(struct eth_header) 25302974e916SYuri Benditovich - sizeof(struct ip6_header))) { 25312974e916SYuri Benditovich chain->stat.ip_hacked++; 25322974e916SYuri Benditovich return RSC_BYPASS; 25332974e916SYuri Benditovich } 25342974e916SYuri Benditovich 25352974e916SYuri Benditovich /* Don't handle packets with ecn flag */ 25362974e916SYuri Benditovich if (IP6_ECN(ip6->ip6_ctlun.ip6_un3.ip6_un3_ecn)) { 25372974e916SYuri Benditovich chain->stat.ip_ecn++; 25382974e916SYuri Benditovich return RSC_BYPASS; 25392974e916SYuri Benditovich } 25402974e916SYuri Benditovich 25412974e916SYuri Benditovich return RSC_CANDIDATE; 25422974e916SYuri Benditovich } 25432974e916SYuri Benditovich 25442974e916SYuri Benditovich static size_t virtio_net_rsc_receive6(void *opq, NetClientState *nc, 25452974e916SYuri Benditovich const uint8_t *buf, size_t size) 25462974e916SYuri Benditovich { 25472974e916SYuri Benditovich int32_t ret; 25482974e916SYuri Benditovich uint16_t hdr_len; 25492974e916SYuri Benditovich VirtioNetRscChain *chain; 25502974e916SYuri Benditovich VirtioNetRscUnit unit; 25512974e916SYuri Benditovich 25523d558330SMarkus Armbruster chain = opq; 25532974e916SYuri Benditovich hdr_len = ((VirtIONet *)(chain->n))->guest_hdr_len; 25542974e916SYuri Benditovich 25552974e916SYuri Benditovich if (size < (hdr_len + sizeof(struct eth_header) + sizeof(struct ip6_header) 25562974e916SYuri Benditovich + sizeof(tcp_header))) { 25572974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25582974e916SYuri Benditovich } 25592974e916SYuri Benditovich 25602974e916SYuri Benditovich virtio_net_rsc_extract_unit6(chain, buf, &unit); 25612974e916SYuri Benditovich if (RSC_CANDIDATE != virtio_net_rsc_sanity_check6(chain, 25622974e916SYuri Benditovich unit.ip, buf, size)) { 25632974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25642974e916SYuri Benditovich } 25652974e916SYuri Benditovich 25662974e916SYuri Benditovich ret = virtio_net_rsc_tcp_ctrl_check(chain, unit.tcp); 25672974e916SYuri Benditovich if (ret == RSC_BYPASS) { 25682974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 25692974e916SYuri Benditovich } else if (ret == RSC_FINAL) { 25702974e916SYuri Benditovich return virtio_net_rsc_drain_flow(chain, nc, buf, size, 25712974e916SYuri Benditovich ((hdr_len + sizeof(struct eth_header)) + 8), 25722974e916SYuri Benditovich VIRTIO_NET_IP6_ADDR_SIZE, 25732974e916SYuri Benditovich hdr_len + sizeof(struct eth_header) 25742974e916SYuri Benditovich + sizeof(struct ip6_header)); 25752974e916SYuri Benditovich } 25762974e916SYuri Benditovich 25772974e916SYuri Benditovich return virtio_net_rsc_do_coalesce(chain, nc, buf, size, &unit); 25782974e916SYuri Benditovich } 25792974e916SYuri Benditovich 25802974e916SYuri Benditovich static VirtioNetRscChain *virtio_net_rsc_lookup_chain(VirtIONet *n, 25812974e916SYuri Benditovich NetClientState *nc, 25822974e916SYuri Benditovich uint16_t proto) 25832974e916SYuri Benditovich { 25842974e916SYuri Benditovich VirtioNetRscChain *chain; 25852974e916SYuri Benditovich 25862974e916SYuri Benditovich if ((proto != (uint16_t)ETH_P_IP) && (proto != (uint16_t)ETH_P_IPV6)) { 25872974e916SYuri Benditovich return NULL; 25882974e916SYuri Benditovich } 25892974e916SYuri Benditovich 25902974e916SYuri Benditovich QTAILQ_FOREACH(chain, &n->rsc_chains, next) { 25912974e916SYuri Benditovich if (chain->proto == proto) { 25922974e916SYuri Benditovich return chain; 25932974e916SYuri Benditovich } 25942974e916SYuri Benditovich } 25952974e916SYuri Benditovich 25962974e916SYuri Benditovich chain = g_malloc(sizeof(*chain)); 25972974e916SYuri Benditovich chain->n = n; 25982974e916SYuri Benditovich chain->proto = proto; 25992974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP) { 26002974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP4_PAYLOAD; 26012974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV4; 26022974e916SYuri Benditovich } else { 26032974e916SYuri Benditovich chain->max_payload = VIRTIO_NET_MAX_IP6_PAYLOAD; 26042974e916SYuri Benditovich chain->gso_type = VIRTIO_NET_HDR_GSO_TCPV6; 26052974e916SYuri Benditovich } 260644bc14faSNicholas Piggin chain->drain_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, 26072974e916SYuri Benditovich virtio_net_rsc_purge, chain); 26082974e916SYuri Benditovich memset(&chain->stat, 0, sizeof(chain->stat)); 26092974e916SYuri Benditovich 26102974e916SYuri Benditovich QTAILQ_INIT(&chain->buffers); 26112974e916SYuri Benditovich QTAILQ_INSERT_TAIL(&n->rsc_chains, chain, next); 26122974e916SYuri Benditovich 26132974e916SYuri Benditovich return chain; 26142974e916SYuri Benditovich } 26152974e916SYuri Benditovich 26162974e916SYuri Benditovich static ssize_t virtio_net_rsc_receive(NetClientState *nc, 26172974e916SYuri Benditovich const uint8_t *buf, 26182974e916SYuri Benditovich size_t size) 26192974e916SYuri Benditovich { 26202974e916SYuri Benditovich uint16_t proto; 26212974e916SYuri Benditovich VirtioNetRscChain *chain; 26222974e916SYuri Benditovich struct eth_header *eth; 26232974e916SYuri Benditovich VirtIONet *n; 26242974e916SYuri Benditovich 26252974e916SYuri Benditovich n = qemu_get_nic_opaque(nc); 26262974e916SYuri Benditovich if (size < (n->host_hdr_len + sizeof(struct eth_header))) { 26272974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26282974e916SYuri Benditovich } 26292974e916SYuri Benditovich 26302974e916SYuri Benditovich eth = (struct eth_header *)(buf + n->guest_hdr_len); 26312974e916SYuri Benditovich proto = htons(eth->h_proto); 26322974e916SYuri Benditovich 26332974e916SYuri Benditovich chain = virtio_net_rsc_lookup_chain(n, nc, proto); 26342974e916SYuri Benditovich if (chain) { 26352974e916SYuri Benditovich chain->stat.received++; 26362974e916SYuri Benditovich if (proto == (uint16_t)ETH_P_IP && n->rsc4_enabled) { 26372974e916SYuri Benditovich return virtio_net_rsc_receive4(chain, nc, buf, size); 26382974e916SYuri Benditovich } else if (proto == (uint16_t)ETH_P_IPV6 && n->rsc6_enabled) { 26392974e916SYuri Benditovich return virtio_net_rsc_receive6(chain, nc, buf, size); 26402974e916SYuri Benditovich } 26412974e916SYuri Benditovich } 26422974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26432974e916SYuri Benditovich } 26442974e916SYuri Benditovich 26452974e916SYuri Benditovich static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, 26462974e916SYuri Benditovich size_t size) 26472974e916SYuri Benditovich { 26482974e916SYuri Benditovich VirtIONet *n = qemu_get_nic_opaque(nc); 26492974e916SYuri Benditovich if ((n->rsc4_enabled || n->rsc6_enabled)) { 26502974e916SYuri Benditovich return virtio_net_rsc_receive(nc, buf, size); 26512974e916SYuri Benditovich } else { 26522974e916SYuri Benditovich return virtio_net_do_receive(nc, buf, size); 26532974e916SYuri Benditovich } 26542974e916SYuri Benditovich } 26552974e916SYuri Benditovich 26566e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q); 26576e790746SPaolo Bonzini 26586e790746SPaolo Bonzini static void virtio_net_tx_complete(NetClientState *nc, ssize_t len) 26596e790746SPaolo Bonzini { 26606e790746SPaolo Bonzini VirtIONet *n = qemu_get_nic_opaque(nc); 26616e790746SPaolo Bonzini VirtIONetQueue *q = virtio_net_get_subqueue(nc); 266217a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 2663df8d0708SLaurent Vivier int ret; 26646e790746SPaolo Bonzini 266551b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, q->async_tx.elem, 0); 266617a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 26676e790746SPaolo Bonzini 266851b19ebeSPaolo Bonzini g_free(q->async_tx.elem); 266951b19ebeSPaolo Bonzini q->async_tx.elem = NULL; 26706e790746SPaolo Bonzini 26716e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 2672df8d0708SLaurent Vivier ret = virtio_net_flush_tx(q); 26737550a822SLaurent Vivier if (ret >= n->tx_burst) { 2674df8d0708SLaurent Vivier /* 2675df8d0708SLaurent Vivier * the flush has been stopped by tx_burst 2676df8d0708SLaurent Vivier * we will not receive notification for the 2677df8d0708SLaurent Vivier * remainining part, so re-schedule 2678df8d0708SLaurent Vivier */ 2679df8d0708SLaurent Vivier virtio_queue_set_notification(q->tx_vq, 0); 26807550a822SLaurent Vivier if (q->tx_bh) { 2681a0bf401bSNicholas Piggin replay_bh_schedule_event(q->tx_bh); 26827550a822SLaurent Vivier } else { 26837550a822SLaurent Vivier timer_mod(q->tx_timer, 26847550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 26857550a822SLaurent Vivier } 2686df8d0708SLaurent Vivier q->tx_waiting = 1; 2687df8d0708SLaurent Vivier } 26886e790746SPaolo Bonzini } 26896e790746SPaolo Bonzini 26906e790746SPaolo Bonzini /* TX */ 26916e790746SPaolo Bonzini static int32_t virtio_net_flush_tx(VirtIONetQueue *q) 26926e790746SPaolo Bonzini { 26936e790746SPaolo Bonzini VirtIONet *n = q->n; 269417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 269551b19ebeSPaolo Bonzini VirtQueueElement *elem; 26966e790746SPaolo Bonzini int32_t num_packets = 0; 26976e790746SPaolo Bonzini int queue_index = vq2q(virtio_get_queue_index(q->tx_vq)); 269817a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 26996e790746SPaolo Bonzini return num_packets; 27006e790746SPaolo Bonzini } 27016e790746SPaolo Bonzini 270251b19ebeSPaolo Bonzini if (q->async_tx.elem) { 27036e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 27046e790746SPaolo Bonzini return num_packets; 27056e790746SPaolo Bonzini } 27066e790746SPaolo Bonzini 270751b19ebeSPaolo Bonzini for (;;) { 2708bd89dd98SJason Wang ssize_t ret; 270951b19ebeSPaolo Bonzini unsigned int out_num; 271051b19ebeSPaolo Bonzini struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg; 2711942f420eSAkihiko Odaki struct virtio_net_hdr vhdr; 27126e790746SPaolo Bonzini 271351b19ebeSPaolo Bonzini elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement)); 271451b19ebeSPaolo Bonzini if (!elem) { 271551b19ebeSPaolo Bonzini break; 271651b19ebeSPaolo Bonzini } 271751b19ebeSPaolo Bonzini 271851b19ebeSPaolo Bonzini out_num = elem->out_num; 271951b19ebeSPaolo Bonzini out_sg = elem->out_sg; 27206e790746SPaolo Bonzini if (out_num < 1) { 2721fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header not in first element"); 27222c3e4e2dSAlexey Dobriyan goto detach; 27236e790746SPaolo Bonzini } 27246e790746SPaolo Bonzini 2725ad57f700SAkihiko Odaki if (n->needs_vnet_hdr_swap) { 2726942f420eSAkihiko Odaki if (iov_to_buf(out_sg, out_num, 0, &vhdr, sizeof(vhdr)) < 2727942f420eSAkihiko Odaki sizeof(vhdr)) { 2728fa5e56c2SGreg Kurz virtio_error(vdev, "virtio-net header incorrect"); 27292c3e4e2dSAlexey Dobriyan goto detach; 2730032a74a1SCédric Le Goater } 2731942f420eSAkihiko Odaki virtio_net_hdr_swap(vdev, &vhdr); 27322220e818SJason Wang sg2[0].iov_base = &vhdr; 2733942f420eSAkihiko Odaki sg2[0].iov_len = sizeof(vhdr); 2734ad57f700SAkihiko Odaki out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1, out_sg, out_num, 2735942f420eSAkihiko Odaki sizeof(vhdr), -1); 2736feb93f36SJason Wang if (out_num == VIRTQUEUE_MAX_SIZE) { 2737feb93f36SJason Wang goto drop; 2738032a74a1SCédric Le Goater } 2739feb93f36SJason Wang out_num += 1; 2740feb93f36SJason Wang out_sg = sg2; 2741feb93f36SJason Wang } 27426e790746SPaolo Bonzini /* 27436e790746SPaolo Bonzini * If host wants to see the guest header as is, we can 27446e790746SPaolo Bonzini * pass it on unchanged. Otherwise, copy just the parts 27456e790746SPaolo Bonzini * that host is interested in. 27466e790746SPaolo Bonzini */ 27476e790746SPaolo Bonzini assert(n->host_hdr_len <= n->guest_hdr_len); 27486e790746SPaolo Bonzini if (n->host_hdr_len != n->guest_hdr_len) { 2749d4f471ebSDmitry Frolov if (iov_size(out_sg, out_num) < n->guest_hdr_len) { 2750d4f471ebSDmitry Frolov virtio_error(vdev, "virtio-net header is invalid"); 2751d4f471ebSDmitry Frolov goto detach; 2752d4f471ebSDmitry Frolov } 27536e790746SPaolo Bonzini unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg), 27546e790746SPaolo Bonzini out_sg, out_num, 27556e790746SPaolo Bonzini 0, n->host_hdr_len); 27566e790746SPaolo Bonzini sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num, 27576e790746SPaolo Bonzini out_sg, out_num, 27586e790746SPaolo Bonzini n->guest_hdr_len, -1); 27596e790746SPaolo Bonzini out_num = sg_num; 27606e790746SPaolo Bonzini out_sg = sg; 27612c3e4e2dSAlexey Dobriyan 27622c3e4e2dSAlexey Dobriyan if (out_num < 1) { 27632c3e4e2dSAlexey Dobriyan virtio_error(vdev, "virtio-net nothing to send"); 27642c3e4e2dSAlexey Dobriyan goto detach; 27652c3e4e2dSAlexey Dobriyan } 27666e790746SPaolo Bonzini } 27676e790746SPaolo Bonzini 27686e790746SPaolo Bonzini ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index), 27696e790746SPaolo Bonzini out_sg, out_num, virtio_net_tx_complete); 27706e790746SPaolo Bonzini if (ret == 0) { 27716e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 27726e790746SPaolo Bonzini q->async_tx.elem = elem; 27736e790746SPaolo Bonzini return -EBUSY; 27746e790746SPaolo Bonzini } 27756e790746SPaolo Bonzini 2776feb93f36SJason Wang drop: 277751b19ebeSPaolo Bonzini virtqueue_push(q->tx_vq, elem, 0); 277817a0ca55SKONRAD Frederic virtio_notify(vdev, q->tx_vq); 277951b19ebeSPaolo Bonzini g_free(elem); 27806e790746SPaolo Bonzini 27816e790746SPaolo Bonzini if (++num_packets >= n->tx_burst) { 27826e790746SPaolo Bonzini break; 27836e790746SPaolo Bonzini } 27846e790746SPaolo Bonzini } 27856e790746SPaolo Bonzini return num_packets; 27862c3e4e2dSAlexey Dobriyan 27872c3e4e2dSAlexey Dobriyan detach: 27882c3e4e2dSAlexey Dobriyan virtqueue_detach_element(q->tx_vq, elem, 0); 27892c3e4e2dSAlexey Dobriyan g_free(elem); 27902c3e4e2dSAlexey Dobriyan return -EINVAL; 27916e790746SPaolo Bonzini } 27926e790746SPaolo Bonzini 27937550a822SLaurent Vivier static void virtio_net_tx_timer(void *opaque); 27947550a822SLaurent Vivier 27956e790746SPaolo Bonzini static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq) 27966e790746SPaolo Bonzini { 279717a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 27986e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 27996e790746SPaolo Bonzini 2800283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2801283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2802283e2c2aSYuri Benditovich return; 2803283e2c2aSYuri Benditovich } 2804283e2c2aSYuri Benditovich 28056e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 280617a0ca55SKONRAD Frederic if (!vdev->vm_running) { 28076e790746SPaolo Bonzini q->tx_waiting = 1; 28086e790746SPaolo Bonzini return; 28096e790746SPaolo Bonzini } 28106e790746SPaolo Bonzini 28116e790746SPaolo Bonzini if (q->tx_waiting) { 28127550a822SLaurent Vivier /* We already have queued packets, immediately flush */ 2813bc72ad67SAlex Bligh timer_del(q->tx_timer); 28147550a822SLaurent Vivier virtio_net_tx_timer(q); 28156e790746SPaolo Bonzini } else { 28167550a822SLaurent Vivier /* re-arm timer to flush it (and more) on next tick */ 2817bc72ad67SAlex Bligh timer_mod(q->tx_timer, 2818bc72ad67SAlex Bligh qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 28196e790746SPaolo Bonzini q->tx_waiting = 1; 28206e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 28216e790746SPaolo Bonzini } 28226e790746SPaolo Bonzini } 28236e790746SPaolo Bonzini 28246e790746SPaolo Bonzini static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq) 28256e790746SPaolo Bonzini { 282617a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 28276e790746SPaolo Bonzini VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))]; 28286e790746SPaolo Bonzini 28294c54f5bcSYajun Wu if (unlikely(n->vhost_started)) { 28304c54f5bcSYajun Wu return; 28314c54f5bcSYajun Wu } 28324c54f5bcSYajun Wu 2833283e2c2aSYuri Benditovich if (unlikely((n->status & VIRTIO_NET_S_LINK_UP) == 0)) { 2834283e2c2aSYuri Benditovich virtio_net_drop_tx_queue_data(vdev, vq); 2835283e2c2aSYuri Benditovich return; 2836283e2c2aSYuri Benditovich } 2837283e2c2aSYuri Benditovich 28386e790746SPaolo Bonzini if (unlikely(q->tx_waiting)) { 28396e790746SPaolo Bonzini return; 28406e790746SPaolo Bonzini } 28416e790746SPaolo Bonzini q->tx_waiting = 1; 28426e790746SPaolo Bonzini /* This happens when device was stopped but VCPU wasn't. */ 284317a0ca55SKONRAD Frederic if (!vdev->vm_running) { 28446e790746SPaolo Bonzini return; 28456e790746SPaolo Bonzini } 28466e790746SPaolo Bonzini virtio_queue_set_notification(vq, 0); 2847a0bf401bSNicholas Piggin replay_bh_schedule_event(q->tx_bh); 28486e790746SPaolo Bonzini } 28496e790746SPaolo Bonzini 28506e790746SPaolo Bonzini static void virtio_net_tx_timer(void *opaque) 28516e790746SPaolo Bonzini { 28526e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 28536e790746SPaolo Bonzini VirtIONet *n = q->n; 285417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 28557550a822SLaurent Vivier int ret; 28567550a822SLaurent Vivier 2857e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2858e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2859e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2860e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2861e8bcf842SMichael S. Tsirkin return; 2862e8bcf842SMichael S. Tsirkin } 28636e790746SPaolo Bonzini 28646e790746SPaolo Bonzini q->tx_waiting = 0; 28656e790746SPaolo Bonzini 28666e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 286717a0ca55SKONRAD Frederic if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) { 28686e790746SPaolo Bonzini return; 286917a0ca55SKONRAD Frederic } 28706e790746SPaolo Bonzini 28717550a822SLaurent Vivier ret = virtio_net_flush_tx(q); 28727550a822SLaurent Vivier if (ret == -EBUSY || ret == -EINVAL) { 28737550a822SLaurent Vivier return; 28747550a822SLaurent Vivier } 28757550a822SLaurent Vivier /* 28767550a822SLaurent Vivier * If we flush a full burst of packets, assume there are 28777550a822SLaurent Vivier * more coming and immediately rearm 28787550a822SLaurent Vivier */ 28797550a822SLaurent Vivier if (ret >= n->tx_burst) { 28807550a822SLaurent Vivier q->tx_waiting = 1; 28817550a822SLaurent Vivier timer_mod(q->tx_timer, 28827550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 28837550a822SLaurent Vivier return; 28847550a822SLaurent Vivier } 28857550a822SLaurent Vivier /* 28867550a822SLaurent Vivier * If less than a full burst, re-enable notification and flush 28877550a822SLaurent Vivier * anything that may have come in while we weren't looking. If 28887550a822SLaurent Vivier * we find something, assume the guest is still active and rearm 28897550a822SLaurent Vivier */ 28906e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 28917550a822SLaurent Vivier ret = virtio_net_flush_tx(q); 28927550a822SLaurent Vivier if (ret > 0) { 28937550a822SLaurent Vivier virtio_queue_set_notification(q->tx_vq, 0); 28947550a822SLaurent Vivier q->tx_waiting = 1; 28957550a822SLaurent Vivier timer_mod(q->tx_timer, 28967550a822SLaurent Vivier qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout); 28977550a822SLaurent Vivier } 28986e790746SPaolo Bonzini } 28996e790746SPaolo Bonzini 29006e790746SPaolo Bonzini static void virtio_net_tx_bh(void *opaque) 29016e790746SPaolo Bonzini { 29026e790746SPaolo Bonzini VirtIONetQueue *q = opaque; 29036e790746SPaolo Bonzini VirtIONet *n = q->n; 290417a0ca55SKONRAD Frederic VirtIODevice *vdev = VIRTIO_DEVICE(n); 29056e790746SPaolo Bonzini int32_t ret; 29066e790746SPaolo Bonzini 2907e8bcf842SMichael S. Tsirkin /* This happens when device was stopped but BH wasn't. */ 2908e8bcf842SMichael S. Tsirkin if (!vdev->vm_running) { 2909e8bcf842SMichael S. Tsirkin /* Make sure tx waiting is set, so we'll run when restarted. */ 2910e8bcf842SMichael S. Tsirkin assert(q->tx_waiting); 2911e8bcf842SMichael S. Tsirkin return; 2912e8bcf842SMichael S. Tsirkin } 29136e790746SPaolo Bonzini 29146e790746SPaolo Bonzini q->tx_waiting = 0; 29156e790746SPaolo Bonzini 29166e790746SPaolo Bonzini /* Just in case the driver is not ready on more */ 291717a0ca55SKONRAD Frederic if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) { 29186e790746SPaolo Bonzini return; 291917a0ca55SKONRAD Frederic } 29206e790746SPaolo Bonzini 29216e790746SPaolo Bonzini ret = virtio_net_flush_tx(q); 2922fa5e56c2SGreg Kurz if (ret == -EBUSY || ret == -EINVAL) { 2923fa5e56c2SGreg Kurz return; /* Notification re-enable handled by tx_complete or device 2924fa5e56c2SGreg Kurz * broken */ 29256e790746SPaolo Bonzini } 29266e790746SPaolo Bonzini 29276e790746SPaolo Bonzini /* If we flush a full burst of packets, assume there are 29286e790746SPaolo Bonzini * more coming and immediately reschedule */ 29296e790746SPaolo Bonzini if (ret >= n->tx_burst) { 2930a0bf401bSNicholas Piggin replay_bh_schedule_event(q->tx_bh); 29316e790746SPaolo Bonzini q->tx_waiting = 1; 29326e790746SPaolo Bonzini return; 29336e790746SPaolo Bonzini } 29346e790746SPaolo Bonzini 29356e790746SPaolo Bonzini /* If less than a full burst, re-enable notification and flush 29366e790746SPaolo Bonzini * anything that may have come in while we weren't looking. If 29376e790746SPaolo Bonzini * we find something, assume the guest is still active and reschedule */ 29386e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 1); 2939fa5e56c2SGreg Kurz ret = virtio_net_flush_tx(q); 2940fa5e56c2SGreg Kurz if (ret == -EINVAL) { 2941fa5e56c2SGreg Kurz return; 2942fa5e56c2SGreg Kurz } else if (ret > 0) { 29436e790746SPaolo Bonzini virtio_queue_set_notification(q->tx_vq, 0); 2944a0bf401bSNicholas Piggin replay_bh_schedule_event(q->tx_bh); 29456e790746SPaolo Bonzini q->tx_waiting = 1; 29466e790746SPaolo Bonzini } 29476e790746SPaolo Bonzini } 29486e790746SPaolo Bonzini 2949f9d6dbf0SWen Congyang static void virtio_net_add_queue(VirtIONet *n, int index) 2950f9d6dbf0SWen Congyang { 2951f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2952f9d6dbf0SWen Congyang 29531c0fbfa3SMichael S. Tsirkin n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size, 29541c0fbfa3SMichael S. Tsirkin virtio_net_handle_rx); 29559b02e161SWei Wang 2956f9d6dbf0SWen Congyang if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) { 2957f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 29589b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 29599b02e161SWei Wang virtio_net_handle_tx_timer); 2960f9d6dbf0SWen Congyang n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, 2961f9d6dbf0SWen Congyang virtio_net_tx_timer, 2962f9d6dbf0SWen Congyang &n->vqs[index]); 2963f9d6dbf0SWen Congyang } else { 2964f9d6dbf0SWen Congyang n->vqs[index].tx_vq = 29659b02e161SWei Wang virtio_add_queue(vdev, n->net_conf.tx_queue_size, 29669b02e161SWei Wang virtio_net_handle_tx_bh); 2967f63192b0SAlexander Bulekov n->vqs[index].tx_bh = qemu_bh_new_guarded(virtio_net_tx_bh, &n->vqs[index], 2968f63192b0SAlexander Bulekov &DEVICE(vdev)->mem_reentrancy_guard); 2969f9d6dbf0SWen Congyang } 2970f9d6dbf0SWen Congyang 2971f9d6dbf0SWen Congyang n->vqs[index].tx_waiting = 0; 2972f9d6dbf0SWen Congyang n->vqs[index].n = n; 2973f9d6dbf0SWen Congyang } 2974f9d6dbf0SWen Congyang 2975f9d6dbf0SWen Congyang static void virtio_net_del_queue(VirtIONet *n, int index) 2976f9d6dbf0SWen Congyang { 2977f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2978f9d6dbf0SWen Congyang VirtIONetQueue *q = &n->vqs[index]; 2979f9d6dbf0SWen Congyang NetClientState *nc = qemu_get_subqueue(n->nic, index); 2980f9d6dbf0SWen Congyang 2981f9d6dbf0SWen Congyang qemu_purge_queued_packets(nc); 2982f9d6dbf0SWen Congyang 2983f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2); 2984f9d6dbf0SWen Congyang if (q->tx_timer) { 2985f9d6dbf0SWen Congyang timer_free(q->tx_timer); 2986f989c30cSYunjian Wang q->tx_timer = NULL; 2987f9d6dbf0SWen Congyang } else { 2988f9d6dbf0SWen Congyang qemu_bh_delete(q->tx_bh); 2989f989c30cSYunjian Wang q->tx_bh = NULL; 2990f9d6dbf0SWen Congyang } 2991f989c30cSYunjian Wang q->tx_waiting = 0; 2992f9d6dbf0SWen Congyang virtio_del_queue(vdev, index * 2 + 1); 2993f9d6dbf0SWen Congyang } 2994f9d6dbf0SWen Congyang 2995441537f1SJason Wang static void virtio_net_change_num_queue_pairs(VirtIONet *n, int new_max_queue_pairs) 2996f9d6dbf0SWen Congyang { 2997f9d6dbf0SWen Congyang VirtIODevice *vdev = VIRTIO_DEVICE(n); 2998f9d6dbf0SWen Congyang int old_num_queues = virtio_get_num_queues(vdev); 2999441537f1SJason Wang int new_num_queues = new_max_queue_pairs * 2 + 1; 3000f9d6dbf0SWen Congyang int i; 3001f9d6dbf0SWen Congyang 3002f9d6dbf0SWen Congyang assert(old_num_queues >= 3); 3003f9d6dbf0SWen Congyang assert(old_num_queues % 2 == 1); 3004f9d6dbf0SWen Congyang 3005f9d6dbf0SWen Congyang if (old_num_queues == new_num_queues) { 3006f9d6dbf0SWen Congyang return; 3007f9d6dbf0SWen Congyang } 3008f9d6dbf0SWen Congyang 3009f9d6dbf0SWen Congyang /* 3010f9d6dbf0SWen Congyang * We always need to remove and add ctrl vq if 3011f9d6dbf0SWen Congyang * old_num_queues != new_num_queues. Remove ctrl_vq first, 301220f86a75SYuval Shaia * and then we only enter one of the following two loops. 3013f9d6dbf0SWen Congyang */ 3014f9d6dbf0SWen Congyang virtio_del_queue(vdev, old_num_queues - 1); 3015f9d6dbf0SWen Congyang 3016f9d6dbf0SWen Congyang for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) { 3017f9d6dbf0SWen Congyang /* new_num_queues < old_num_queues */ 3018f9d6dbf0SWen Congyang virtio_net_del_queue(n, i / 2); 3019f9d6dbf0SWen Congyang } 3020f9d6dbf0SWen Congyang 3021f9d6dbf0SWen Congyang for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) { 3022f9d6dbf0SWen Congyang /* new_num_queues > old_num_queues */ 3023f9d6dbf0SWen Congyang virtio_net_add_queue(n, i / 2); 3024f9d6dbf0SWen Congyang } 3025f9d6dbf0SWen Congyang 3026f9d6dbf0SWen Congyang /* add ctrl_vq last */ 3027f9d6dbf0SWen Congyang n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 3028f9d6dbf0SWen Congyang } 3029f9d6dbf0SWen Congyang 3030ec57db16SJason Wang static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue) 30316e790746SPaolo Bonzini { 3032441537f1SJason Wang int max = multiqueue ? n->max_queue_pairs : 1; 3033f9d6dbf0SWen Congyang 30346e790746SPaolo Bonzini n->multiqueue = multiqueue; 3035441537f1SJason Wang virtio_net_change_num_queue_pairs(n, max); 30366e790746SPaolo Bonzini 3037441537f1SJason Wang virtio_net_set_queue_pairs(n); 30386e790746SPaolo Bonzini } 30396e790746SPaolo Bonzini 3040982b78c5SDr. David Alan Gilbert static int virtio_net_post_load_device(void *opaque, int version_id) 3041037dab2fSGreg Kurz { 3042982b78c5SDr. David Alan Gilbert VirtIONet *n = opaque; 3043982b78c5SDr. David Alan Gilbert VirtIODevice *vdev = VIRTIO_DEVICE(n); 3044037dab2fSGreg Kurz int i, link_down; 3045037dab2fSGreg Kurz 30469d8c6a25SDr. David Alan Gilbert trace_virtio_net_post_load_device(); 3047982b78c5SDr. David Alan Gilbert virtio_net_set_mrg_rx_bufs(n, n->mergeable_rx_bufs, 304895129d6fSCornelia Huck virtio_vdev_has_feature(vdev, 3049e22f0603SYuri Benditovich VIRTIO_F_VERSION_1), 3050e22f0603SYuri Benditovich virtio_vdev_has_feature(vdev, 3051e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT)); 30526e790746SPaolo Bonzini 30536e790746SPaolo Bonzini /* MAC_TABLE_ENTRIES may be different from the saved image */ 3054982b78c5SDr. David Alan Gilbert if (n->mac_table.in_use > MAC_TABLE_ENTRIES) { 30556e790746SPaolo Bonzini n->mac_table.in_use = 0; 30566e790746SPaolo Bonzini } 30576e790746SPaolo Bonzini 3058982b78c5SDr. David Alan Gilbert if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) { 30596c666823SMichael S. Tsirkin n->curr_guest_offloads = virtio_net_supported_guest_offloads(n); 30606c666823SMichael S. Tsirkin } 30616c666823SMichael S. Tsirkin 30627788c3f2SMikhail Sennikovsky /* 30637788c3f2SMikhail Sennikovsky * curr_guest_offloads will be later overwritten by the 30647788c3f2SMikhail Sennikovsky * virtio_set_features_nocheck call done from the virtio_load. 30657788c3f2SMikhail Sennikovsky * Here we make sure it is preserved and restored accordingly 30667788c3f2SMikhail Sennikovsky * in the virtio_net_post_load_virtio callback. 30677788c3f2SMikhail Sennikovsky */ 30687788c3f2SMikhail Sennikovsky n->saved_guest_offloads = n->curr_guest_offloads; 30696c666823SMichael S. Tsirkin 3070441537f1SJason Wang virtio_net_set_queue_pairs(n); 30716e790746SPaolo Bonzini 30726e790746SPaolo Bonzini /* Find the first multicast entry in the saved MAC filter */ 30736e790746SPaolo Bonzini for (i = 0; i < n->mac_table.in_use; i++) { 30746e790746SPaolo Bonzini if (n->mac_table.macs[i * ETH_ALEN] & 1) { 30756e790746SPaolo Bonzini break; 30766e790746SPaolo Bonzini } 30776e790746SPaolo Bonzini } 30786e790746SPaolo Bonzini n->mac_table.first_multi = i; 30796e790746SPaolo Bonzini 30806e790746SPaolo Bonzini /* nc.link_down can't be migrated, so infer link_down according 30816e790746SPaolo Bonzini * to link status bit in n->status */ 30826e790746SPaolo Bonzini link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0; 3083441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 30846e790746SPaolo Bonzini qemu_get_subqueue(n->nic, i)->link_down = link_down; 30856e790746SPaolo Bonzini } 30866e790746SPaolo Bonzini 30876c666823SMichael S. Tsirkin if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) && 30886c666823SMichael S. Tsirkin virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 30899d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 30909d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 30919d8c6a25SDr. David Alan Gilbert virtio_net_announce_timer, n); 30929d8c6a25SDr. David Alan Gilbert if (n->announce_timer.round) { 30939d8c6a25SDr. David Alan Gilbert timer_mod(n->announce_timer.tm, 30949d8c6a25SDr. David Alan Gilbert qemu_clock_get_ms(n->announce_timer.type)); 30959d8c6a25SDr. David Alan Gilbert } else { 3096944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 30979d8c6a25SDr. David Alan Gilbert } 30986c666823SMichael S. Tsirkin } 30996c666823SMichael S. Tsirkin 31000e07198eSAkihiko Odaki virtio_net_commit_rss_config(n); 31016e790746SPaolo Bonzini return 0; 31026e790746SPaolo Bonzini } 31036e790746SPaolo Bonzini 31047788c3f2SMikhail Sennikovsky static int virtio_net_post_load_virtio(VirtIODevice *vdev) 31057788c3f2SMikhail Sennikovsky { 31067788c3f2SMikhail Sennikovsky VirtIONet *n = VIRTIO_NET(vdev); 31077788c3f2SMikhail Sennikovsky /* 31087788c3f2SMikhail Sennikovsky * The actual needed state is now in saved_guest_offloads, 31097788c3f2SMikhail Sennikovsky * see virtio_net_post_load_device for detail. 31107788c3f2SMikhail Sennikovsky * Restore it back and apply the desired offloads. 31117788c3f2SMikhail Sennikovsky */ 31127788c3f2SMikhail Sennikovsky n->curr_guest_offloads = n->saved_guest_offloads; 31137788c3f2SMikhail Sennikovsky if (peer_has_vnet_hdr(n)) { 31147788c3f2SMikhail Sennikovsky virtio_net_apply_guest_offloads(n); 31157788c3f2SMikhail Sennikovsky } 31167788c3f2SMikhail Sennikovsky 31177788c3f2SMikhail Sennikovsky return 0; 31187788c3f2SMikhail Sennikovsky } 31197788c3f2SMikhail Sennikovsky 3120982b78c5SDr. David Alan Gilbert /* tx_waiting field of a VirtIONetQueue */ 3121982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_queue_tx_waiting = { 3122982b78c5SDr. David Alan Gilbert .name = "virtio-net-queue-tx_waiting", 31231de81b42SRichard Henderson .fields = (const VMStateField[]) { 3124982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(tx_waiting, VirtIONetQueue), 3125982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3126982b78c5SDr. David Alan Gilbert }, 3127982b78c5SDr. David Alan Gilbert }; 3128982b78c5SDr. David Alan Gilbert 3129441537f1SJason Wang static bool max_queue_pairs_gt_1(void *opaque, int version_id) 3130982b78c5SDr. David Alan Gilbert { 3131441537f1SJason Wang return VIRTIO_NET(opaque)->max_queue_pairs > 1; 3132982b78c5SDr. David Alan Gilbert } 3133982b78c5SDr. David Alan Gilbert 3134982b78c5SDr. David Alan Gilbert static bool has_ctrl_guest_offloads(void *opaque, int version_id) 3135982b78c5SDr. David Alan Gilbert { 3136982b78c5SDr. David Alan Gilbert return virtio_vdev_has_feature(VIRTIO_DEVICE(opaque), 3137982b78c5SDr. David Alan Gilbert VIRTIO_NET_F_CTRL_GUEST_OFFLOADS); 3138982b78c5SDr. David Alan Gilbert } 3139982b78c5SDr. David Alan Gilbert 3140982b78c5SDr. David Alan Gilbert static bool mac_table_fits(void *opaque, int version_id) 3141982b78c5SDr. David Alan Gilbert { 3142982b78c5SDr. David Alan Gilbert return VIRTIO_NET(opaque)->mac_table.in_use <= MAC_TABLE_ENTRIES; 3143982b78c5SDr. David Alan Gilbert } 3144982b78c5SDr. David Alan Gilbert 3145982b78c5SDr. David Alan Gilbert static bool mac_table_doesnt_fit(void *opaque, int version_id) 3146982b78c5SDr. David Alan Gilbert { 3147982b78c5SDr. David Alan Gilbert return !mac_table_fits(opaque, version_id); 3148982b78c5SDr. David Alan Gilbert } 3149982b78c5SDr. David Alan Gilbert 3150982b78c5SDr. David Alan Gilbert /* This temporary type is shared by all the WITH_TMP methods 3151982b78c5SDr. David Alan Gilbert * although only some fields are used by each. 3152982b78c5SDr. David Alan Gilbert */ 3153982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp { 3154982b78c5SDr. David Alan Gilbert VirtIONet *parent; 3155982b78c5SDr. David Alan Gilbert VirtIONetQueue *vqs_1; 3156441537f1SJason Wang uint16_t curr_queue_pairs_1; 3157982b78c5SDr. David Alan Gilbert uint8_t has_ufo; 3158982b78c5SDr. David Alan Gilbert uint32_t has_vnet_hdr; 3159982b78c5SDr. David Alan Gilbert }; 3160982b78c5SDr. David Alan Gilbert 3161982b78c5SDr. David Alan Gilbert /* The 2nd and subsequent tx_waiting flags are loaded later than 3162441537f1SJason Wang * the 1st entry in the queue_pairs and only if there's more than one 3163982b78c5SDr. David Alan Gilbert * entry. We use the tmp mechanism to calculate a temporary 3164982b78c5SDr. David Alan Gilbert * pointer and count and also validate the count. 3165982b78c5SDr. David Alan Gilbert */ 3166982b78c5SDr. David Alan Gilbert 316744b1ff31SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_save(void *opaque) 3168982b78c5SDr. David Alan Gilbert { 3169982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3170982b78c5SDr. David Alan Gilbert 3171982b78c5SDr. David Alan Gilbert tmp->vqs_1 = tmp->parent->vqs + 1; 3172441537f1SJason Wang tmp->curr_queue_pairs_1 = tmp->parent->curr_queue_pairs - 1; 3173441537f1SJason Wang if (tmp->parent->curr_queue_pairs == 0) { 3174441537f1SJason Wang tmp->curr_queue_pairs_1 = 0; 3175982b78c5SDr. David Alan Gilbert } 317644b1ff31SDr. David Alan Gilbert 317744b1ff31SDr. David Alan Gilbert return 0; 3178982b78c5SDr. David Alan Gilbert } 3179982b78c5SDr. David Alan Gilbert 3180982b78c5SDr. David Alan Gilbert static int virtio_net_tx_waiting_pre_load(void *opaque) 3181982b78c5SDr. David Alan Gilbert { 3182982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3183982b78c5SDr. David Alan Gilbert 3184982b78c5SDr. David Alan Gilbert /* Reuse the pointer setup from save */ 3185982b78c5SDr. David Alan Gilbert virtio_net_tx_waiting_pre_save(opaque); 3186982b78c5SDr. David Alan Gilbert 3187441537f1SJason Wang if (tmp->parent->curr_queue_pairs > tmp->parent->max_queue_pairs) { 3188441537f1SJason Wang error_report("virtio-net: curr_queue_pairs %x > max_queue_pairs %x", 3189441537f1SJason Wang tmp->parent->curr_queue_pairs, tmp->parent->max_queue_pairs); 3190982b78c5SDr. David Alan Gilbert 3191982b78c5SDr. David Alan Gilbert return -EINVAL; 3192982b78c5SDr. David Alan Gilbert } 3193982b78c5SDr. David Alan Gilbert 3194982b78c5SDr. David Alan Gilbert return 0; /* all good */ 3195982b78c5SDr. David Alan Gilbert } 3196982b78c5SDr. David Alan Gilbert 3197982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_tx_waiting = { 3198982b78c5SDr. David Alan Gilbert .name = "virtio-net-tx_waiting", 3199982b78c5SDr. David Alan Gilbert .pre_load = virtio_net_tx_waiting_pre_load, 3200982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_tx_waiting_pre_save, 32011de81b42SRichard Henderson .fields = (const VMStateField[]) { 3202982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_VARRAY_POINTER_UINT16(vqs_1, struct VirtIONetMigTmp, 3203441537f1SJason Wang curr_queue_pairs_1, 3204982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3205982b78c5SDr. David Alan Gilbert struct VirtIONetQueue), 3206982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3207982b78c5SDr. David Alan Gilbert }, 3208982b78c5SDr. David Alan Gilbert }; 3209982b78c5SDr. David Alan Gilbert 3210982b78c5SDr. David Alan Gilbert /* the 'has_ufo' flag is just tested; if the incoming stream has the 3211982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3212982b78c5SDr. David Alan Gilbert */ 3213982b78c5SDr. David Alan Gilbert static int virtio_net_ufo_post_load(void *opaque, int version_id) 3214982b78c5SDr. David Alan Gilbert { 3215982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3216982b78c5SDr. David Alan Gilbert 3217982b78c5SDr. David Alan Gilbert if (tmp->has_ufo && !peer_has_ufo(tmp->parent)) { 3218982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires TUN_F_UFO support"); 3219982b78c5SDr. David Alan Gilbert return -EINVAL; 3220982b78c5SDr. David Alan Gilbert } 3221982b78c5SDr. David Alan Gilbert 3222982b78c5SDr. David Alan Gilbert return 0; 3223982b78c5SDr. David Alan Gilbert } 3224982b78c5SDr. David Alan Gilbert 322544b1ff31SDr. David Alan Gilbert static int virtio_net_ufo_pre_save(void *opaque) 3226982b78c5SDr. David Alan Gilbert { 3227982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3228982b78c5SDr. David Alan Gilbert 3229982b78c5SDr. David Alan Gilbert tmp->has_ufo = tmp->parent->has_ufo; 323044b1ff31SDr. David Alan Gilbert 323144b1ff31SDr. David Alan Gilbert return 0; 3232982b78c5SDr. David Alan Gilbert } 3233982b78c5SDr. David Alan Gilbert 3234982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_ufo = { 3235982b78c5SDr. David Alan Gilbert .name = "virtio-net-ufo", 3236982b78c5SDr. David Alan Gilbert .post_load = virtio_net_ufo_post_load, 3237982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_ufo_pre_save, 32381de81b42SRichard Henderson .fields = (const VMStateField[]) { 3239982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(has_ufo, struct VirtIONetMigTmp), 3240982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3241982b78c5SDr. David Alan Gilbert }, 3242982b78c5SDr. David Alan Gilbert }; 3243982b78c5SDr. David Alan Gilbert 3244982b78c5SDr. David Alan Gilbert /* the 'has_vnet_hdr' flag is just tested; if the incoming stream has the 3245982b78c5SDr. David Alan Gilbert * flag set we need to check that we have it 3246982b78c5SDr. David Alan Gilbert */ 3247982b78c5SDr. David Alan Gilbert static int virtio_net_vnet_post_load(void *opaque, int version_id) 3248982b78c5SDr. David Alan Gilbert { 3249982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3250982b78c5SDr. David Alan Gilbert 3251982b78c5SDr. David Alan Gilbert if (tmp->has_vnet_hdr && !peer_has_vnet_hdr(tmp->parent)) { 3252982b78c5SDr. David Alan Gilbert error_report("virtio-net: saved image requires vnet_hdr=on"); 3253982b78c5SDr. David Alan Gilbert return -EINVAL; 3254982b78c5SDr. David Alan Gilbert } 3255982b78c5SDr. David Alan Gilbert 3256982b78c5SDr. David Alan Gilbert return 0; 3257982b78c5SDr. David Alan Gilbert } 3258982b78c5SDr. David Alan Gilbert 325944b1ff31SDr. David Alan Gilbert static int virtio_net_vnet_pre_save(void *opaque) 3260982b78c5SDr. David Alan Gilbert { 3261982b78c5SDr. David Alan Gilbert struct VirtIONetMigTmp *tmp = opaque; 3262982b78c5SDr. David Alan Gilbert 3263982b78c5SDr. David Alan Gilbert tmp->has_vnet_hdr = tmp->parent->has_vnet_hdr; 326444b1ff31SDr. David Alan Gilbert 326544b1ff31SDr. David Alan Gilbert return 0; 3266982b78c5SDr. David Alan Gilbert } 3267982b78c5SDr. David Alan Gilbert 3268982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_has_vnet = { 3269982b78c5SDr. David Alan Gilbert .name = "virtio-net-vnet", 3270982b78c5SDr. David Alan Gilbert .post_load = virtio_net_vnet_post_load, 3271982b78c5SDr. David Alan Gilbert .pre_save = virtio_net_vnet_pre_save, 32721de81b42SRichard Henderson .fields = (const VMStateField[]) { 3273982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(has_vnet_hdr, struct VirtIONetMigTmp), 3274982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3275982b78c5SDr. David Alan Gilbert }, 3276982b78c5SDr. David Alan Gilbert }; 3277982b78c5SDr. David Alan Gilbert 3278e41b7114SYuri Benditovich static bool virtio_net_rss_needed(void *opaque) 3279e41b7114SYuri Benditovich { 3280e41b7114SYuri Benditovich return VIRTIO_NET(opaque)->rss_data.enabled; 3281e41b7114SYuri Benditovich } 3282e41b7114SYuri Benditovich 3283e41b7114SYuri Benditovich static const VMStateDescription vmstate_virtio_net_rss = { 3284e41b7114SYuri Benditovich .name = "virtio-net-device/rss", 3285e41b7114SYuri Benditovich .version_id = 1, 3286e41b7114SYuri Benditovich .minimum_version_id = 1, 3287e41b7114SYuri Benditovich .needed = virtio_net_rss_needed, 32881de81b42SRichard Henderson .fields = (const VMStateField[]) { 3289e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.enabled, VirtIONet), 3290e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.redirect, VirtIONet), 3291e41b7114SYuri Benditovich VMSTATE_BOOL(rss_data.populate_hash, VirtIONet), 3292e41b7114SYuri Benditovich VMSTATE_UINT32(rss_data.hash_types, VirtIONet), 3293e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.indirections_len, VirtIONet), 3294e41b7114SYuri Benditovich VMSTATE_UINT16(rss_data.default_queue, VirtIONet), 3295e41b7114SYuri Benditovich VMSTATE_UINT8_ARRAY(rss_data.key, VirtIONet, 3296e41b7114SYuri Benditovich VIRTIO_NET_RSS_MAX_KEY_SIZE), 3297e41b7114SYuri Benditovich VMSTATE_VARRAY_UINT16_ALLOC(rss_data.indirections_table, VirtIONet, 3298e41b7114SYuri Benditovich rss_data.indirections_len, 0, 3299e41b7114SYuri Benditovich vmstate_info_uint16, uint16_t), 3300e41b7114SYuri Benditovich VMSTATE_END_OF_LIST() 3301e41b7114SYuri Benditovich }, 3302e41b7114SYuri Benditovich }; 3303e41b7114SYuri Benditovich 3304982b78c5SDr. David Alan Gilbert static const VMStateDescription vmstate_virtio_net_device = { 3305982b78c5SDr. David Alan Gilbert .name = "virtio-net-device", 3306982b78c5SDr. David Alan Gilbert .version_id = VIRTIO_NET_VM_VERSION, 3307982b78c5SDr. David Alan Gilbert .minimum_version_id = VIRTIO_NET_VM_VERSION, 3308982b78c5SDr. David Alan Gilbert .post_load = virtio_net_post_load_device, 33091de81b42SRichard Henderson .fields = (const VMStateField[]) { 3310982b78c5SDr. David Alan Gilbert VMSTATE_UINT8_ARRAY(mac, VirtIONet, ETH_ALEN), 3311982b78c5SDr. David Alan Gilbert VMSTATE_STRUCT_POINTER(vqs, VirtIONet, 3312982b78c5SDr. David Alan Gilbert vmstate_virtio_net_queue_tx_waiting, 3313982b78c5SDr. David Alan Gilbert VirtIONetQueue), 3314982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mergeable_rx_bufs, VirtIONet), 3315982b78c5SDr. David Alan Gilbert VMSTATE_UINT16(status, VirtIONet), 3316982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(promisc, VirtIONet), 3317982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(allmulti, VirtIONet), 3318982b78c5SDr. David Alan Gilbert VMSTATE_UINT32(mac_table.in_use, VirtIONet), 3319982b78c5SDr. David Alan Gilbert 3320982b78c5SDr. David Alan Gilbert /* Guarded pair: If it fits we load it, else we throw it away 3321982b78c5SDr. David Alan Gilbert * - can happen if source has a larger MAC table.; post-load 3322982b78c5SDr. David Alan Gilbert * sets flags in this case. 3323982b78c5SDr. David Alan Gilbert */ 3324982b78c5SDr. David Alan Gilbert VMSTATE_VBUFFER_MULTIPLY(mac_table.macs, VirtIONet, 3325982b78c5SDr. David Alan Gilbert 0, mac_table_fits, mac_table.in_use, 3326982b78c5SDr. David Alan Gilbert ETH_ALEN), 3327982b78c5SDr. David Alan Gilbert VMSTATE_UNUSED_VARRAY_UINT32(VirtIONet, mac_table_doesnt_fit, 0, 3328982b78c5SDr. David Alan Gilbert mac_table.in_use, ETH_ALEN), 3329982b78c5SDr. David Alan Gilbert 3330982b78c5SDr. David Alan Gilbert /* Note: This is an array of uint32's that's always been saved as a 3331982b78c5SDr. David Alan Gilbert * buffer; hold onto your endiannesses; it's actually used as a bitmap 3332982b78c5SDr. David Alan Gilbert * but based on the uint. 3333982b78c5SDr. David Alan Gilbert */ 3334982b78c5SDr. David Alan Gilbert VMSTATE_BUFFER_POINTER_UNSAFE(vlans, VirtIONet, 0, MAX_VLAN >> 3), 3335982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3336982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_vnet), 3337982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.multi_overflow, VirtIONet), 3338982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(mac_table.uni_overflow, VirtIONet), 3339982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(alluni, VirtIONet), 3340982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nomulti, VirtIONet), 3341982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nouni, VirtIONet), 3342982b78c5SDr. David Alan Gilbert VMSTATE_UINT8(nobcast, VirtIONet), 3343982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3344982b78c5SDr. David Alan Gilbert vmstate_virtio_net_has_ufo), 3345441537f1SJason Wang VMSTATE_SINGLE_TEST(max_queue_pairs, VirtIONet, max_queue_pairs_gt_1, 0, 3346982b78c5SDr. David Alan Gilbert vmstate_info_uint16_equal, uint16_t), 3347441537f1SJason Wang VMSTATE_UINT16_TEST(curr_queue_pairs, VirtIONet, max_queue_pairs_gt_1), 3348982b78c5SDr. David Alan Gilbert VMSTATE_WITH_TMP(VirtIONet, struct VirtIONetMigTmp, 3349982b78c5SDr. David Alan Gilbert vmstate_virtio_net_tx_waiting), 3350982b78c5SDr. David Alan Gilbert VMSTATE_UINT64_TEST(curr_guest_offloads, VirtIONet, 3351982b78c5SDr. David Alan Gilbert has_ctrl_guest_offloads), 3352982b78c5SDr. David Alan Gilbert VMSTATE_END_OF_LIST() 3353982b78c5SDr. David Alan Gilbert }, 33541de81b42SRichard Henderson .subsections = (const VMStateDescription * const []) { 3355e41b7114SYuri Benditovich &vmstate_virtio_net_rss, 3356e41b7114SYuri Benditovich NULL 3357e41b7114SYuri Benditovich } 3358982b78c5SDr. David Alan Gilbert }; 3359982b78c5SDr. David Alan Gilbert 33606e790746SPaolo Bonzini static NetClientInfo net_virtio_info = { 3361f394b2e2SEric Blake .type = NET_CLIENT_DRIVER_NIC, 33626e790746SPaolo Bonzini .size = sizeof(NICState), 33636e790746SPaolo Bonzini .can_receive = virtio_net_can_receive, 33646e790746SPaolo Bonzini .receive = virtio_net_receive, 33656e790746SPaolo Bonzini .link_status_changed = virtio_net_set_link_status, 3366b1be4280SAmos Kong .query_rx_filter = virtio_net_query_rxfilter, 3367b2c929f0SDr. David Alan Gilbert .announce = virtio_net_announce, 33686e790746SPaolo Bonzini }; 33696e790746SPaolo Bonzini 33706e790746SPaolo Bonzini static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx) 33716e790746SPaolo Bonzini { 337217a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 337368b0a639SSi-Wei Liu NetClientState *nc; 33746e790746SPaolo Bonzini assert(n->vhost_started); 33751c188fc8SAkihiko Odaki if (!n->multiqueue && idx == 2) { 337668b0a639SSi-Wei Liu /* Must guard against invalid features and bogus queue index 337768b0a639SSi-Wei Liu * from being set by malicious guest, or penetrated through 337868b0a639SSi-Wei Liu * buggy migration stream. 337968b0a639SSi-Wei Liu */ 338068b0a639SSi-Wei Liu if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 338168b0a639SSi-Wei Liu qemu_log_mask(LOG_GUEST_ERROR, 338268b0a639SSi-Wei Liu "%s: bogus vq index ignored\n", __func__); 338368b0a639SSi-Wei Liu return false; 338468b0a639SSi-Wei Liu } 338568b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, n->max_queue_pairs); 338668b0a639SSi-Wei Liu } else { 338768b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, vq2q(idx)); 338868b0a639SSi-Wei Liu } 3389544f0278SCindy Lu /* 3390544f0278SCindy Lu * Add the check for configure interrupt, Use VIRTIO_CONFIG_IRQ_IDX -1 33917e8094f0SAlex Bennée * as the macro of configure interrupt's IDX, If this driver does not 3392544f0278SCindy Lu * support, the function will return false 3393544f0278SCindy Lu */ 3394544f0278SCindy Lu 3395544f0278SCindy Lu if (idx == VIRTIO_CONFIG_IRQ_IDX) { 33968aab0d1dSCindy Lu return vhost_net_config_pending(get_vhost_net(nc->peer)); 3397544f0278SCindy Lu } 3398ed8b4afeSNikolay Nikolaev return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx); 33996e790746SPaolo Bonzini } 34006e790746SPaolo Bonzini 34016e790746SPaolo Bonzini static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx, 34026e790746SPaolo Bonzini bool mask) 34036e790746SPaolo Bonzini { 340417a0ca55SKONRAD Frederic VirtIONet *n = VIRTIO_NET(vdev); 340568b0a639SSi-Wei Liu NetClientState *nc; 34066e790746SPaolo Bonzini assert(n->vhost_started); 34071c188fc8SAkihiko Odaki if (!n->multiqueue && idx == 2) { 340868b0a639SSi-Wei Liu /* Must guard against invalid features and bogus queue index 340968b0a639SSi-Wei Liu * from being set by malicious guest, or penetrated through 341068b0a639SSi-Wei Liu * buggy migration stream. 341168b0a639SSi-Wei Liu */ 341268b0a639SSi-Wei Liu if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) { 341368b0a639SSi-Wei Liu qemu_log_mask(LOG_GUEST_ERROR, 341468b0a639SSi-Wei Liu "%s: bogus vq index ignored\n", __func__); 341568b0a639SSi-Wei Liu return; 341668b0a639SSi-Wei Liu } 341768b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, n->max_queue_pairs); 341868b0a639SSi-Wei Liu } else { 341968b0a639SSi-Wei Liu nc = qemu_get_subqueue(n->nic, vq2q(idx)); 342068b0a639SSi-Wei Liu } 3421544f0278SCindy Lu /* 3422544f0278SCindy Lu *Add the check for configure interrupt, Use VIRTIO_CONFIG_IRQ_IDX -1 34237e8094f0SAlex Bennée * as the macro of configure interrupt's IDX, If this driver does not 3424544f0278SCindy Lu * support, the function will return 3425544f0278SCindy Lu */ 3426544f0278SCindy Lu 3427544f0278SCindy Lu if (idx == VIRTIO_CONFIG_IRQ_IDX) { 34288aab0d1dSCindy Lu vhost_net_config_mask(get_vhost_net(nc->peer), vdev, mask); 3429544f0278SCindy Lu return; 3430544f0278SCindy Lu } 3431544f0278SCindy Lu vhost_net_virtqueue_mask(get_vhost_net(nc->peer), vdev, idx, mask); 34326e790746SPaolo Bonzini } 34336e790746SPaolo Bonzini 3434019a3edbSGerd Hoffmann static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features) 34356e790746SPaolo Bonzini { 34360cd09c3aSCornelia Huck virtio_add_feature(&host_features, VIRTIO_NET_F_MAC); 3437a93e599dSMaxime Coquelin 3438d74c30c8SDaniil Tatianin n->config_size = virtio_get_config_size(&cfg_size_params, host_features); 343917ec5a86SKONRAD Frederic } 34406e790746SPaolo Bonzini 34418a253ec2SKONRAD Frederic void virtio_net_set_netclient_name(VirtIONet *n, const char *name, 34428a253ec2SKONRAD Frederic const char *type) 34438a253ec2SKONRAD Frederic { 34448a253ec2SKONRAD Frederic /* 34458a253ec2SKONRAD Frederic * The name can be NULL, the netclient name will be type.x. 34468a253ec2SKONRAD Frederic */ 34478a253ec2SKONRAD Frederic assert(type != NULL); 34488a253ec2SKONRAD Frederic 34498a253ec2SKONRAD Frederic g_free(n->netclient_name); 34508a253ec2SKONRAD Frederic g_free(n->netclient_type); 34518a253ec2SKONRAD Frederic n->netclient_name = g_strdup(name); 34528a253ec2SKONRAD Frederic n->netclient_type = g_strdup(type); 34538a253ec2SKONRAD Frederic } 34548a253ec2SKONRAD Frederic 34550e9a65c5SJuan Quintela static bool failover_unplug_primary(VirtIONet *n, DeviceState *dev) 34569711cd0dSJens Freimann { 34579711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 34589711cd0dSJens Freimann PCIDevice *pci_dev; 34599711cd0dSJens Freimann Error *err = NULL; 34609711cd0dSJens Freimann 34610e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 34629711cd0dSJens Freimann if (hotplug_ctrl) { 34630e9a65c5SJuan Quintela pci_dev = PCI_DEVICE(dev); 34649711cd0dSJens Freimann pci_dev->partially_hotplugged = true; 34650e9a65c5SJuan Quintela hotplug_handler_unplug_request(hotplug_ctrl, dev, &err); 34669711cd0dSJens Freimann if (err) { 34679711cd0dSJens Freimann error_report_err(err); 34689711cd0dSJens Freimann return false; 34699711cd0dSJens Freimann } 34709711cd0dSJens Freimann } else { 34719711cd0dSJens Freimann return false; 34729711cd0dSJens Freimann } 34739711cd0dSJens Freimann return true; 34749711cd0dSJens Freimann } 34759711cd0dSJens Freimann 34760e9a65c5SJuan Quintela static bool failover_replug_primary(VirtIONet *n, DeviceState *dev, 34770e9a65c5SJuan Quintela Error **errp) 34789711cd0dSJens Freimann { 34795a0948d3SMarkus Armbruster Error *err = NULL; 34809711cd0dSJens Freimann HotplugHandler *hotplug_ctrl; 34810e9a65c5SJuan Quintela PCIDevice *pdev = PCI_DEVICE(dev); 348278274682SJuan Quintela BusState *primary_bus; 34839711cd0dSJens Freimann 34849711cd0dSJens Freimann if (!pdev->partially_hotplugged) { 34859711cd0dSJens Freimann return true; 34869711cd0dSJens Freimann } 34870e9a65c5SJuan Quintela primary_bus = dev->parent_bus; 348878274682SJuan Quintela if (!primary_bus) { 3489150ab54aSJens Freimann error_setg(errp, "virtio_net: couldn't find primary bus"); 34905a0948d3SMarkus Armbruster return false; 34919711cd0dSJens Freimann } 34920e9a65c5SJuan Quintela qdev_set_parent_bus(dev, primary_bus, &error_abort); 3493e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, false); 34940e9a65c5SJuan Quintela hotplug_ctrl = qdev_get_hotplug_handler(dev); 34959711cd0dSJens Freimann if (hotplug_ctrl) { 34960e9a65c5SJuan Quintela hotplug_handler_pre_plug(hotplug_ctrl, dev, &err); 34975a0948d3SMarkus Armbruster if (err) { 34985a0948d3SMarkus Armbruster goto out; 34995a0948d3SMarkus Armbruster } 35000e9a65c5SJuan Quintela hotplug_handler_plug(hotplug_ctrl, dev, &err); 35019711cd0dSJens Freimann } 3502109c20eaSLaurent Vivier pdev->partially_hotplugged = false; 3503150ab54aSJens Freimann 3504150ab54aSJens Freimann out: 35055a0948d3SMarkus Armbruster error_propagate(errp, err); 35065a0948d3SMarkus Armbruster return !err; 35079711cd0dSJens Freimann } 35089711cd0dSJens Freimann 35099d9babf7SSteve Sistare static void virtio_net_handle_migration_primary(VirtIONet *n, MigrationEvent *e) 35109711cd0dSJens Freimann { 35119711cd0dSJens Freimann bool should_be_hidden; 35129711cd0dSJens Freimann Error *err = NULL; 351307a5d816SJuan Quintela DeviceState *dev = failover_find_primary_device(n); 351407a5d816SJuan Quintela 351507a5d816SJuan Quintela if (!dev) { 351607a5d816SJuan Quintela return; 351707a5d816SJuan Quintela } 35189711cd0dSJens Freimann 3519e2bde83eSJuan Quintela should_be_hidden = qatomic_read(&n->failover_primary_hidden); 35209711cd0dSJens Freimann 35219d9babf7SSteve Sistare if (e->type == MIG_EVENT_PRECOPY_SETUP && !should_be_hidden) { 352207a5d816SJuan Quintela if (failover_unplug_primary(n, dev)) { 352307a5d816SJuan Quintela vmstate_unregister(VMSTATE_IF(dev), qdev_get_vmsd(dev), dev); 352407a5d816SJuan Quintela qapi_event_send_unplug_primary(dev->id); 3525e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 35269711cd0dSJens Freimann } else { 35279711cd0dSJens Freimann warn_report("couldn't unplug primary device"); 35289711cd0dSJens Freimann } 35299d9babf7SSteve Sistare } else if (e->type == MIG_EVENT_PRECOPY_FAILED) { 3530150ab54aSJens Freimann /* We already unplugged the device let's plug it back */ 353107a5d816SJuan Quintela if (!failover_replug_primary(n, dev, &err)) { 35329711cd0dSJens Freimann if (err) { 35339711cd0dSJens Freimann error_report_err(err); 35349711cd0dSJens Freimann } 35359711cd0dSJens Freimann } 35369711cd0dSJens Freimann } 35379711cd0dSJens Freimann } 35389711cd0dSJens Freimann 35393e775730SSteve Sistare static int virtio_net_migration_state_notifier(NotifierWithReturn *notifier, 35405663dd3fSSteve Sistare MigrationEvent *e, Error **errp) 35419711cd0dSJens Freimann { 35429711cd0dSJens Freimann VirtIONet *n = container_of(notifier, VirtIONet, migration_state); 35439d9babf7SSteve Sistare virtio_net_handle_migration_primary(n, e); 35443e775730SSteve Sistare return 0; 35459711cd0dSJens Freimann } 35469711cd0dSJens Freimann 3547b91ad981SJuan Quintela static bool failover_hide_primary_device(DeviceListener *listener, 3548f3558b1bSKevin Wolf const QDict *device_opts, 3549f3558b1bSKevin Wolf bool from_json, 3550f3558b1bSKevin Wolf Error **errp) 35519711cd0dSJens Freimann { 35529711cd0dSJens Freimann VirtIONet *n = container_of(listener, VirtIONet, primary_listener); 35534f0303aeSJuan Quintela const char *standby_id; 35549711cd0dSJens Freimann 35554d0e59acSJens Freimann if (!device_opts) { 355689631fedSJuan Quintela return false; 35574d0e59acSJens Freimann } 3558bcfc906bSLaurent Vivier 3559bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "failover_pair_id")) { 3560bcfc906bSLaurent Vivier return false; 3561bcfc906bSLaurent Vivier } 3562bcfc906bSLaurent Vivier 3563bcfc906bSLaurent Vivier if (!qdict_haskey(device_opts, "id")) { 3564bcfc906bSLaurent Vivier error_setg(errp, "Device with failover_pair_id needs to have id"); 3565bcfc906bSLaurent Vivier return false; 3566bcfc906bSLaurent Vivier } 3567bcfc906bSLaurent Vivier 3568bcfc906bSLaurent Vivier standby_id = qdict_get_str(device_opts, "failover_pair_id"); 356989631fedSJuan Quintela if (g_strcmp0(standby_id, n->netclient_name) != 0) { 357089631fedSJuan Quintela return false; 35719711cd0dSJens Freimann } 35729711cd0dSJens Freimann 35737fe7791eSLaurent Vivier /* 35747fe7791eSLaurent Vivier * The hide helper can be called several times for a given device. 35757fe7791eSLaurent Vivier * Check there is only one primary for a virtio-net device but 35767fe7791eSLaurent Vivier * don't duplicate the qdict several times if it's called for the same 35777fe7791eSLaurent Vivier * device. 35787fe7791eSLaurent Vivier */ 3579259a10dbSKevin Wolf if (n->primary_opts) { 35807fe7791eSLaurent Vivier const char *old, *new; 35817fe7791eSLaurent Vivier /* devices with failover_pair_id always have an id */ 35827fe7791eSLaurent Vivier old = qdict_get_str(n->primary_opts, "id"); 35837fe7791eSLaurent Vivier new = qdict_get_str(device_opts, "id"); 35847fe7791eSLaurent Vivier if (strcmp(old, new) != 0) { 35857fe7791eSLaurent Vivier error_setg(errp, "Cannot attach more than one primary device to " 35867fe7791eSLaurent Vivier "'%s': '%s' and '%s'", n->netclient_name, old, new); 3587259a10dbSKevin Wolf return false; 3588259a10dbSKevin Wolf } 35897fe7791eSLaurent Vivier } else { 3590f3558b1bSKevin Wolf n->primary_opts = qdict_clone_shallow(device_opts); 3591f3558b1bSKevin Wolf n->primary_opts_from_json = from_json; 35927fe7791eSLaurent Vivier } 3593259a10dbSKevin Wolf 3594e2bde83eSJuan Quintela /* failover_primary_hidden is set during feature negotiation */ 35953abad4a2SJuan Quintela return qatomic_read(&n->failover_primary_hidden); 35969711cd0dSJens Freimann } 35979711cd0dSJens Freimann 3598e6f746b3SAndreas Färber static void virtio_net_device_realize(DeviceState *dev, Error **errp) 359917ec5a86SKONRAD Frederic { 3600e6f746b3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3601284a32f0SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3602284a32f0SAndreas Färber NetClientState *nc; 36031773d9eeSKONRAD Frederic int i; 360417ec5a86SKONRAD Frederic 3605a93e599dSMaxime Coquelin if (n->net_conf.mtu) { 3606127833eeSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_MTU); 3607a93e599dSMaxime Coquelin } 3608a93e599dSMaxime Coquelin 36099473939eSJason Baron if (n->net_conf.duplex_str) { 36109473939eSJason Baron if (strncmp(n->net_conf.duplex_str, "half", 5) == 0) { 36119473939eSJason Baron n->net_conf.duplex = DUPLEX_HALF; 36129473939eSJason Baron } else if (strncmp(n->net_conf.duplex_str, "full", 5) == 0) { 36139473939eSJason Baron n->net_conf.duplex = DUPLEX_FULL; 36149473939eSJason Baron } else { 36159473939eSJason Baron error_setg(errp, "'duplex' must be 'half' or 'full'"); 3616843c4cfcSMarkus Armbruster return; 36179473939eSJason Baron } 36189473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 36199473939eSJason Baron } else { 36209473939eSJason Baron n->net_conf.duplex = DUPLEX_UNKNOWN; 36219473939eSJason Baron } 36229473939eSJason Baron 36239473939eSJason Baron if (n->net_conf.speed < SPEED_UNKNOWN) { 36249473939eSJason Baron error_setg(errp, "'speed' must be between 0 and INT_MAX"); 3625843c4cfcSMarkus Armbruster return; 3626843c4cfcSMarkus Armbruster } 3627843c4cfcSMarkus Armbruster if (n->net_conf.speed >= 0) { 36289473939eSJason Baron n->host_features |= (1ULL << VIRTIO_NET_F_SPEED_DUPLEX); 36299473939eSJason Baron } 36309473939eSJason Baron 36319711cd0dSJens Freimann if (n->failover) { 3632b91ad981SJuan Quintela n->primary_listener.hide_device = failover_hide_primary_device; 3633e2bde83eSJuan Quintela qatomic_set(&n->failover_primary_hidden, true); 36349711cd0dSJens Freimann device_listener_register(&n->primary_listener); 3635d9cda213SSteve Sistare migration_add_notifier(&n->migration_state, 3636d9cda213SSteve Sistare virtio_net_migration_state_notifier); 36379711cd0dSJens Freimann n->host_features |= (1ULL << VIRTIO_NET_F_STANDBY); 36389711cd0dSJens Freimann } 36399711cd0dSJens Freimann 3640da3e8a23SShannon Zhao virtio_net_set_config_size(n, n->host_features); 36413857cd5cSJonah Palmer virtio_init(vdev, VIRTIO_ID_NET, n->config_size); 364217ec5a86SKONRAD Frederic 36431c0fbfa3SMichael S. Tsirkin /* 36441c0fbfa3SMichael S. Tsirkin * We set a lower limit on RX queue size to what it always was. 36451c0fbfa3SMichael S. Tsirkin * Guests that want a smaller ring can always resize it without 36461c0fbfa3SMichael S. Tsirkin * help from us (using virtio 1 and up). 36471c0fbfa3SMichael S. Tsirkin */ 36481c0fbfa3SMichael S. Tsirkin if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE || 36491c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE || 36505f997fd1SMichal Privoznik !is_power_of_2(n->net_conf.rx_queue_size)) { 36511c0fbfa3SMichael S. Tsirkin error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), " 36521c0fbfa3SMichael S. Tsirkin "must be a power of 2 between %d and %d.", 36531c0fbfa3SMichael S. Tsirkin n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE, 36541c0fbfa3SMichael S. Tsirkin VIRTQUEUE_MAX_SIZE); 36551c0fbfa3SMichael S. Tsirkin virtio_cleanup(vdev); 36561c0fbfa3SMichael S. Tsirkin return; 36571c0fbfa3SMichael S. Tsirkin } 36581c0fbfa3SMichael S. Tsirkin 36599b02e161SWei Wang if (n->net_conf.tx_queue_size < VIRTIO_NET_TX_QUEUE_MIN_SIZE || 36604271f403SLaurent Vivier n->net_conf.tx_queue_size > virtio_net_max_tx_queue_size(n) || 36619b02e161SWei Wang !is_power_of_2(n->net_conf.tx_queue_size)) { 36629b02e161SWei Wang error_setg(errp, "Invalid tx_queue_size (= %" PRIu16 "), " 36639b02e161SWei Wang "must be a power of 2 between %d and %d", 36649b02e161SWei Wang n->net_conf.tx_queue_size, VIRTIO_NET_TX_QUEUE_MIN_SIZE, 36654271f403SLaurent Vivier virtio_net_max_tx_queue_size(n)); 36669b02e161SWei Wang virtio_cleanup(vdev); 36679b02e161SWei Wang return; 36689b02e161SWei Wang } 36699b02e161SWei Wang 367022288fe5SJason Wang n->max_ncs = MAX(n->nic_conf.peers.queues, 1); 367122288fe5SJason Wang 367222288fe5SJason Wang /* 367322288fe5SJason Wang * Figure out the datapath queue pairs since the backend could 367422288fe5SJason Wang * provide control queue via peers as well. 367522288fe5SJason Wang */ 367622288fe5SJason Wang if (n->nic_conf.peers.queues) { 367722288fe5SJason Wang for (i = 0; i < n->max_ncs; i++) { 367822288fe5SJason Wang if (n->nic_conf.peers.ncs[i]->is_datapath) { 367922288fe5SJason Wang ++n->max_queue_pairs; 368022288fe5SJason Wang } 368122288fe5SJason Wang } 368222288fe5SJason Wang } 368322288fe5SJason Wang n->max_queue_pairs = MAX(n->max_queue_pairs, 1); 368422288fe5SJason Wang 3685441537f1SJason Wang if (n->max_queue_pairs * 2 + 1 > VIRTIO_QUEUE_MAX) { 368622288fe5SJason Wang error_setg(errp, "Invalid number of queue pairs (= %" PRIu32 "), " 3687631b22eaSStefan Weil "must be a positive integer less than %d.", 3688441537f1SJason Wang n->max_queue_pairs, (VIRTIO_QUEUE_MAX - 1) / 2); 36897e0e736eSJason Wang virtio_cleanup(vdev); 36907e0e736eSJason Wang return; 36917e0e736eSJason Wang } 3692b21e2380SMarkus Armbruster n->vqs = g_new0(VirtIONetQueue, n->max_queue_pairs); 3693441537f1SJason Wang n->curr_queue_pairs = 1; 36941773d9eeSKONRAD Frederic n->tx_timeout = n->net_conf.txtimer; 36956e790746SPaolo Bonzini 36961773d9eeSKONRAD Frederic if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer") 36971773d9eeSKONRAD Frederic && strcmp(n->net_conf.tx, "bh")) { 36980765691eSMarkus Armbruster warn_report("virtio-net: " 36996e790746SPaolo Bonzini "Unknown option tx=%s, valid options: \"timer\" \"bh\"", 37001773d9eeSKONRAD Frederic n->net_conf.tx); 37010765691eSMarkus Armbruster error_printf("Defaulting to \"bh\""); 37026e790746SPaolo Bonzini } 37036e790746SPaolo Bonzini 37042eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size = MIN(virtio_net_max_tx_queue_size(n), 37052eef278bSMichael S. Tsirkin n->net_conf.tx_queue_size); 37069b02e161SWei Wang 37078c497568SAkihiko Odaki virtio_net_add_queue(n, 0); 3708da51a335SJason Wang 370917a0ca55SKONRAD Frederic n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl); 37101773d9eeSKONRAD Frederic qemu_macaddr_default_if_unset(&n->nic_conf.macaddr); 37111773d9eeSKONRAD Frederic memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac)); 37126e790746SPaolo Bonzini n->status = VIRTIO_NET_S_LINK_UP; 37139d8c6a25SDr. David Alan Gilbert qemu_announce_timer_reset(&n->announce_timer, migrate_announce_params(), 37149d8c6a25SDr. David Alan Gilbert QEMU_CLOCK_VIRTUAL, 3715f57fcf70SJason Wang virtio_net_announce_timer, n); 3716b2c929f0SDr. David Alan Gilbert n->announce_timer.round = 0; 37176e790746SPaolo Bonzini 37188a253ec2SKONRAD Frederic if (n->netclient_type) { 37198a253ec2SKONRAD Frederic /* 37208a253ec2SKONRAD Frederic * Happen when virtio_net_set_netclient_name has been called. 37218a253ec2SKONRAD Frederic */ 37228a253ec2SKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 37237d0fefdfSAkihiko Odaki n->netclient_type, n->netclient_name, 37247d0fefdfSAkihiko Odaki &dev->mem_reentrancy_guard, n); 37258a253ec2SKONRAD Frederic } else { 37261773d9eeSKONRAD Frederic n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf, 37277d0fefdfSAkihiko Odaki object_get_typename(OBJECT(dev)), dev->id, 37287d0fefdfSAkihiko Odaki &dev->mem_reentrancy_guard, n); 37298a253ec2SKONRAD Frederic } 37308a253ec2SKONRAD Frederic 3731441537f1SJason Wang for (i = 0; i < n->max_queue_pairs; i++) { 3732d4c62930SBin Meng n->nic->ncs[i].do_not_pad = true; 3733d4c62930SBin Meng } 3734d4c62930SBin Meng 37356e790746SPaolo Bonzini peer_test_vnet_hdr(n); 37366e790746SPaolo Bonzini if (peer_has_vnet_hdr(n)) { 37376e790746SPaolo Bonzini n->host_hdr_len = sizeof(struct virtio_net_hdr); 37386e790746SPaolo Bonzini } else { 37396e790746SPaolo Bonzini n->host_hdr_len = 0; 37406e790746SPaolo Bonzini } 37416e790746SPaolo Bonzini 37421773d9eeSKONRAD Frederic qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a); 37436e790746SPaolo Bonzini 37446e790746SPaolo Bonzini n->vqs[0].tx_waiting = 0; 37451773d9eeSKONRAD Frederic n->tx_burst = n->net_conf.txburst; 3746e22f0603SYuri Benditovich virtio_net_set_mrg_rx_bufs(n, 0, 0, 0); 37476e790746SPaolo Bonzini n->promisc = 1; /* for compatibility */ 37486e790746SPaolo Bonzini 37496e790746SPaolo Bonzini n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN); 37506e790746SPaolo Bonzini 37516e790746SPaolo Bonzini n->vlans = g_malloc0(MAX_VLAN >> 3); 37526e790746SPaolo Bonzini 3753b1be4280SAmos Kong nc = qemu_get_queue(n->nic); 3754b1be4280SAmos Kong nc->rxfilter_notify_enabled = 1; 3755b1be4280SAmos Kong 3756e87936eaSCindy Lu if (nc->peer && nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_VDPA) { 3757e87936eaSCindy Lu struct virtio_net_config netcfg = {}; 3758e87936eaSCindy Lu memcpy(&netcfg.mac, &n->nic_conf.macaddr, ETH_ALEN); 3759e87936eaSCindy Lu vhost_net_set_config(get_vhost_net(nc->peer), 3760f8ed3648SManos Pitsidianakis (uint8_t *)&netcfg, 0, ETH_ALEN, VHOST_SET_CONFIG_TYPE_FRONTEND); 3761e87936eaSCindy Lu } 37622974e916SYuri Benditovich QTAILQ_INIT(&n->rsc_chains); 3763284a32f0SAndreas Färber n->qdev = dev; 37644474e37aSYuri Benditovich 3765aac8f89dSAkihiko Odaki net_rx_pkt_init(&n->rx_pkt); 37660145c393SAndrew Melnychenko 37670145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 3768b5900dffSDaniel P. Berrangé Error *err = NULL; 3769b5900dffSDaniel P. Berrangé if (!virtio_net_load_ebpf(n, &err)) { 3770b5900dffSDaniel P. Berrangé /* 3771b5900dffSDaniel P. Berrangé * If user explicitly gave QEMU RSS FDs to use, then 3772b5900dffSDaniel P. Berrangé * failing to use them must be considered a fatal 3773b5900dffSDaniel P. Berrangé * error. If no RSS FDs were provided, QEMU is trying 3774b5900dffSDaniel P. Berrangé * eBPF on a "best effort" basis only, so report a 3775b5900dffSDaniel P. Berrangé * warning and allow fallback to software RSS. 3776b5900dffSDaniel P. Berrangé */ 3777b5900dffSDaniel P. Berrangé if (n->ebpf_rss_fds) { 3778b5900dffSDaniel P. Berrangé error_propagate(errp, err); 3779b5900dffSDaniel P. Berrangé } else { 3780b5900dffSDaniel P. Berrangé warn_report("unable to load eBPF RSS: %s", 3781b5900dffSDaniel P. Berrangé error_get_pretty(err)); 3782b5900dffSDaniel P. Berrangé error_free(err); 3783b5900dffSDaniel P. Berrangé } 3784b5900dffSDaniel P. Berrangé } 37850145c393SAndrew Melnychenko } 378617ec5a86SKONRAD Frederic } 378717ec5a86SKONRAD Frederic 3788b69c3c21SMarkus Armbruster static void virtio_net_device_unrealize(DeviceState *dev) 378917ec5a86SKONRAD Frederic { 3790306ec6c3SAndreas Färber VirtIODevice *vdev = VIRTIO_DEVICE(dev); 3791306ec6c3SAndreas Färber VirtIONet *n = VIRTIO_NET(dev); 3792441537f1SJason Wang int i, max_queue_pairs; 379317ec5a86SKONRAD Frederic 37940145c393SAndrew Melnychenko if (virtio_has_feature(n->host_features, VIRTIO_NET_F_RSS)) { 37950145c393SAndrew Melnychenko virtio_net_unload_ebpf(n); 37960145c393SAndrew Melnychenko } 37970145c393SAndrew Melnychenko 379817ec5a86SKONRAD Frederic /* This will stop vhost backend if appropriate. */ 379917ec5a86SKONRAD Frederic virtio_net_set_status(vdev, 0); 380017ec5a86SKONRAD Frederic 38018a253ec2SKONRAD Frederic g_free(n->netclient_name); 38028a253ec2SKONRAD Frederic n->netclient_name = NULL; 38038a253ec2SKONRAD Frederic g_free(n->netclient_type); 38048a253ec2SKONRAD Frederic n->netclient_type = NULL; 38058a253ec2SKONRAD Frederic 380617ec5a86SKONRAD Frederic g_free(n->mac_table.macs); 380717ec5a86SKONRAD Frederic g_free(n->vlans); 380817ec5a86SKONRAD Frederic 38099711cd0dSJens Freimann if (n->failover) { 3810f3558b1bSKevin Wolf qobject_unref(n->primary_opts); 381165018100SJuan Quintela device_listener_unregister(&n->primary_listener); 3812d9cda213SSteve Sistare migration_remove_notifier(&n->migration_state); 3813f3558b1bSKevin Wolf } else { 3814f3558b1bSKevin Wolf assert(n->primary_opts == NULL); 38159711cd0dSJens Freimann } 38169711cd0dSJens Freimann 3817441537f1SJason Wang max_queue_pairs = n->multiqueue ? n->max_queue_pairs : 1; 3818441537f1SJason Wang for (i = 0; i < max_queue_pairs; i++) { 3819f9d6dbf0SWen Congyang virtio_net_del_queue(n, i); 382017ec5a86SKONRAD Frederic } 3821d945d9f1SYuri Benditovich /* delete also control vq */ 3822441537f1SJason Wang virtio_del_queue(vdev, max_queue_pairs * 2); 3823944458b6SDr. David Alan Gilbert qemu_announce_timer_del(&n->announce_timer, false); 382417ec5a86SKONRAD Frederic g_free(n->vqs); 382517ec5a86SKONRAD Frederic qemu_del_nic(n->nic); 38262974e916SYuri Benditovich virtio_net_rsc_cleanup(n); 382759079029SYuri Benditovich g_free(n->rss_data.indirections_table); 38284474e37aSYuri Benditovich net_rx_pkt_uninit(n->rx_pkt); 38296a1a8cc7SKONRAD Frederic virtio_cleanup(vdev); 383017ec5a86SKONRAD Frederic } 383117ec5a86SKONRAD Frederic 3832cef776c0SAkihiko Odaki static void virtio_net_reset(VirtIODevice *vdev) 3833cef776c0SAkihiko Odaki { 3834cef776c0SAkihiko Odaki VirtIONet *n = VIRTIO_NET(vdev); 3835cef776c0SAkihiko Odaki int i; 3836cef776c0SAkihiko Odaki 3837cef776c0SAkihiko Odaki /* Reset back to compatibility mode */ 3838cef776c0SAkihiko Odaki n->promisc = 1; 3839cef776c0SAkihiko Odaki n->allmulti = 0; 3840cef776c0SAkihiko Odaki n->alluni = 0; 3841cef776c0SAkihiko Odaki n->nomulti = 0; 3842cef776c0SAkihiko Odaki n->nouni = 0; 3843cef776c0SAkihiko Odaki n->nobcast = 0; 3844cef776c0SAkihiko Odaki /* multiqueue is disabled by default */ 3845cef776c0SAkihiko Odaki n->curr_queue_pairs = 1; 3846cef776c0SAkihiko Odaki timer_del(n->announce_timer.tm); 3847cef776c0SAkihiko Odaki n->announce_timer.round = 0; 3848cef776c0SAkihiko Odaki n->status &= ~VIRTIO_NET_S_ANNOUNCE; 3849cef776c0SAkihiko Odaki 3850cef776c0SAkihiko Odaki /* Flush any MAC and VLAN filter table state */ 3851cef776c0SAkihiko Odaki n->mac_table.in_use = 0; 3852cef776c0SAkihiko Odaki n->mac_table.first_multi = 0; 3853cef776c0SAkihiko Odaki n->mac_table.multi_overflow = 0; 3854cef776c0SAkihiko Odaki n->mac_table.uni_overflow = 0; 3855cef776c0SAkihiko Odaki memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN); 3856cef776c0SAkihiko Odaki memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac)); 3857cef776c0SAkihiko Odaki qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac); 3858cef776c0SAkihiko Odaki memset(n->vlans, 0, MAX_VLAN >> 3); 3859cef776c0SAkihiko Odaki 3860cef776c0SAkihiko Odaki /* Flush any async TX */ 3861cef776c0SAkihiko Odaki for (i = 0; i < n->max_queue_pairs; i++) { 3862cef776c0SAkihiko Odaki flush_or_purge_queued_packets(qemu_get_subqueue(n->nic, i)); 3863cef776c0SAkihiko Odaki } 3864cef776c0SAkihiko Odaki 3865cef776c0SAkihiko Odaki virtio_net_disable_rss(n); 3866cef776c0SAkihiko Odaki } 3867cef776c0SAkihiko Odaki 386817ec5a86SKONRAD Frederic static void virtio_net_instance_init(Object *obj) 386917ec5a86SKONRAD Frederic { 387017ec5a86SKONRAD Frederic VirtIONet *n = VIRTIO_NET(obj); 387117ec5a86SKONRAD Frederic 387217ec5a86SKONRAD Frederic /* 387317ec5a86SKONRAD Frederic * The default config_size is sizeof(struct virtio_net_config). 38742431f4f1SMichael Tokarev * Can be overridden with virtio_net_set_config_size. 387517ec5a86SKONRAD Frederic */ 387617ec5a86SKONRAD Frederic n->config_size = sizeof(struct virtio_net_config); 3877aa4197c3SGonglei device_add_bootindex_property(obj, &n->nic_conf.bootindex, 3878aa4197c3SGonglei "bootindex", "/ethernet-phy@0", 387940c2281cSMarkus Armbruster DEVICE(n)); 38800145c393SAndrew Melnychenko 38810145c393SAndrew Melnychenko ebpf_rss_init(&n->ebpf_rss); 388217ec5a86SKONRAD Frederic } 388317ec5a86SKONRAD Frederic 388444b1ff31SDr. David Alan Gilbert static int virtio_net_pre_save(void *opaque) 38854d45dcfbSHalil Pasic { 38864d45dcfbSHalil Pasic VirtIONet *n = opaque; 38874d45dcfbSHalil Pasic 38884d45dcfbSHalil Pasic /* At this point, backend must be stopped, otherwise 38894d45dcfbSHalil Pasic * it might keep writing to memory. */ 38904d45dcfbSHalil Pasic assert(!n->vhost_started); 389144b1ff31SDr. David Alan Gilbert 389244b1ff31SDr. David Alan Gilbert return 0; 38934d45dcfbSHalil Pasic } 38944d45dcfbSHalil Pasic 38959711cd0dSJens Freimann static bool primary_unplug_pending(void *opaque) 38969711cd0dSJens Freimann { 38979711cd0dSJens Freimann DeviceState *dev = opaque; 389821e8709bSJuan Quintela DeviceState *primary; 38999711cd0dSJens Freimann VirtIODevice *vdev = VIRTIO_DEVICE(dev); 39009711cd0dSJens Freimann VirtIONet *n = VIRTIO_NET(vdev); 39019711cd0dSJens Freimann 3902284f42a5SJens Freimann if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_STANDBY)) { 3903284f42a5SJens Freimann return false; 3904284f42a5SJens Freimann } 390521e8709bSJuan Quintela primary = failover_find_primary_device(n); 390621e8709bSJuan Quintela return primary ? primary->pending_deleted_event : false; 39079711cd0dSJens Freimann } 39089711cd0dSJens Freimann 39099711cd0dSJens Freimann static bool dev_unplug_pending(void *opaque) 39109711cd0dSJens Freimann { 39119711cd0dSJens Freimann DeviceState *dev = opaque; 39129711cd0dSJens Freimann VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(dev); 39139711cd0dSJens Freimann 39149711cd0dSJens Freimann return vdc->primary_unplug_pending(dev); 39159711cd0dSJens Freimann } 39169711cd0dSJens Freimann 3917c255488dSJonah Palmer static struct vhost_dev *virtio_net_get_vhost(VirtIODevice *vdev) 3918c255488dSJonah Palmer { 3919c255488dSJonah Palmer VirtIONet *n = VIRTIO_NET(vdev); 392000adced5SHanna Czenczek NetClientState *nc; 392100adced5SHanna Czenczek struct vhost_net *net; 392200adced5SHanna Czenczek 392300adced5SHanna Czenczek if (!n->nic) { 392400adced5SHanna Czenczek return NULL; 392500adced5SHanna Czenczek } 392600adced5SHanna Czenczek 392700adced5SHanna Czenczek nc = qemu_get_queue(n->nic); 392800adced5SHanna Czenczek if (!nc) { 392900adced5SHanna Czenczek return NULL; 393000adced5SHanna Czenczek } 393100adced5SHanna Czenczek 393200adced5SHanna Czenczek net = get_vhost_net(nc->peer); 393300adced5SHanna Czenczek if (!net) { 393400adced5SHanna Czenczek return NULL; 393500adced5SHanna Czenczek } 393600adced5SHanna Czenczek 3937c255488dSJonah Palmer return &net->dev; 3938c255488dSJonah Palmer } 3939c255488dSJonah Palmer 39404d45dcfbSHalil Pasic static const VMStateDescription vmstate_virtio_net = { 39414d45dcfbSHalil Pasic .name = "virtio-net", 39424d45dcfbSHalil Pasic .minimum_version_id = VIRTIO_NET_VM_VERSION, 39434d45dcfbSHalil Pasic .version_id = VIRTIO_NET_VM_VERSION, 39441de81b42SRichard Henderson .fields = (const VMStateField[]) { 39454d45dcfbSHalil Pasic VMSTATE_VIRTIO_DEVICE, 39464d45dcfbSHalil Pasic VMSTATE_END_OF_LIST() 39474d45dcfbSHalil Pasic }, 39484d45dcfbSHalil Pasic .pre_save = virtio_net_pre_save, 39499711cd0dSJens Freimann .dev_unplug_pending = dev_unplug_pending, 39504d45dcfbSHalil Pasic }; 3951290c2428SDr. David Alan Gilbert 395217ec5a86SKONRAD Frederic static Property virtio_net_properties[] = { 3953127833eeSJason Baron DEFINE_PROP_BIT64("csum", VirtIONet, host_features, 3954127833eeSJason Baron VIRTIO_NET_F_CSUM, true), 3955127833eeSJason Baron DEFINE_PROP_BIT64("guest_csum", VirtIONet, host_features, 395687108bb2SShannon Zhao VIRTIO_NET_F_GUEST_CSUM, true), 3957127833eeSJason Baron DEFINE_PROP_BIT64("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true), 3958127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso4", VirtIONet, host_features, 395987108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO4, true), 3960127833eeSJason Baron DEFINE_PROP_BIT64("guest_tso6", VirtIONet, host_features, 396187108bb2SShannon Zhao VIRTIO_NET_F_GUEST_TSO6, true), 3962127833eeSJason Baron DEFINE_PROP_BIT64("guest_ecn", VirtIONet, host_features, 396387108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ECN, true), 3964127833eeSJason Baron DEFINE_PROP_BIT64("guest_ufo", VirtIONet, host_features, 396587108bb2SShannon Zhao VIRTIO_NET_F_GUEST_UFO, true), 3966127833eeSJason Baron DEFINE_PROP_BIT64("guest_announce", VirtIONet, host_features, 396787108bb2SShannon Zhao VIRTIO_NET_F_GUEST_ANNOUNCE, true), 3968127833eeSJason Baron DEFINE_PROP_BIT64("host_tso4", VirtIONet, host_features, 396987108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO4, true), 3970127833eeSJason Baron DEFINE_PROP_BIT64("host_tso6", VirtIONet, host_features, 397187108bb2SShannon Zhao VIRTIO_NET_F_HOST_TSO6, true), 3972127833eeSJason Baron DEFINE_PROP_BIT64("host_ecn", VirtIONet, host_features, 397387108bb2SShannon Zhao VIRTIO_NET_F_HOST_ECN, true), 3974127833eeSJason Baron DEFINE_PROP_BIT64("host_ufo", VirtIONet, host_features, 397587108bb2SShannon Zhao VIRTIO_NET_F_HOST_UFO, true), 3976127833eeSJason Baron DEFINE_PROP_BIT64("mrg_rxbuf", VirtIONet, host_features, 397787108bb2SShannon Zhao VIRTIO_NET_F_MRG_RXBUF, true), 3978127833eeSJason Baron DEFINE_PROP_BIT64("status", VirtIONet, host_features, 397987108bb2SShannon Zhao VIRTIO_NET_F_STATUS, true), 3980127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vq", VirtIONet, host_features, 398187108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VQ, true), 3982127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx", VirtIONet, host_features, 398387108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX, true), 3984127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_vlan", VirtIONet, host_features, 398587108bb2SShannon Zhao VIRTIO_NET_F_CTRL_VLAN, true), 3986127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_rx_extra", VirtIONet, host_features, 398787108bb2SShannon Zhao VIRTIO_NET_F_CTRL_RX_EXTRA, true), 3988127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_mac_addr", VirtIONet, host_features, 398987108bb2SShannon Zhao VIRTIO_NET_F_CTRL_MAC_ADDR, true), 3990127833eeSJason Baron DEFINE_PROP_BIT64("ctrl_guest_offloads", VirtIONet, host_features, 399187108bb2SShannon Zhao VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true), 3992127833eeSJason Baron DEFINE_PROP_BIT64("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false), 399359079029SYuri Benditovich DEFINE_PROP_BIT64("rss", VirtIONet, host_features, 399459079029SYuri Benditovich VIRTIO_NET_F_RSS, false), 3995e22f0603SYuri Benditovich DEFINE_PROP_BIT64("hash", VirtIONet, host_features, 3996e22f0603SYuri Benditovich VIRTIO_NET_F_HASH_REPORT, false), 39976b230b7dSAndrew Melnychenko DEFINE_PROP_ARRAY("ebpf-rss-fds", VirtIONet, nr_ebpf_rss_fds, 39986b230b7dSAndrew Melnychenko ebpf_rss_fds, qdev_prop_string, char*), 39992974e916SYuri Benditovich DEFINE_PROP_BIT64("guest_rsc_ext", VirtIONet, host_features, 40002974e916SYuri Benditovich VIRTIO_NET_F_RSC_EXT, false), 40012974e916SYuri Benditovich DEFINE_PROP_UINT32("rsc_interval", VirtIONet, rsc_timeout, 40022974e916SYuri Benditovich VIRTIO_NET_RSC_DEFAULT_INTERVAL), 400317ec5a86SKONRAD Frederic DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf), 400417ec5a86SKONRAD Frederic DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer, 400517ec5a86SKONRAD Frederic TX_TIMER_INTERVAL), 400617ec5a86SKONRAD Frederic DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST), 400717ec5a86SKONRAD Frederic DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx), 40081c0fbfa3SMichael S. Tsirkin DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size, 40091c0fbfa3SMichael S. Tsirkin VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE), 40109b02e161SWei Wang DEFINE_PROP_UINT16("tx_queue_size", VirtIONet, net_conf.tx_queue_size, 40119b02e161SWei Wang VIRTIO_NET_TX_QUEUE_DEFAULT_SIZE), 4012a93e599dSMaxime Coquelin DEFINE_PROP_UINT16("host_mtu", VirtIONet, net_conf.mtu, 0), 401375ebec11SMaxime Coquelin DEFINE_PROP_BOOL("x-mtu-bypass-backend", VirtIONet, mtu_bypass_backend, 401475ebec11SMaxime Coquelin true), 40159473939eSJason Baron DEFINE_PROP_INT32("speed", VirtIONet, net_conf.speed, SPEED_UNKNOWN), 40169473939eSJason Baron DEFINE_PROP_STRING("duplex", VirtIONet, net_conf.duplex_str), 40179711cd0dSJens Freimann DEFINE_PROP_BOOL("failover", VirtIONet, failover, false), 401853da8b5aSYuri Benditovich DEFINE_PROP_BIT64("guest_uso4", VirtIONet, host_features, 401953da8b5aSYuri Benditovich VIRTIO_NET_F_GUEST_USO4, true), 402053da8b5aSYuri Benditovich DEFINE_PROP_BIT64("guest_uso6", VirtIONet, host_features, 402153da8b5aSYuri Benditovich VIRTIO_NET_F_GUEST_USO6, true), 402253da8b5aSYuri Benditovich DEFINE_PROP_BIT64("host_uso", VirtIONet, host_features, 402353da8b5aSYuri Benditovich VIRTIO_NET_F_HOST_USO, true), 402417ec5a86SKONRAD Frederic DEFINE_PROP_END_OF_LIST(), 402517ec5a86SKONRAD Frederic }; 402617ec5a86SKONRAD Frederic 402717ec5a86SKONRAD Frederic static void virtio_net_class_init(ObjectClass *klass, void *data) 402817ec5a86SKONRAD Frederic { 402917ec5a86SKONRAD Frederic DeviceClass *dc = DEVICE_CLASS(klass); 403017ec5a86SKONRAD Frederic VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass); 4031e6f746b3SAndreas Färber 40324f67d30bSMarc-André Lureau device_class_set_props(dc, virtio_net_properties); 4033290c2428SDr. David Alan Gilbert dc->vmsd = &vmstate_virtio_net; 4034125ee0edSMarcel Apfelbaum set_bit(DEVICE_CATEGORY_NETWORK, dc->categories); 4035e6f746b3SAndreas Färber vdc->realize = virtio_net_device_realize; 4036306ec6c3SAndreas Färber vdc->unrealize = virtio_net_device_unrealize; 403717ec5a86SKONRAD Frederic vdc->get_config = virtio_net_get_config; 403817ec5a86SKONRAD Frederic vdc->set_config = virtio_net_set_config; 403917ec5a86SKONRAD Frederic vdc->get_features = virtio_net_get_features; 404017ec5a86SKONRAD Frederic vdc->set_features = virtio_net_set_features; 404117ec5a86SKONRAD Frederic vdc->bad_features = virtio_net_bad_features; 404217ec5a86SKONRAD Frederic vdc->reset = virtio_net_reset; 40437dc6be52SXuan Zhuo vdc->queue_reset = virtio_net_queue_reset; 40447f863302SKangjie Xu vdc->queue_enable = virtio_net_queue_enable; 404517ec5a86SKONRAD Frederic vdc->set_status = virtio_net_set_status; 404617ec5a86SKONRAD Frederic vdc->guest_notifier_mask = virtio_net_guest_notifier_mask; 404717ec5a86SKONRAD Frederic vdc->guest_notifier_pending = virtio_net_guest_notifier_pending; 40482a083ffdSMichael S. Tsirkin vdc->legacy_features |= (0x1 << VIRTIO_NET_F_GSO); 40497788c3f2SMikhail Sennikovsky vdc->post_load = virtio_net_post_load_virtio; 4050982b78c5SDr. David Alan Gilbert vdc->vmsd = &vmstate_virtio_net_device; 40519711cd0dSJens Freimann vdc->primary_unplug_pending = primary_unplug_pending; 4052c255488dSJonah Palmer vdc->get_vhost = virtio_net_get_vhost; 4053cd9b8346SViktor Prutyanov vdc->toggle_device_iotlb = vhost_toggle_device_iotlb; 405417ec5a86SKONRAD Frederic } 405517ec5a86SKONRAD Frederic 405617ec5a86SKONRAD Frederic static const TypeInfo virtio_net_info = { 405717ec5a86SKONRAD Frederic .name = TYPE_VIRTIO_NET, 405817ec5a86SKONRAD Frederic .parent = TYPE_VIRTIO_DEVICE, 405917ec5a86SKONRAD Frederic .instance_size = sizeof(VirtIONet), 406017ec5a86SKONRAD Frederic .instance_init = virtio_net_instance_init, 406117ec5a86SKONRAD Frederic .class_init = virtio_net_class_init, 406217ec5a86SKONRAD Frederic }; 406317ec5a86SKONRAD Frederic 406417ec5a86SKONRAD Frederic static void virtio_register_types(void) 406517ec5a86SKONRAD Frederic { 406617ec5a86SKONRAD Frederic type_register_static(&virtio_net_info); 406717ec5a86SKONRAD Frederic } 406817ec5a86SKONRAD Frederic 406917ec5a86SKONRAD Frederic type_init(virtio_register_types) 4070