xref: /openbmc/linux/drivers/net/xen-netfront.c (revision 43b5169d)
10d160211SJeremy Fitzhardinge /*
20d160211SJeremy Fitzhardinge  * Virtual network driver for conversing with remote driver backends.
30d160211SJeremy Fitzhardinge  *
40d160211SJeremy Fitzhardinge  * Copyright (c) 2002-2005, K A Fraser
50d160211SJeremy Fitzhardinge  * Copyright (c) 2005, XenSource Ltd
60d160211SJeremy Fitzhardinge  *
70d160211SJeremy Fitzhardinge  * This program is free software; you can redistribute it and/or
80d160211SJeremy Fitzhardinge  * modify it under the terms of the GNU General Public License version 2
90d160211SJeremy Fitzhardinge  * as published by the Free Software Foundation; or, when distributed
100d160211SJeremy Fitzhardinge  * separately from the Linux kernel or incorporated into other
110d160211SJeremy Fitzhardinge  * software packages, subject to the following license:
120d160211SJeremy Fitzhardinge  *
130d160211SJeremy Fitzhardinge  * Permission is hereby granted, free of charge, to any person obtaining a copy
140d160211SJeremy Fitzhardinge  * of this source file (the "Software"), to deal in the Software without
150d160211SJeremy Fitzhardinge  * restriction, including without limitation the rights to use, copy, modify,
160d160211SJeremy Fitzhardinge  * merge, publish, distribute, sublicense, and/or sell copies of the Software,
170d160211SJeremy Fitzhardinge  * and to permit persons to whom the Software is furnished to do so, subject to
180d160211SJeremy Fitzhardinge  * the following conditions:
190d160211SJeremy Fitzhardinge  *
200d160211SJeremy Fitzhardinge  * The above copyright notice and this permission notice shall be included in
210d160211SJeremy Fitzhardinge  * all copies or substantial portions of the Software.
220d160211SJeremy Fitzhardinge  *
230d160211SJeremy Fitzhardinge  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
240d160211SJeremy Fitzhardinge  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
250d160211SJeremy Fitzhardinge  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
260d160211SJeremy Fitzhardinge  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
270d160211SJeremy Fitzhardinge  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
280d160211SJeremy Fitzhardinge  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
290d160211SJeremy Fitzhardinge  * IN THE SOFTWARE.
300d160211SJeremy Fitzhardinge  */
310d160211SJeremy Fitzhardinge 
32383eda32SJoe Perches #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
33383eda32SJoe Perches 
340d160211SJeremy Fitzhardinge #include <linux/module.h>
350d160211SJeremy Fitzhardinge #include <linux/kernel.h>
360d160211SJeremy Fitzhardinge #include <linux/netdevice.h>
370d160211SJeremy Fitzhardinge #include <linux/etherdevice.h>
380d160211SJeremy Fitzhardinge #include <linux/skbuff.h>
390d160211SJeremy Fitzhardinge #include <linux/ethtool.h>
400d160211SJeremy Fitzhardinge #include <linux/if_ether.h>
419ecd1a75SWei Liu #include <net/tcp.h>
420d160211SJeremy Fitzhardinge #include <linux/udp.h>
430d160211SJeremy Fitzhardinge #include <linux/moduleparam.h>
440d160211SJeremy Fitzhardinge #include <linux/mm.h>
455a0e3ad6STejun Heo #include <linux/slab.h>
460d160211SJeremy Fitzhardinge #include <net/ip.h>
476c5aa6fcSDenis Kirjanov #include <linux/bpf.h>
486c5aa6fcSDenis Kirjanov #include <net/page_pool.h>
496c5aa6fcSDenis Kirjanov #include <linux/bpf_trace.h>
500d160211SJeremy Fitzhardinge 
511ccbf534SJeremy Fitzhardinge #include <xen/xen.h>
520d160211SJeremy Fitzhardinge #include <xen/xenbus.h>
530d160211SJeremy Fitzhardinge #include <xen/events.h>
540d160211SJeremy Fitzhardinge #include <xen/page.h>
55b9136d20SIgor Mammedov #include <xen/platform_pci.h>
560d160211SJeremy Fitzhardinge #include <xen/grant_table.h>
570d160211SJeremy Fitzhardinge 
580d160211SJeremy Fitzhardinge #include <xen/interface/io/netif.h>
590d160211SJeremy Fitzhardinge #include <xen/interface/memory.h>
600d160211SJeremy Fitzhardinge #include <xen/interface/grant_table.h>
610d160211SJeremy Fitzhardinge 
6250ee6061SAndrew J. Bennieston /* Module parameters */
63034702a6SJuergen Gross #define MAX_QUEUES_DEFAULT 8
6450ee6061SAndrew J. Bennieston static unsigned int xennet_max_queues;
6550ee6061SAndrew J. Bennieston module_param_named(max_queues, xennet_max_queues, uint, 0644);
6650ee6061SAndrew J. Bennieston MODULE_PARM_DESC(max_queues,
6750ee6061SAndrew J. Bennieston 		 "Maximum number of queues per virtual interface");
6850ee6061SAndrew J. Bennieston 
69c2c63310SAndrea Righi #define XENNET_TIMEOUT  (5 * HZ)
70c2c63310SAndrea Righi 
710fc0b732SStephen Hemminger static const struct ethtool_ops xennet_ethtool_ops;
720d160211SJeremy Fitzhardinge 
/*
 * Driver-private data overlaid on skb->cb (see NETFRONT_SKB_CB()).
 */
struct netfront_cb {
	/* NOTE(review): presumably the number of bytes to pull into the
	 * linear area on receive -- confirm against the RX path.
	 */
	int pull_to;
};
760d160211SJeremy Fitzhardinge 
/* View an skb's control buffer as the driver-private struct netfront_cb. */
#define NETFRONT_SKB_CB(skb)	((struct netfront_cb *)((skb)->cb))

/* Size of the linear area of each RX skb (NET_IP_ALIGN is added on top). */
#define RX_COPY_THRESHOLD 256

/* Value stored in the grant reference tables for "no grant". */
#define GRANT_INVALID_REF	0

/* Number of entries in a single-page TX / RX shared ring. */
#define NET_TX_RING_SIZE __CONST_RING_SIZE(xen_netif_tx, XEN_PAGE_SIZE)
#define NET_RX_RING_SIZE __CONST_RING_SIZE(xen_netif_rx, XEN_PAGE_SIZE)

/* Fewest Rx slots we want posted; one extra slot is for GSO metadata. */
#define NET_RX_SLOTS_MIN (XEN_NETIF_NR_SLOTS_MIN + 1)

/* A queue name is the interface name followed by "-qNNN". */
#define QUEUE_NAME_SIZE (IFNAMSIZ + 6)

/* An IRQ name is the queue name followed by "-tx" or "-rx". */
#define IRQ_NAME_SIZE (QUEUE_NAME_SIZE + 3)

static DECLARE_WAIT_QUEUE_HEAD(module_wq);
965b5971dfSEduardo Otubo 
97e00f85beSstephen hemminger struct netfront_stats {
98900e1833SDavid Vrabel 	u64			packets;
99900e1833SDavid Vrabel 	u64			bytes;
100e00f85beSstephen hemminger 	struct u64_stats_sync	syncp;
101e00f85beSstephen hemminger };
102e00f85beSstephen hemminger 
1032688fcb7SAndrew J. Bennieston struct netfront_info;
1042688fcb7SAndrew J. Bennieston 
1052688fcb7SAndrew J. Bennieston struct netfront_queue {
1062688fcb7SAndrew J. Bennieston 	unsigned int id; /* Queue ID, 0-based */
1072688fcb7SAndrew J. Bennieston 	char name[QUEUE_NAME_SIZE]; /* DEVNAME-qN */
1082688fcb7SAndrew J. Bennieston 	struct netfront_info *info;
1090d160211SJeremy Fitzhardinge 
1106c5aa6fcSDenis Kirjanov 	struct bpf_prog __rcu *xdp_prog;
1116c5aa6fcSDenis Kirjanov 
112bea3348eSStephen Hemminger 	struct napi_struct napi;
1130d160211SJeremy Fitzhardinge 
114d634bf2cSWei Liu 	/* Split event channels support, tx_* == rx_* when using
115d634bf2cSWei Liu 	 * single event channel.
116d634bf2cSWei Liu 	 */
117d634bf2cSWei Liu 	unsigned int tx_evtchn, rx_evtchn;
118d634bf2cSWei Liu 	unsigned int tx_irq, rx_irq;
119d634bf2cSWei Liu 	/* Only used when split event channels support is enabled */
1202688fcb7SAndrew J. Bennieston 	char tx_irq_name[IRQ_NAME_SIZE]; /* DEVNAME-qN-tx */
1212688fcb7SAndrew J. Bennieston 	char rx_irq_name[IRQ_NAME_SIZE]; /* DEVNAME-qN-rx */
1220d160211SJeremy Fitzhardinge 
1230d160211SJeremy Fitzhardinge 	spinlock_t   tx_lock;
12484284d3cSJeremy Fitzhardinge 	struct xen_netif_tx_front_ring tx;
12584284d3cSJeremy Fitzhardinge 	int tx_ring_ref;
1260d160211SJeremy Fitzhardinge 
1270d160211SJeremy Fitzhardinge 	/*
1280d160211SJeremy Fitzhardinge 	 * {tx,rx}_skbs store outstanding skbuffs. Free tx_skb entries
1290d160211SJeremy Fitzhardinge 	 * are linked from tx_skb_freelist through skb_entry.link.
1300d160211SJeremy Fitzhardinge 	 *
1310d160211SJeremy Fitzhardinge 	 *  NB. Freelist index entries are always going to be less than
1320d160211SJeremy Fitzhardinge 	 *  PAGE_OFFSET, whereas pointers to skbs will always be equal or
1330d160211SJeremy Fitzhardinge 	 *  greater than PAGE_OFFSET: we use this property to distinguish
1340d160211SJeremy Fitzhardinge 	 *  them.
1350d160211SJeremy Fitzhardinge 	 */
1360d160211SJeremy Fitzhardinge 	union skb_entry {
1370d160211SJeremy Fitzhardinge 		struct sk_buff *skb;
1381ffb40b8SIsaku Yamahata 		unsigned long link;
1390d160211SJeremy Fitzhardinge 	} tx_skbs[NET_TX_RING_SIZE];
1400d160211SJeremy Fitzhardinge 	grant_ref_t gref_tx_head;
1410d160211SJeremy Fitzhardinge 	grant_ref_t grant_tx_ref[NET_TX_RING_SIZE];
142cefe0078SAnnie Li 	struct page *grant_tx_page[NET_TX_RING_SIZE];
1430d160211SJeremy Fitzhardinge 	unsigned tx_skb_freelist;
1440d160211SJeremy Fitzhardinge 
14584284d3cSJeremy Fitzhardinge 	spinlock_t   rx_lock ____cacheline_aligned_in_smp;
14684284d3cSJeremy Fitzhardinge 	struct xen_netif_rx_front_ring rx;
14784284d3cSJeremy Fitzhardinge 	int rx_ring_ref;
14884284d3cSJeremy Fitzhardinge 
14984284d3cSJeremy Fitzhardinge 	struct timer_list rx_refill_timer;
15084284d3cSJeremy Fitzhardinge 
1510d160211SJeremy Fitzhardinge 	struct sk_buff *rx_skbs[NET_RX_RING_SIZE];
1520d160211SJeremy Fitzhardinge 	grant_ref_t gref_rx_head;
1530d160211SJeremy Fitzhardinge 	grant_ref_t grant_rx_ref[NET_RX_RING_SIZE];
1546c5aa6fcSDenis Kirjanov 
1556c5aa6fcSDenis Kirjanov 	struct page_pool *page_pool;
1566c5aa6fcSDenis Kirjanov 	struct xdp_rxq_info xdp_rxq;
1572688fcb7SAndrew J. Bennieston };
1582688fcb7SAndrew J. Bennieston 
1592688fcb7SAndrew J. Bennieston struct netfront_info {
1602688fcb7SAndrew J. Bennieston 	struct list_head list;
1612688fcb7SAndrew J. Bennieston 	struct net_device *netdev;
1622688fcb7SAndrew J. Bennieston 
1632688fcb7SAndrew J. Bennieston 	struct xenbus_device *xbdev;
1642688fcb7SAndrew J. Bennieston 
1652688fcb7SAndrew J. Bennieston 	/* Multi-queue support */
1662688fcb7SAndrew J. Bennieston 	struct netfront_queue *queues;
167e0ce4af9SIan Campbell 
168e0ce4af9SIan Campbell 	/* Statistics */
169900e1833SDavid Vrabel 	struct netfront_stats __percpu *rx_stats;
170900e1833SDavid Vrabel 	struct netfront_stats __percpu *tx_stats;
171e00f85beSstephen hemminger 
1726c5aa6fcSDenis Kirjanov 	/* XDP state */
1736c5aa6fcSDenis Kirjanov 	bool netback_has_xdp_headroom;
1746c5aa6fcSDenis Kirjanov 	bool netfront_xdp_enabled;
1756c5aa6fcSDenis Kirjanov 
1762688fcb7SAndrew J. Bennieston 	atomic_t rx_gso_checksum_fixup;
1770d160211SJeremy Fitzhardinge };
1780d160211SJeremy Fitzhardinge 
1790d160211SJeremy Fitzhardinge struct netfront_rx_info {
1800d160211SJeremy Fitzhardinge 	struct xen_netif_rx_response rx;
1810d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info extras[XEN_NETIF_EXTRA_TYPE_MAX - 1];
1820d160211SJeremy Fitzhardinge };
1830d160211SJeremy Fitzhardinge 
1841ffb40b8SIsaku Yamahata static void skb_entry_set_link(union skb_entry *list, unsigned short id)
1851ffb40b8SIsaku Yamahata {
1861ffb40b8SIsaku Yamahata 	list->link = id;
1871ffb40b8SIsaku Yamahata }
1881ffb40b8SIsaku Yamahata 
1891ffb40b8SIsaku Yamahata static int skb_entry_is_link(const union skb_entry *list)
1901ffb40b8SIsaku Yamahata {
1911ffb40b8SIsaku Yamahata 	BUILD_BUG_ON(sizeof(list->skb) != sizeof(list->link));
192807540baSEric Dumazet 	return (unsigned long)list->skb < PAGE_OFFSET;
1931ffb40b8SIsaku Yamahata }
1941ffb40b8SIsaku Yamahata 
/*
 * Helper functions for acquiring and freeing slots in tx_skbs[].
 */
1980d160211SJeremy Fitzhardinge 
1990d160211SJeremy Fitzhardinge static void add_id_to_freelist(unsigned *head, union skb_entry *list,
2000d160211SJeremy Fitzhardinge 			       unsigned short id)
2010d160211SJeremy Fitzhardinge {
2021ffb40b8SIsaku Yamahata 	skb_entry_set_link(&list[id], *head);
2030d160211SJeremy Fitzhardinge 	*head = id;
2040d160211SJeremy Fitzhardinge }
2050d160211SJeremy Fitzhardinge 
2060d160211SJeremy Fitzhardinge static unsigned short get_id_from_freelist(unsigned *head,
2070d160211SJeremy Fitzhardinge 					   union skb_entry *list)
2080d160211SJeremy Fitzhardinge {
2090d160211SJeremy Fitzhardinge 	unsigned int id = *head;
2100d160211SJeremy Fitzhardinge 	*head = list[id].link;
2110d160211SJeremy Fitzhardinge 	return id;
2120d160211SJeremy Fitzhardinge }
2130d160211SJeremy Fitzhardinge 
2140d160211SJeremy Fitzhardinge static int xennet_rxidx(RING_IDX idx)
2150d160211SJeremy Fitzhardinge {
2160d160211SJeremy Fitzhardinge 	return idx & (NET_RX_RING_SIZE - 1);
2170d160211SJeremy Fitzhardinge }
2180d160211SJeremy Fitzhardinge 
2192688fcb7SAndrew J. Bennieston static struct sk_buff *xennet_get_rx_skb(struct netfront_queue *queue,
2200d160211SJeremy Fitzhardinge 					 RING_IDX ri)
2210d160211SJeremy Fitzhardinge {
2220d160211SJeremy Fitzhardinge 	int i = xennet_rxidx(ri);
2232688fcb7SAndrew J. Bennieston 	struct sk_buff *skb = queue->rx_skbs[i];
2242688fcb7SAndrew J. Bennieston 	queue->rx_skbs[i] = NULL;
2250d160211SJeremy Fitzhardinge 	return skb;
2260d160211SJeremy Fitzhardinge }
2270d160211SJeremy Fitzhardinge 
2282688fcb7SAndrew J. Bennieston static grant_ref_t xennet_get_rx_ref(struct netfront_queue *queue,
2290d160211SJeremy Fitzhardinge 					    RING_IDX ri)
2300d160211SJeremy Fitzhardinge {
2310d160211SJeremy Fitzhardinge 	int i = xennet_rxidx(ri);
2322688fcb7SAndrew J. Bennieston 	grant_ref_t ref = queue->grant_rx_ref[i];
2332688fcb7SAndrew J. Bennieston 	queue->grant_rx_ref[i] = GRANT_INVALID_REF;
2340d160211SJeremy Fitzhardinge 	return ref;
2350d160211SJeremy Fitzhardinge }
2360d160211SJeremy Fitzhardinge 
#ifdef CONFIG_SYSFS
/* Forward declaration; only present when sysfs support is built in. */
static const struct attribute_group xennet_dev_group;
#endif
2400d160211SJeremy Fitzhardinge 
2413ad9b358SMichał Mirosław static bool xennet_can_sg(struct net_device *dev)
2420d160211SJeremy Fitzhardinge {
2433ad9b358SMichał Mirosław 	return dev->features & NETIF_F_SG;
2440d160211SJeremy Fitzhardinge }
2450d160211SJeremy Fitzhardinge 
2460d160211SJeremy Fitzhardinge 
247e99e88a9SKees Cook static void rx_refill_timeout(struct timer_list *t)
2480d160211SJeremy Fitzhardinge {
249e99e88a9SKees Cook 	struct netfront_queue *queue = from_timer(queue, t, rx_refill_timer);
2502688fcb7SAndrew J. Bennieston 	napi_schedule(&queue->napi);
2510d160211SJeremy Fitzhardinge }
2520d160211SJeremy Fitzhardinge 
2532688fcb7SAndrew J. Bennieston static int netfront_tx_slot_available(struct netfront_queue *queue)
2540d160211SJeremy Fitzhardinge {
2552688fcb7SAndrew J. Bennieston 	return (queue->tx.req_prod_pvt - queue->tx.rsp_cons) <
25657f230abSJuergen Gross 		(NET_TX_RING_SIZE - XEN_NETIF_NR_SLOTS_MIN - 1);
2570d160211SJeremy Fitzhardinge }
2580d160211SJeremy Fitzhardinge 
2592688fcb7SAndrew J. Bennieston static void xennet_maybe_wake_tx(struct netfront_queue *queue)
2600d160211SJeremy Fitzhardinge {
2612688fcb7SAndrew J. Bennieston 	struct net_device *dev = queue->info->netdev;
2622688fcb7SAndrew J. Bennieston 	struct netdev_queue *dev_queue = netdev_get_tx_queue(dev, queue->id);
2630d160211SJeremy Fitzhardinge 
2642688fcb7SAndrew J. Bennieston 	if (unlikely(netif_tx_queue_stopped(dev_queue)) &&
2652688fcb7SAndrew J. Bennieston 	    netfront_tx_slot_available(queue) &&
2660d160211SJeremy Fitzhardinge 	    likely(netif_running(dev)))
2672688fcb7SAndrew J. Bennieston 		netif_tx_wake_queue(netdev_get_tx_queue(dev, queue->id));
2680d160211SJeremy Fitzhardinge }
2690d160211SJeremy Fitzhardinge 
2701f3c2ebaSDavid Vrabel 
2711f3c2ebaSDavid Vrabel static struct sk_buff *xennet_alloc_one_rx_buffer(struct netfront_queue *queue)
2720d160211SJeremy Fitzhardinge {
2730d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
2740d160211SJeremy Fitzhardinge 	struct page *page;
2750d160211SJeremy Fitzhardinge 
2762688fcb7SAndrew J. Bennieston 	skb = __netdev_alloc_skb(queue->info->netdev,
2772688fcb7SAndrew J. Bennieston 				 RX_COPY_THRESHOLD + NET_IP_ALIGN,
2780d160211SJeremy Fitzhardinge 				 GFP_ATOMIC | __GFP_NOWARN);
2790d160211SJeremy Fitzhardinge 	if (unlikely(!skb))
2801f3c2ebaSDavid Vrabel 		return NULL;
281617a20bbSIsaku Yamahata 
2826c5aa6fcSDenis Kirjanov 	page = page_pool_dev_alloc_pages(queue->page_pool);
2836c5aa6fcSDenis Kirjanov 	if (unlikely(!page)) {
2840d160211SJeremy Fitzhardinge 		kfree_skb(skb);
2851f3c2ebaSDavid Vrabel 		return NULL;
2860d160211SJeremy Fitzhardinge 	}
287093b9c71SJan Beulich 	skb_add_rx_frag(skb, 0, page, 0, 0, PAGE_SIZE);
2880d160211SJeremy Fitzhardinge 
2891f3c2ebaSDavid Vrabel 	/* Align ip header to a 16 bytes boundary */
2901f3c2ebaSDavid Vrabel 	skb_reserve(skb, NET_IP_ALIGN);
2912688fcb7SAndrew J. Bennieston 	skb->dev = queue->info->netdev;
2920d160211SJeremy Fitzhardinge 
2931f3c2ebaSDavid Vrabel 	return skb;
2941f3c2ebaSDavid Vrabel }
2951f3c2ebaSDavid Vrabel 
2961f3c2ebaSDavid Vrabel 
2971f3c2ebaSDavid Vrabel static void xennet_alloc_rx_buffers(struct netfront_queue *queue)
2981f3c2ebaSDavid Vrabel {
2991f3c2ebaSDavid Vrabel 	RING_IDX req_prod = queue->rx.req_prod_pvt;
3001f3c2ebaSDavid Vrabel 	int notify;
301538d9291SVineeth Remanan Pillai 	int err = 0;
3021f3c2ebaSDavid Vrabel 
3031f3c2ebaSDavid Vrabel 	if (unlikely(!netif_carrier_ok(queue->info->netdev)))
3041f3c2ebaSDavid Vrabel 		return;
3051f3c2ebaSDavid Vrabel 
3061f3c2ebaSDavid Vrabel 	for (req_prod = queue->rx.req_prod_pvt;
3071f3c2ebaSDavid Vrabel 	     req_prod - queue->rx.rsp_cons < NET_RX_RING_SIZE;
3081f3c2ebaSDavid Vrabel 	     req_prod++) {
3091f3c2ebaSDavid Vrabel 		struct sk_buff *skb;
3101f3c2ebaSDavid Vrabel 		unsigned short id;
3111f3c2ebaSDavid Vrabel 		grant_ref_t ref;
31230c5d7f0SJulien Grall 		struct page *page;
3131f3c2ebaSDavid Vrabel 		struct xen_netif_rx_request *req;
3141f3c2ebaSDavid Vrabel 
3151f3c2ebaSDavid Vrabel 		skb = xennet_alloc_one_rx_buffer(queue);
316538d9291SVineeth Remanan Pillai 		if (!skb) {
317538d9291SVineeth Remanan Pillai 			err = -ENOMEM;
3181f3c2ebaSDavid Vrabel 			break;
319538d9291SVineeth Remanan Pillai 		}
3201f3c2ebaSDavid Vrabel 
3211f3c2ebaSDavid Vrabel 		id = xennet_rxidx(req_prod);
3220d160211SJeremy Fitzhardinge 
3232688fcb7SAndrew J. Bennieston 		BUG_ON(queue->rx_skbs[id]);
3242688fcb7SAndrew J. Bennieston 		queue->rx_skbs[id] = skb;
3250d160211SJeremy Fitzhardinge 
3262688fcb7SAndrew J. Bennieston 		ref = gnttab_claim_grant_reference(&queue->gref_rx_head);
327269ebce4SDongli Zhang 		WARN_ON_ONCE(IS_ERR_VALUE((unsigned long)(int)ref));
3282688fcb7SAndrew J. Bennieston 		queue->grant_rx_ref[id] = ref;
3290d160211SJeremy Fitzhardinge 
33030c5d7f0SJulien Grall 		page = skb_frag_page(&skb_shinfo(skb)->frags[0]);
3310d160211SJeremy Fitzhardinge 
3321f3c2ebaSDavid Vrabel 		req = RING_GET_REQUEST(&queue->rx, req_prod);
33330c5d7f0SJulien Grall 		gnttab_page_grant_foreign_access_ref_one(ref,
3342688fcb7SAndrew J. Bennieston 							 queue->info->xbdev->otherend_id,
33530c5d7f0SJulien Grall 							 page,
3360d160211SJeremy Fitzhardinge 							 0);
3370d160211SJeremy Fitzhardinge 		req->id = id;
3380d160211SJeremy Fitzhardinge 		req->gref = ref;
3390d160211SJeremy Fitzhardinge 	}
3400d160211SJeremy Fitzhardinge 
3411f3c2ebaSDavid Vrabel 	queue->rx.req_prod_pvt = req_prod;
3421f3c2ebaSDavid Vrabel 
343538d9291SVineeth Remanan Pillai 	/* Try again later if there are not enough requests or skb allocation
344538d9291SVineeth Remanan Pillai 	 * failed.
345538d9291SVineeth Remanan Pillai 	 * Enough requests is quantified as the sum of newly created slots and
346538d9291SVineeth Remanan Pillai 	 * the unconsumed slots at the backend.
347538d9291SVineeth Remanan Pillai 	 */
348538d9291SVineeth Remanan Pillai 	if (req_prod - queue->rx.rsp_cons < NET_RX_SLOTS_MIN ||
349538d9291SVineeth Remanan Pillai 	    unlikely(err)) {
3501f3c2ebaSDavid Vrabel 		mod_timer(&queue->rx_refill_timer, jiffies + (HZ/10));
3511f3c2ebaSDavid Vrabel 		return;
3521f3c2ebaSDavid Vrabel 	}
3531f3c2ebaSDavid Vrabel 
3542688fcb7SAndrew J. Bennieston 	RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&queue->rx, notify);
3550d160211SJeremy Fitzhardinge 	if (notify)
3562688fcb7SAndrew J. Bennieston 		notify_remote_via_irq(queue->rx_irq);
3570d160211SJeremy Fitzhardinge }
3580d160211SJeremy Fitzhardinge 
3590d160211SJeremy Fitzhardinge static int xennet_open(struct net_device *dev)
3600d160211SJeremy Fitzhardinge {
3610d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
3622688fcb7SAndrew J. Bennieston 	unsigned int num_queues = dev->real_num_tx_queues;
3632688fcb7SAndrew J. Bennieston 	unsigned int i = 0;
3642688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = NULL;
3650d160211SJeremy Fitzhardinge 
366f599c64fSRoss Lagerwall 	if (!np->queues)
367f599c64fSRoss Lagerwall 		return -ENODEV;
368f599c64fSRoss Lagerwall 
3692688fcb7SAndrew J. Bennieston 	for (i = 0; i < num_queues; ++i) {
3702688fcb7SAndrew J. Bennieston 		queue = &np->queues[i];
3712688fcb7SAndrew J. Bennieston 		napi_enable(&queue->napi);
372bea3348eSStephen Hemminger 
3732688fcb7SAndrew J. Bennieston 		spin_lock_bh(&queue->rx_lock);
3740d160211SJeremy Fitzhardinge 		if (netif_carrier_ok(dev)) {
3752688fcb7SAndrew J. Bennieston 			xennet_alloc_rx_buffers(queue);
3762688fcb7SAndrew J. Bennieston 			queue->rx.sring->rsp_event = queue->rx.rsp_cons + 1;
3772688fcb7SAndrew J. Bennieston 			if (RING_HAS_UNCONSUMED_RESPONSES(&queue->rx))
3782688fcb7SAndrew J. Bennieston 				napi_schedule(&queue->napi);
3790d160211SJeremy Fitzhardinge 		}
3802688fcb7SAndrew J. Bennieston 		spin_unlock_bh(&queue->rx_lock);
3812688fcb7SAndrew J. Bennieston 	}
3820d160211SJeremy Fitzhardinge 
3832688fcb7SAndrew J. Bennieston 	netif_tx_start_all_queues(dev);
3840d160211SJeremy Fitzhardinge 
3850d160211SJeremy Fitzhardinge 	return 0;
3860d160211SJeremy Fitzhardinge }
3870d160211SJeremy Fitzhardinge 
3882688fcb7SAndrew J. Bennieston static void xennet_tx_buf_gc(struct netfront_queue *queue)
3890d160211SJeremy Fitzhardinge {
3900d160211SJeremy Fitzhardinge 	RING_IDX cons, prod;
3910d160211SJeremy Fitzhardinge 	unsigned short id;
3920d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
3937d0105b5SMalcolm Crossley 	bool more_to_do;
3940d160211SJeremy Fitzhardinge 
3952688fcb7SAndrew J. Bennieston 	BUG_ON(!netif_carrier_ok(queue->info->netdev));
3960d160211SJeremy Fitzhardinge 
3970d160211SJeremy Fitzhardinge 	do {
3982688fcb7SAndrew J. Bennieston 		prod = queue->tx.sring->rsp_prod;
3990d160211SJeremy Fitzhardinge 		rmb(); /* Ensure we see responses up to 'rp'. */
4000d160211SJeremy Fitzhardinge 
4012688fcb7SAndrew J. Bennieston 		for (cons = queue->tx.rsp_cons; cons != prod; cons++) {
4020d160211SJeremy Fitzhardinge 			struct xen_netif_tx_response *txrsp;
4030d160211SJeremy Fitzhardinge 
4042688fcb7SAndrew J. Bennieston 			txrsp = RING_GET_RESPONSE(&queue->tx, cons);
405f942dc25SIan Campbell 			if (txrsp->status == XEN_NETIF_RSP_NULL)
4060d160211SJeremy Fitzhardinge 				continue;
4070d160211SJeremy Fitzhardinge 
4080d160211SJeremy Fitzhardinge 			id  = txrsp->id;
4092688fcb7SAndrew J. Bennieston 			skb = queue->tx_skbs[id].skb;
4100d160211SJeremy Fitzhardinge 			if (unlikely(gnttab_query_foreign_access(
4112688fcb7SAndrew J. Bennieston 				queue->grant_tx_ref[id]) != 0)) {
412383eda32SJoe Perches 				pr_alert("%s: warning -- grant still in use by backend domain\n",
413383eda32SJoe Perches 					 __func__);
4140d160211SJeremy Fitzhardinge 				BUG();
4150d160211SJeremy Fitzhardinge 			}
4160d160211SJeremy Fitzhardinge 			gnttab_end_foreign_access_ref(
4172688fcb7SAndrew J. Bennieston 				queue->grant_tx_ref[id], GNTMAP_readonly);
4180d160211SJeremy Fitzhardinge 			gnttab_release_grant_reference(
4192688fcb7SAndrew J. Bennieston 				&queue->gref_tx_head, queue->grant_tx_ref[id]);
4202688fcb7SAndrew J. Bennieston 			queue->grant_tx_ref[id] = GRANT_INVALID_REF;
4212688fcb7SAndrew J. Bennieston 			queue->grant_tx_page[id] = NULL;
4222688fcb7SAndrew J. Bennieston 			add_id_to_freelist(&queue->tx_skb_freelist, queue->tx_skbs, id);
4230d160211SJeremy Fitzhardinge 			dev_kfree_skb_irq(skb);
4240d160211SJeremy Fitzhardinge 		}
4250d160211SJeremy Fitzhardinge 
4262688fcb7SAndrew J. Bennieston 		queue->tx.rsp_cons = prod;
4270d160211SJeremy Fitzhardinge 
4287d0105b5SMalcolm Crossley 		RING_FINAL_CHECK_FOR_RESPONSES(&queue->tx, more_to_do);
4297d0105b5SMalcolm Crossley 	} while (more_to_do);
4300d160211SJeremy Fitzhardinge 
4312688fcb7SAndrew J. Bennieston 	xennet_maybe_wake_tx(queue);
4320d160211SJeremy Fitzhardinge }
4330d160211SJeremy Fitzhardinge 
/*
 * Context handed to the per-grant callbacks xennet_tx_setup_grant()
 * and xennet_make_one_txreq() while TX requests are being built.
 */
struct xennet_gnttab_make_txreq {
	struct netfront_queue *queue;	/* queue the requests go to */
	struct sk_buff *skb;		/* skb recorded for each slot */
	struct page *page;		/* page recorded for each slot */
	struct xen_netif_tx_request *tx; /* Last request */
	unsigned int size;		/* bytes covered so far */
};
44130c5d7f0SJulien Grall 
44230c5d7f0SJulien Grall static void xennet_tx_setup_grant(unsigned long gfn, unsigned int offset,
44330c5d7f0SJulien Grall 				  unsigned int len, void *data)
4440d160211SJeremy Fitzhardinge {
44530c5d7f0SJulien Grall 	struct xennet_gnttab_make_txreq *info = data;
4460d160211SJeremy Fitzhardinge 	unsigned int id;
447a55e8bb8SDavid Vrabel 	struct xen_netif_tx_request *tx;
4480d160211SJeremy Fitzhardinge 	grant_ref_t ref;
44930c5d7f0SJulien Grall 	/* convenient aliases */
45030c5d7f0SJulien Grall 	struct page *page = info->page;
45130c5d7f0SJulien Grall 	struct netfront_queue *queue = info->queue;
45230c5d7f0SJulien Grall 	struct sk_buff *skb = info->skb;
4530d160211SJeremy Fitzhardinge 
4542688fcb7SAndrew J. Bennieston 	id = get_id_from_freelist(&queue->tx_skb_freelist, queue->tx_skbs);
455a55e8bb8SDavid Vrabel 	tx = RING_GET_REQUEST(&queue->tx, queue->tx.req_prod_pvt++);
4562688fcb7SAndrew J. Bennieston 	ref = gnttab_claim_grant_reference(&queue->gref_tx_head);
457269ebce4SDongli Zhang 	WARN_ON_ONCE(IS_ERR_VALUE((unsigned long)(int)ref));
4580d160211SJeremy Fitzhardinge 
45930c5d7f0SJulien Grall 	gnttab_grant_foreign_access_ref(ref, queue->info->xbdev->otherend_id,
46030c5d7f0SJulien Grall 					gfn, GNTMAP_readonly);
4610d160211SJeremy Fitzhardinge 
462a55e8bb8SDavid Vrabel 	queue->tx_skbs[id].skb = skb;
463a55e8bb8SDavid Vrabel 	queue->grant_tx_page[id] = page;
464a55e8bb8SDavid Vrabel 	queue->grant_tx_ref[id] = ref;
465a55e8bb8SDavid Vrabel 
466a55e8bb8SDavid Vrabel 	tx->id = id;
467a55e8bb8SDavid Vrabel 	tx->gref = ref;
4680d160211SJeremy Fitzhardinge 	tx->offset = offset;
4690d160211SJeremy Fitzhardinge 	tx->size = len;
4700d160211SJeremy Fitzhardinge 	tx->flags = 0;
471a55e8bb8SDavid Vrabel 
47230c5d7f0SJulien Grall 	info->tx = tx;
47330c5d7f0SJulien Grall 	info->size += tx->size;
47430c5d7f0SJulien Grall }
47530c5d7f0SJulien Grall 
47630c5d7f0SJulien Grall static struct xen_netif_tx_request *xennet_make_first_txreq(
47730c5d7f0SJulien Grall 	struct netfront_queue *queue, struct sk_buff *skb,
47830c5d7f0SJulien Grall 	struct page *page, unsigned int offset, unsigned int len)
47930c5d7f0SJulien Grall {
48030c5d7f0SJulien Grall 	struct xennet_gnttab_make_txreq info = {
48130c5d7f0SJulien Grall 		.queue = queue,
48230c5d7f0SJulien Grall 		.skb = skb,
48330c5d7f0SJulien Grall 		.page = page,
48430c5d7f0SJulien Grall 		.size = 0,
48530c5d7f0SJulien Grall 	};
48630c5d7f0SJulien Grall 
48730c5d7f0SJulien Grall 	gnttab_for_one_grant(page, offset, len, xennet_tx_setup_grant, &info);
48830c5d7f0SJulien Grall 
48930c5d7f0SJulien Grall 	return info.tx;
49030c5d7f0SJulien Grall }
49130c5d7f0SJulien Grall 
49230c5d7f0SJulien Grall static void xennet_make_one_txreq(unsigned long gfn, unsigned int offset,
49330c5d7f0SJulien Grall 				  unsigned int len, void *data)
49430c5d7f0SJulien Grall {
49530c5d7f0SJulien Grall 	struct xennet_gnttab_make_txreq *info = data;
49630c5d7f0SJulien Grall 
49730c5d7f0SJulien Grall 	info->tx->flags |= XEN_NETTXF_more_data;
49830c5d7f0SJulien Grall 	skb_get(info->skb);
49930c5d7f0SJulien Grall 	xennet_tx_setup_grant(gfn, offset, len, data);
5000d160211SJeremy Fitzhardinge }
5010d160211SJeremy Fitzhardinge 
502a55e8bb8SDavid Vrabel static struct xen_netif_tx_request *xennet_make_txreqs(
503a55e8bb8SDavid Vrabel 	struct netfront_queue *queue, struct xen_netif_tx_request *tx,
504a55e8bb8SDavid Vrabel 	struct sk_buff *skb, struct page *page,
505a55e8bb8SDavid Vrabel 	unsigned int offset, unsigned int len)
506a55e8bb8SDavid Vrabel {
50730c5d7f0SJulien Grall 	struct xennet_gnttab_make_txreq info = {
50830c5d7f0SJulien Grall 		.queue = queue,
50930c5d7f0SJulien Grall 		.skb = skb,
51030c5d7f0SJulien Grall 		.tx = tx,
51130c5d7f0SJulien Grall 	};
51230c5d7f0SJulien Grall 
513f36c3747SIan Campbell 	/* Skip unused frames from start of page */
514f36c3747SIan Campbell 	page += offset >> PAGE_SHIFT;
515f36c3747SIan Campbell 	offset &= ~PAGE_MASK;
516f36c3747SIan Campbell 
517a55e8bb8SDavid Vrabel 	while (len) {
51830c5d7f0SJulien Grall 		info.page = page;
51930c5d7f0SJulien Grall 		info.size = 0;
52030c5d7f0SJulien Grall 
52130c5d7f0SJulien Grall 		gnttab_foreach_grant_in_range(page, offset, len,
52230c5d7f0SJulien Grall 					      xennet_make_one_txreq,
52330c5d7f0SJulien Grall 					      &info);
52430c5d7f0SJulien Grall 
525f36c3747SIan Campbell 		page++;
526f36c3747SIan Campbell 		offset = 0;
52730c5d7f0SJulien Grall 		len -= info.size;
5280d160211SJeremy Fitzhardinge 	}
5290d160211SJeremy Fitzhardinge 
53030c5d7f0SJulien Grall 	return info.tx;
5310d160211SJeremy Fitzhardinge }
5320d160211SJeremy Fitzhardinge 
533f36c3747SIan Campbell /*
534e84448d5SDavid Vrabel  * Count how many ring slots are required to send this skb. Each frag
535e84448d5SDavid Vrabel  * might be a compound page.
536f36c3747SIan Campbell  */
537e84448d5SDavid Vrabel static int xennet_count_skb_slots(struct sk_buff *skb)
538f36c3747SIan Campbell {
539f36c3747SIan Campbell 	int i, frags = skb_shinfo(skb)->nr_frags;
54030c5d7f0SJulien Grall 	int slots;
541e84448d5SDavid Vrabel 
54230c5d7f0SJulien Grall 	slots = gnttab_count_grant(offset_in_page(skb->data),
54330c5d7f0SJulien Grall 				   skb_headlen(skb));
544f36c3747SIan Campbell 
545f36c3747SIan Campbell 	for (i = 0; i < frags; i++) {
546f36c3747SIan Campbell 		skb_frag_t *frag = skb_shinfo(skb)->frags + i;
547f36c3747SIan Campbell 		unsigned long size = skb_frag_size(frag);
548b54c9d5bSJonathan Lemon 		unsigned long offset = skb_frag_off(frag);
549f36c3747SIan Campbell 
550f36c3747SIan Campbell 		/* Skip unused frames from start of page */
551f36c3747SIan Campbell 		offset &= ~PAGE_MASK;
552f36c3747SIan Campbell 
55330c5d7f0SJulien Grall 		slots += gnttab_count_grant(offset, size);
554f36c3747SIan Campbell 	}
555f36c3747SIan Campbell 
55630c5d7f0SJulien Grall 	return slots;
557f36c3747SIan Campbell }
558f36c3747SIan Campbell 
55950ee6061SAndrew J. Bennieston static u16 xennet_select_queue(struct net_device *dev, struct sk_buff *skb,
560a350ecceSPaolo Abeni 			       struct net_device *sb_dev)
5612688fcb7SAndrew J. Bennieston {
56250ee6061SAndrew J. Bennieston 	unsigned int num_queues = dev->real_num_tx_queues;
56350ee6061SAndrew J. Bennieston 	u32 hash;
56450ee6061SAndrew J. Bennieston 	u16 queue_idx;
56550ee6061SAndrew J. Bennieston 
56650ee6061SAndrew J. Bennieston 	/* First, check if there is only one queue */
56750ee6061SAndrew J. Bennieston 	if (num_queues == 1) {
56850ee6061SAndrew J. Bennieston 		queue_idx = 0;
56950ee6061SAndrew J. Bennieston 	} else {
57050ee6061SAndrew J. Bennieston 		hash = skb_get_hash(skb);
57150ee6061SAndrew J. Bennieston 		queue_idx = hash % num_queues;
57250ee6061SAndrew J. Bennieston 	}
57350ee6061SAndrew J. Bennieston 
57450ee6061SAndrew J. Bennieston 	return queue_idx;
5752688fcb7SAndrew J. Bennieston }
5762688fcb7SAndrew J. Bennieston 
5776c5aa6fcSDenis Kirjanov static int xennet_xdp_xmit_one(struct net_device *dev,
5786c5aa6fcSDenis Kirjanov 			       struct netfront_queue *queue,
5796c5aa6fcSDenis Kirjanov 			       struct xdp_frame *xdpf)
5806c5aa6fcSDenis Kirjanov {
5816c5aa6fcSDenis Kirjanov 	struct netfront_info *np = netdev_priv(dev);
5826c5aa6fcSDenis Kirjanov 	struct netfront_stats *tx_stats = this_cpu_ptr(np->tx_stats);
5836c5aa6fcSDenis Kirjanov 	int notify;
5846c5aa6fcSDenis Kirjanov 
5856c5aa6fcSDenis Kirjanov 	xennet_make_first_txreq(queue, NULL,
5866c5aa6fcSDenis Kirjanov 				virt_to_page(xdpf->data),
5876c5aa6fcSDenis Kirjanov 				offset_in_page(xdpf->data),
5886c5aa6fcSDenis Kirjanov 				xdpf->len);
5896c5aa6fcSDenis Kirjanov 
5906c5aa6fcSDenis Kirjanov 	RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&queue->tx, notify);
5916c5aa6fcSDenis Kirjanov 	if (notify)
5926c5aa6fcSDenis Kirjanov 		notify_remote_via_irq(queue->tx_irq);
5936c5aa6fcSDenis Kirjanov 
5946c5aa6fcSDenis Kirjanov 	u64_stats_update_begin(&tx_stats->syncp);
5956c5aa6fcSDenis Kirjanov 	tx_stats->bytes += xdpf->len;
5966c5aa6fcSDenis Kirjanov 	tx_stats->packets++;
5976c5aa6fcSDenis Kirjanov 	u64_stats_update_end(&tx_stats->syncp);
5986c5aa6fcSDenis Kirjanov 
5996c5aa6fcSDenis Kirjanov 	xennet_tx_buf_gc(queue);
6006c5aa6fcSDenis Kirjanov 
6016c5aa6fcSDenis Kirjanov 	return 0;
6026c5aa6fcSDenis Kirjanov }
6036c5aa6fcSDenis Kirjanov 
6046c5aa6fcSDenis Kirjanov static int xennet_xdp_xmit(struct net_device *dev, int n,
6056c5aa6fcSDenis Kirjanov 			   struct xdp_frame **frames, u32 flags)
6066c5aa6fcSDenis Kirjanov {
6076c5aa6fcSDenis Kirjanov 	unsigned int num_queues = dev->real_num_tx_queues;
6086c5aa6fcSDenis Kirjanov 	struct netfront_info *np = netdev_priv(dev);
6096c5aa6fcSDenis Kirjanov 	struct netfront_queue *queue = NULL;
6106c5aa6fcSDenis Kirjanov 	unsigned long irq_flags;
6116c5aa6fcSDenis Kirjanov 	int drops = 0;
6126c5aa6fcSDenis Kirjanov 	int i, err;
6136c5aa6fcSDenis Kirjanov 
6146c5aa6fcSDenis Kirjanov 	if (unlikely(flags & ~XDP_XMIT_FLAGS_MASK))
6156c5aa6fcSDenis Kirjanov 		return -EINVAL;
6166c5aa6fcSDenis Kirjanov 
6176c5aa6fcSDenis Kirjanov 	queue = &np->queues[smp_processor_id() % num_queues];
6186c5aa6fcSDenis Kirjanov 
6196c5aa6fcSDenis Kirjanov 	spin_lock_irqsave(&queue->tx_lock, irq_flags);
6206c5aa6fcSDenis Kirjanov 	for (i = 0; i < n; i++) {
6216c5aa6fcSDenis Kirjanov 		struct xdp_frame *xdpf = frames[i];
6226c5aa6fcSDenis Kirjanov 
6236c5aa6fcSDenis Kirjanov 		if (!xdpf)
6246c5aa6fcSDenis Kirjanov 			continue;
6256c5aa6fcSDenis Kirjanov 		err = xennet_xdp_xmit_one(dev, queue, xdpf);
6266c5aa6fcSDenis Kirjanov 		if (err) {
6276c5aa6fcSDenis Kirjanov 			xdp_return_frame_rx_napi(xdpf);
6286c5aa6fcSDenis Kirjanov 			drops++;
6296c5aa6fcSDenis Kirjanov 		}
6306c5aa6fcSDenis Kirjanov 	}
6316c5aa6fcSDenis Kirjanov 	spin_unlock_irqrestore(&queue->tx_lock, irq_flags);
6326c5aa6fcSDenis Kirjanov 
6336c5aa6fcSDenis Kirjanov 	return n - drops;
6346c5aa6fcSDenis Kirjanov }
6356c5aa6fcSDenis Kirjanov 
6366c5aa6fcSDenis Kirjanov 
/*
 * Number of XEN_PAGE_SIZE-sized pieces in 64 KiB (65536 bytes), plus one.
 * xennet_start_xmit() linearizes an skb that needs more than
 * MAX_XEN_SKB_FRAGS + 1 ring slots.
 */
#define MAX_XEN_SKB_FRAGS (65536 / XEN_PAGE_SIZE + 1)
63830c5d7f0SJulien Grall 
/*
 * Transmit @skb on the TX ring of the queue recorded in its queue mapping.
 *
 * The skb is turned into one TX request for the start of the linear
 * area, an optional GSO extra-info slot, further requests for the rest
 * of the linear area and requests for every page fragment. The requests
 * are then pushed to the backend, which is notified when the ring macro
 * asks for it.
 *
 * The skb is dropped (dev->stats.tx_dropped is incremented and the skb
 * freed) when no queue is set up, when skb->len exceeds
 * XEN_NETIF_MAX_TX_SIZE, when linearizing or copying the skb fails, when
 * the carrier is down, when more than one slot is needed but
 * xennet_can_sg() is false, or when the skb still needs GSO.
 *
 * Returns NETDEV_TX_OK in every case, including drops.
 */
static netdev_tx_t xennet_start_xmit(struct sk_buff *skb, struct net_device *dev)
{
	struct netfront_info *np = netdev_priv(dev);
	struct netfront_stats *tx_stats = this_cpu_ptr(np->tx_stats);
	struct xen_netif_tx_request *tx, *first_tx;
	unsigned int i;
	int notify;
	int slots;
	struct page *page;
	unsigned int offset;
	unsigned int len;
	unsigned long flags;
	struct netfront_queue *queue = NULL;
	unsigned int num_queues = dev->real_num_tx_queues;
	u16 queue_index;
	struct sk_buff *nskb;

	/* Drop the packet if no queues are set up */
	if (num_queues < 1)
		goto drop;
	/* Determine which queue to transmit this SKB on */
	queue_index = skb_get_queue_mapping(skb);
	queue = &np->queues[queue_index];

	/* If skb->len is too big for wire format, drop skb and alert
	 * user about misconfiguration.
	 */
	if (unlikely(skb->len > XEN_NETIF_MAX_TX_SIZE)) {
		net_alert_ratelimited(
			"xennet: skb->len = %u, too big for wire format\n",
			skb->len);
		goto drop;
	}

	/* Too many slots needed: try to shrink the skb by linearizing it. */
	slots = xennet_count_skb_slots(skb);
	if (unlikely(slots > MAX_XEN_SKB_FRAGS + 1)) {
		net_dbg_ratelimited("xennet: skb rides the rocket: %d slots, %d bytes\n",
				    slots, skb->len);
		if (skb_linearize(skb))
			goto drop;
	}

	page = virt_to_page(skb->data);
	offset = offset_in_page(skb->data);

	/* The first req should be at least ETH_HLEN size or the packet will be
	 * dropped by netback.
	 */
	if (unlikely(PAGE_SIZE - offset < ETH_HLEN)) {
		/* Work on a copy and release the original skb. */
		nskb = skb_copy(skb, GFP_ATOMIC);
		if (!nskb)
			goto drop;
		dev_consume_skb_any(skb);
		skb = nskb;
		page = virt_to_page(skb->data);
		offset = offset_in_page(skb->data);
	}

	len = skb_headlen(skb);

	spin_lock_irqsave(&queue->tx_lock, flags);

	/* These checks are made with the queue's tx_lock held. */
	if (unlikely(!netif_carrier_ok(dev) ||
		     (slots > 1 && !xennet_can_sg(dev)) ||
		     netif_needs_gso(skb, netif_skb_features(skb)))) {
		spin_unlock_irqrestore(&queue->tx_lock, flags);
		goto drop;
	}

	/* First request for the linear area. */
	first_tx = tx = xennet_make_first_txreq(queue, skb,
						page, offset, len);
	/* Step past the part of the linear area the first request covers. */
	offset += tx->size;
	if (offset == PAGE_SIZE) {
		page++;
		offset = 0;
	}
	len -= tx->size;

	if (skb->ip_summed == CHECKSUM_PARTIAL)
		/* local packet? */
		tx->flags |= XEN_NETTXF_csum_blank | XEN_NETTXF_data_validated;
	else if (skb->ip_summed == CHECKSUM_UNNECESSARY)
		/* remote but checksummed. */
		tx->flags |= XEN_NETTXF_data_validated;

	/* Optional extra info after the first request. */
	if (skb_shinfo(skb)->gso_size) {
		struct xen_netif_extra_info *gso;

		/* The extra info takes the next ring slot. */
		gso = (struct xen_netif_extra_info *)
			RING_GET_REQUEST(&queue->tx, queue->tx.req_prod_pvt++);

		tx->flags |= XEN_NETTXF_extra_info;

		gso->u.gso.size = skb_shinfo(skb)->gso_size;
		gso->u.gso.type = (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV6) ?
			XEN_NETIF_GSO_TYPE_TCPV6 :
			XEN_NETIF_GSO_TYPE_TCPV4;
		gso->u.gso.pad = 0;
		gso->u.gso.features = 0;

		gso->type = XEN_NETIF_EXTRA_TYPE_GSO;
		gso->flags = 0;
	}

	/* Requests for the rest of the linear area. */
	tx = xennet_make_txreqs(queue, tx, skb, page, offset, len);

	/* Requests for all the frags. */
	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
		skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
		tx = xennet_make_txreqs(queue, tx, skb, skb_frag_page(frag),
					skb_frag_off(frag),
					skb_frag_size(frag));
	}

	/* First request has the packet length. */
	first_tx->size = skb->len;

	/* timestamp packet in software */
	skb_tx_timestamp(skb);

	RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&queue->tx, notify);
	if (notify)
		notify_remote_via_irq(queue->tx_irq);

	/* Account the packet before the garbage collection call below. */
	u64_stats_update_begin(&tx_stats->syncp);
	tx_stats->bytes += skb->len;
	tx_stats->packets++;
	u64_stats_update_end(&tx_stats->syncp);

	/* Note: It is not safe to access skb after xennet_tx_buf_gc()! */
	xennet_tx_buf_gc(queue);

	/* Stop this TX queue when no slot is available for another packet. */
	if (!netfront_tx_slot_available(queue))
		netif_tx_stop_queue(netdev_get_tx_queue(dev, queue->id));

	spin_unlock_irqrestore(&queue->tx_lock, flags);

	return NETDEV_TX_OK;

 drop:
	/* Count the drop and free the skb; NETDEV_TX_OK is still returned. */
	dev->stats.tx_dropped++;
	dev_kfree_skb_any(skb);
	return NETDEV_TX_OK;
}
7860d160211SJeremy Fitzhardinge 
7870d160211SJeremy Fitzhardinge static int xennet_close(struct net_device *dev)
7880d160211SJeremy Fitzhardinge {
7890d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
7902688fcb7SAndrew J. Bennieston 	unsigned int num_queues = dev->real_num_tx_queues;
7912688fcb7SAndrew J. Bennieston 	unsigned int i;
7922688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue;
7932688fcb7SAndrew J. Bennieston 	netif_tx_stop_all_queues(np->netdev);
7942688fcb7SAndrew J. Bennieston 	for (i = 0; i < num_queues; ++i) {
7952688fcb7SAndrew J. Bennieston 		queue = &np->queues[i];
7962688fcb7SAndrew J. Bennieston 		napi_disable(&queue->napi);
7972688fcb7SAndrew J. Bennieston 	}
7980d160211SJeremy Fitzhardinge 	return 0;
7990d160211SJeremy Fitzhardinge }
8000d160211SJeremy Fitzhardinge 
8012688fcb7SAndrew J. Bennieston static void xennet_move_rx_slot(struct netfront_queue *queue, struct sk_buff *skb,
8020d160211SJeremy Fitzhardinge 				grant_ref_t ref)
8030d160211SJeremy Fitzhardinge {
8042688fcb7SAndrew J. Bennieston 	int new = xennet_rxidx(queue->rx.req_prod_pvt);
8050d160211SJeremy Fitzhardinge 
8062688fcb7SAndrew J. Bennieston 	BUG_ON(queue->rx_skbs[new]);
8072688fcb7SAndrew J. Bennieston 	queue->rx_skbs[new] = skb;
8082688fcb7SAndrew J. Bennieston 	queue->grant_rx_ref[new] = ref;
8092688fcb7SAndrew J. Bennieston 	RING_GET_REQUEST(&queue->rx, queue->rx.req_prod_pvt)->id = new;
8102688fcb7SAndrew J. Bennieston 	RING_GET_REQUEST(&queue->rx, queue->rx.req_prod_pvt)->gref = ref;
8112688fcb7SAndrew J. Bennieston 	queue->rx.req_prod_pvt++;
8120d160211SJeremy Fitzhardinge }
8130d160211SJeremy Fitzhardinge 
8142688fcb7SAndrew J. Bennieston static int xennet_get_extras(struct netfront_queue *queue,
8150d160211SJeremy Fitzhardinge 			     struct xen_netif_extra_info *extras,
8160d160211SJeremy Fitzhardinge 			     RING_IDX rp)
8170d160211SJeremy Fitzhardinge 
8180d160211SJeremy Fitzhardinge {
8190d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info *extra;
8202688fcb7SAndrew J. Bennieston 	struct device *dev = &queue->info->netdev->dev;
8212688fcb7SAndrew J. Bennieston 	RING_IDX cons = queue->rx.rsp_cons;
8220d160211SJeremy Fitzhardinge 	int err = 0;
8230d160211SJeremy Fitzhardinge 
8240d160211SJeremy Fitzhardinge 	do {
8250d160211SJeremy Fitzhardinge 		struct sk_buff *skb;
8260d160211SJeremy Fitzhardinge 		grant_ref_t ref;
8270d160211SJeremy Fitzhardinge 
8280d160211SJeremy Fitzhardinge 		if (unlikely(cons + 1 == rp)) {
8290d160211SJeremy Fitzhardinge 			if (net_ratelimit())
8300d160211SJeremy Fitzhardinge 				dev_warn(dev, "Missing extra info\n");
8310d160211SJeremy Fitzhardinge 			err = -EBADR;
8320d160211SJeremy Fitzhardinge 			break;
8330d160211SJeremy Fitzhardinge 		}
8340d160211SJeremy Fitzhardinge 
8350d160211SJeremy Fitzhardinge 		extra = (struct xen_netif_extra_info *)
8362688fcb7SAndrew J. Bennieston 			RING_GET_RESPONSE(&queue->rx, ++cons);
8370d160211SJeremy Fitzhardinge 
8380d160211SJeremy Fitzhardinge 		if (unlikely(!extra->type ||
8390d160211SJeremy Fitzhardinge 			     extra->type >= XEN_NETIF_EXTRA_TYPE_MAX)) {
8400d160211SJeremy Fitzhardinge 			if (net_ratelimit())
8410d160211SJeremy Fitzhardinge 				dev_warn(dev, "Invalid extra type: %d\n",
8420d160211SJeremy Fitzhardinge 					extra->type);
8430d160211SJeremy Fitzhardinge 			err = -EINVAL;
8440d160211SJeremy Fitzhardinge 		} else {
8450d160211SJeremy Fitzhardinge 			memcpy(&extras[extra->type - 1], extra,
8460d160211SJeremy Fitzhardinge 			       sizeof(*extra));
8470d160211SJeremy Fitzhardinge 		}
8480d160211SJeremy Fitzhardinge 
8492688fcb7SAndrew J. Bennieston 		skb = xennet_get_rx_skb(queue, cons);
8502688fcb7SAndrew J. Bennieston 		ref = xennet_get_rx_ref(queue, cons);
8512688fcb7SAndrew J. Bennieston 		xennet_move_rx_slot(queue, skb, ref);
8520d160211SJeremy Fitzhardinge 	} while (extra->flags & XEN_NETIF_EXTRA_FLAG_MORE);
8530d160211SJeremy Fitzhardinge 
8542688fcb7SAndrew J. Bennieston 	queue->rx.rsp_cons = cons;
8550d160211SJeremy Fitzhardinge 	return err;
8560d160211SJeremy Fitzhardinge }
8570d160211SJeremy Fitzhardinge 
8586c5aa6fcSDenis Kirjanov static u32 xennet_run_xdp(struct netfront_queue *queue, struct page *pdata,
8596c5aa6fcSDenis Kirjanov 		   struct xen_netif_rx_response *rx, struct bpf_prog *prog,
8606c5aa6fcSDenis Kirjanov 		   struct xdp_buff *xdp, bool *need_xdp_flush)
8616c5aa6fcSDenis Kirjanov {
8626c5aa6fcSDenis Kirjanov 	struct xdp_frame *xdpf;
8636c5aa6fcSDenis Kirjanov 	u32 len = rx->status;
864e44f65fdSColin Ian King 	u32 act;
8656c5aa6fcSDenis Kirjanov 	int err;
8666c5aa6fcSDenis Kirjanov 
867*43b5169dSLorenzo Bianconi 	xdp_init_buff(xdp, XEN_PAGE_SIZE - XDP_PACKET_HEADROOM,
868*43b5169dSLorenzo Bianconi 		      &queue->xdp_rxq);
8696c5aa6fcSDenis Kirjanov 	xdp->data_hard_start = page_address(pdata);
8706c5aa6fcSDenis Kirjanov 	xdp->data = xdp->data_hard_start + XDP_PACKET_HEADROOM;
8716c5aa6fcSDenis Kirjanov 	xdp_set_data_meta_invalid(xdp);
8726c5aa6fcSDenis Kirjanov 	xdp->data_end = xdp->data + len;
8736c5aa6fcSDenis Kirjanov 
8746c5aa6fcSDenis Kirjanov 	act = bpf_prog_run_xdp(prog, xdp);
8756c5aa6fcSDenis Kirjanov 	switch (act) {
8766c5aa6fcSDenis Kirjanov 	case XDP_TX:
8776c5aa6fcSDenis Kirjanov 		get_page(pdata);
8786c5aa6fcSDenis Kirjanov 		xdpf = xdp_convert_buff_to_frame(xdp);
8796c5aa6fcSDenis Kirjanov 		err = xennet_xdp_xmit(queue->info->netdev, 1, &xdpf, 0);
8806c5aa6fcSDenis Kirjanov 		if (unlikely(err < 0))
8816c5aa6fcSDenis Kirjanov 			trace_xdp_exception(queue->info->netdev, prog, act);
8826c5aa6fcSDenis Kirjanov 		break;
8836c5aa6fcSDenis Kirjanov 	case XDP_REDIRECT:
8846c5aa6fcSDenis Kirjanov 		get_page(pdata);
8856c5aa6fcSDenis Kirjanov 		err = xdp_do_redirect(queue->info->netdev, xdp, prog);
8866c5aa6fcSDenis Kirjanov 		*need_xdp_flush = true;
8876c5aa6fcSDenis Kirjanov 		if (unlikely(err))
8886c5aa6fcSDenis Kirjanov 			trace_xdp_exception(queue->info->netdev, prog, act);
8896c5aa6fcSDenis Kirjanov 		break;
8906c5aa6fcSDenis Kirjanov 	case XDP_PASS:
8916c5aa6fcSDenis Kirjanov 	case XDP_DROP:
8926c5aa6fcSDenis Kirjanov 		break;
8936c5aa6fcSDenis Kirjanov 
8946c5aa6fcSDenis Kirjanov 	case XDP_ABORTED:
8956c5aa6fcSDenis Kirjanov 		trace_xdp_exception(queue->info->netdev, prog, act);
8966c5aa6fcSDenis Kirjanov 		break;
8976c5aa6fcSDenis Kirjanov 
8986c5aa6fcSDenis Kirjanov 	default:
8996c5aa6fcSDenis Kirjanov 		bpf_warn_invalid_xdp_action(act);
9006c5aa6fcSDenis Kirjanov 	}
9016c5aa6fcSDenis Kirjanov 
9026c5aa6fcSDenis Kirjanov 	return act;
9036c5aa6fcSDenis Kirjanov }
9046c5aa6fcSDenis Kirjanov 
/*
 * Gather all RX responses that make up one packet, starting at
 * queue->rx.rsp_cons.
 *
 * @queue:          RX queue being processed
 * @rinfo:          holds the first response (rinfo->rx) and receives any
 *                  extra-info slots (rinfo->extras)
 * @rp:             response producer index; slots at or beyond it are
 *                  not read
 * @list:           the skb behind every slot visited is appended here
 * @need_xdp_flush: passed through to xennet_run_xdp()
 *
 * Returns 0 on success or a negative errno. On error queue->rx.rsp_cons
 * is advanced past all slots that were looked at.
 */
static int xennet_get_responses(struct netfront_queue *queue,
				struct netfront_rx_info *rinfo, RING_IDX rp,
				struct sk_buff_head *list,
				bool *need_xdp_flush)
{
	struct xen_netif_rx_response *rx = &rinfo->rx;
	/* One extra slot is allowed when the first response is small. */
	int max = XEN_NETIF_NR_SLOTS_MIN + (rx->status <= RX_COPY_THRESHOLD);
	RING_IDX cons = queue->rx.rsp_cons;
	struct sk_buff *skb = xennet_get_rx_skb(queue, cons);
	struct xen_netif_extra_info *extras = rinfo->extras;
	grant_ref_t ref = xennet_get_rx_ref(queue, cons);
	struct device *dev = &queue->info->netdev->dev;
	struct bpf_prog *xdp_prog;
	struct xdp_buff xdp;
	unsigned long ret;
	int slots = 1;
	int err = 0;
	u32 verdict;

	if (rx->flags & XEN_NETRXF_extra_info) {
		err = xennet_get_extras(queue, extras, rp);
		if (!err) {
			/* An XDP extra overrides the offset of the first response. */
			if (extras[XEN_NETIF_EXTRA_TYPE_XDP - 1].type) {
				struct xen_netif_extra_info *xdp;

				xdp = &extras[XEN_NETIF_EXTRA_TYPE_XDP - 1];
				rx->offset = xdp->u.xdp.headroom;
			}
		}
		/* xennet_get_extras() moved the consumer past the extras. */
		cons = queue->rx.rsp_cons;
	}

	for (;;) {
		/* Negative status, or data that would not fit in one Xen page. */
		if (unlikely(rx->status < 0 ||
			     rx->offset + rx->status > XEN_PAGE_SIZE)) {
			if (net_ratelimit())
				dev_warn(dev, "rx->offset: %u, size: %d\n",
					 rx->offset, rx->status);
			xennet_move_rx_slot(queue, skb, ref);
			err = -EINVAL;
			goto next;
		}

		/*
		 * This definitely indicates a bug, either in this driver or in
		 * the backend driver. In future this should flag the bad
		 * situation to the system controller to reboot the backend.
		 */
		if (ref == GRANT_INVALID_REF) {
			if (net_ratelimit())
				dev_warn(dev, "Bad rx response id %d.\n",
					 rx->id);
			err = -EINVAL;
			goto next;
		}

		/* Ending foreign access to the buffer must succeed. */
		ret = gnttab_end_foreign_access_ref(ref, 0);
		BUG_ON(!ret);

		gnttab_release_grant_reference(&queue->gref_rx_head, ref);

		rcu_read_lock();
		xdp_prog = rcu_dereference(queue->xdp_prog);
		if (xdp_prog) {
			if (!(rx->flags & XEN_NETRXF_more_data)) {
				/* currently only a single page contains data */
				verdict = xennet_run_xdp(queue,
							 skb_frag_page(&skb_shinfo(skb)->frags[0]),
							 rx, xdp_prog, &xdp, need_xdp_flush);
				/* Any verdict other than XDP_PASS is reported as an error. */
				if (verdict != XDP_PASS)
					err = -EINVAL;
			} else {
				/* drop the frame */
				err = -EINVAL;
			}
		}
		rcu_read_unlock();
next:
		/* The skb is queued on both the success and the error paths. */
		__skb_queue_tail(list, skb);
		if (!(rx->flags & XEN_NETRXF_more_data))
			break;

		/* More data is announced but the ring holds no further response. */
		if (cons + slots == rp) {
			if (net_ratelimit())
				dev_warn(dev, "Need more slots\n");
			err = -ENOENT;
			break;
		}

		/* Move on to the next response of this packet. */
		rx = RING_GET_RESPONSE(&queue->rx, cons + slots);
		skb = xennet_get_rx_skb(queue, cons + slots);
		ref = xennet_get_rx_ref(queue, cons + slots);
		slots++;
	}

	if (unlikely(slots > max)) {
		if (net_ratelimit())
			dev_warn(dev, "Too many slots\n");
		err = -E2BIG;
	}

	/* On error, skip every slot that was examined. */
	if (unlikely(err))
		queue->rx.rsp_cons = cons + slots;

	return err;
}
10110d160211SJeremy Fitzhardinge 
10120d160211SJeremy Fitzhardinge static int xennet_set_skb_gso(struct sk_buff *skb,
10130d160211SJeremy Fitzhardinge 			      struct xen_netif_extra_info *gso)
10140d160211SJeremy Fitzhardinge {
10150d160211SJeremy Fitzhardinge 	if (!gso->u.gso.size) {
10160d160211SJeremy Fitzhardinge 		if (net_ratelimit())
1017383eda32SJoe Perches 			pr_warn("GSO size must not be zero\n");
10180d160211SJeremy Fitzhardinge 		return -EINVAL;
10190d160211SJeremy Fitzhardinge 	}
10200d160211SJeremy Fitzhardinge 
10212c0057deSPaul Durrant 	if (gso->u.gso.type != XEN_NETIF_GSO_TYPE_TCPV4 &&
10222c0057deSPaul Durrant 	    gso->u.gso.type != XEN_NETIF_GSO_TYPE_TCPV6) {
10230d160211SJeremy Fitzhardinge 		if (net_ratelimit())
1024383eda32SJoe Perches 			pr_warn("Bad GSO type %d\n", gso->u.gso.type);
10250d160211SJeremy Fitzhardinge 		return -EINVAL;
10260d160211SJeremy Fitzhardinge 	}
10270d160211SJeremy Fitzhardinge 
10280d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_size = gso->u.gso.size;
10292c0057deSPaul Durrant 	skb_shinfo(skb)->gso_type =
10302c0057deSPaul Durrant 		(gso->u.gso.type == XEN_NETIF_GSO_TYPE_TCPV4) ?
10312c0057deSPaul Durrant 		SKB_GSO_TCPV4 :
10322c0057deSPaul Durrant 		SKB_GSO_TCPV6;
10330d160211SJeremy Fitzhardinge 
10340d160211SJeremy Fitzhardinge 	/* Header must be checked, and gso_segs computed. */
10350d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
10360d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_segs = 0;
10370d160211SJeremy Fitzhardinge 
10380d160211SJeremy Fitzhardinge 	return 0;
10390d160211SJeremy Fitzhardinge }
10400d160211SJeremy Fitzhardinge 
/*
 * Attach the pages of the skbs queued on @list to @skb as additional
 * page fragments.
 *
 * Each queued skb is paired with the next RX response after
 * queue->rx.rsp_cons; that response supplies the offset and length of
 * the new fragment.
 *
 * Returns 0 on success with queue->rx.rsp_cons moved past all consumed
 * responses, or -ENOENT when @skb has no fragment slot left; in that
 * case rsp_cons is also moved past the responses belonging to the skbs
 * still on @list.
 */
static int xennet_fill_frags(struct netfront_queue *queue,
			     struct sk_buff *skb,
			     struct sk_buff_head *list)
{
	RING_IDX cons = queue->rx.rsp_cons;
	struct sk_buff *nskb;

	while ((nskb = __skb_dequeue(list))) {
		struct xen_netif_rx_response *rx =
			RING_GET_RESPONSE(&queue->rx, ++cons);
		skb_frag_t *nfrag = &skb_shinfo(nskb)->frags[0];

		/*
		 * Fragment array full: pull data up to pull_to into the
		 * linear area, presumably so that a fragment slot becomes
		 * free again.
		 */
		if (skb_shinfo(skb)->nr_frags == MAX_SKB_FRAGS) {
			unsigned int pull_to = NETFRONT_SKB_CB(skb)->pull_to;

			BUG_ON(pull_to < skb_headlen(skb));
			__pskb_pull_tail(skb, pull_to - skb_headlen(skb));
		}
		/* Still full: give up and skip the responses not yet consumed. */
		if (unlikely(skb_shinfo(skb)->nr_frags >= MAX_SKB_FRAGS)) {
			queue->rx.rsp_cons = ++cons + skb_queue_len(list);
			kfree_skb(nskb);
			return -ENOENT;
		}

		skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags,
				skb_frag_page(nfrag),
				rx->offset, rx->status, PAGE_SIZE);

		/*
		 * The page now belongs to skb. Clear nskb's fragment count
		 * before freeing it, presumably so that the free does not
		 * release that page as well.
		 */
		skb_shinfo(nskb)->nr_frags = 0;
		kfree_skb(nskb);
	}

	queue->rx.rsp_cons = cons;

	return 0;
}
10770d160211SJeremy Fitzhardinge 
1078e0ce4af9SIan Campbell static int checksum_setup(struct net_device *dev, struct sk_buff *skb)
10790d160211SJeremy Fitzhardinge {
1080b5cf66cdSPaul Durrant 	bool recalculate_partial_csum = false;
1081e0ce4af9SIan Campbell 
1082e0ce4af9SIan Campbell 	/*
1083e0ce4af9SIan Campbell 	 * A GSO SKB must be CHECKSUM_PARTIAL. However some buggy
1084e0ce4af9SIan Campbell 	 * peers can fail to set NETRXF_csum_blank when sending a GSO
1085e0ce4af9SIan Campbell 	 * frame. In this case force the SKB to CHECKSUM_PARTIAL and
1086e0ce4af9SIan Campbell 	 * recalculate the partial checksum.
1087e0ce4af9SIan Campbell 	 */
1088e0ce4af9SIan Campbell 	if (skb->ip_summed != CHECKSUM_PARTIAL && skb_is_gso(skb)) {
1089e0ce4af9SIan Campbell 		struct netfront_info *np = netdev_priv(dev);
10902688fcb7SAndrew J. Bennieston 		atomic_inc(&np->rx_gso_checksum_fixup);
1091e0ce4af9SIan Campbell 		skb->ip_summed = CHECKSUM_PARTIAL;
1092b5cf66cdSPaul Durrant 		recalculate_partial_csum = true;
1093e0ce4af9SIan Campbell 	}
1094e0ce4af9SIan Campbell 
1095e0ce4af9SIan Campbell 	/* A non-CHECKSUM_PARTIAL SKB does not require setup. */
1096e0ce4af9SIan Campbell 	if (skb->ip_summed != CHECKSUM_PARTIAL)
1097e0ce4af9SIan Campbell 		return 0;
10980d160211SJeremy Fitzhardinge 
1099b5cf66cdSPaul Durrant 	return skb_checksum_setup(skb, recalculate_partial_csum);
11000d160211SJeremy Fitzhardinge }
11010d160211SJeremy Fitzhardinge 
11022688fcb7SAndrew J. Bennieston static int handle_incoming_queue(struct netfront_queue *queue,
11030d160211SJeremy Fitzhardinge 				 struct sk_buff_head *rxq)
11040d160211SJeremy Fitzhardinge {
1105900e1833SDavid Vrabel 	struct netfront_stats *rx_stats = this_cpu_ptr(queue->info->rx_stats);
11060d160211SJeremy Fitzhardinge 	int packets_dropped = 0;
11070d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
11080d160211SJeremy Fitzhardinge 
11090d160211SJeremy Fitzhardinge 	while ((skb = __skb_dequeue(rxq)) != NULL) {
11103683243bSIan Campbell 		int pull_to = NETFRONT_SKB_CB(skb)->pull_to;
11110d160211SJeremy Fitzhardinge 
1112093b9c71SJan Beulich 		if (pull_to > skb_headlen(skb))
11133683243bSIan Campbell 			__pskb_pull_tail(skb, pull_to - skb_headlen(skb));
11140d160211SJeremy Fitzhardinge 
11150d160211SJeremy Fitzhardinge 		/* Ethernet work: Delayed to here as it peeks the header. */
11162688fcb7SAndrew J. Bennieston 		skb->protocol = eth_type_trans(skb, queue->info->netdev);
1117d554f73dSWei Liu 		skb_reset_network_header(skb);
11180d160211SJeremy Fitzhardinge 
11192688fcb7SAndrew J. Bennieston 		if (checksum_setup(queue->info->netdev, skb)) {
11200d160211SJeremy Fitzhardinge 			kfree_skb(skb);
11210d160211SJeremy Fitzhardinge 			packets_dropped++;
11222688fcb7SAndrew J. Bennieston 			queue->info->netdev->stats.rx_errors++;
11230d160211SJeremy Fitzhardinge 			continue;
11240d160211SJeremy Fitzhardinge 		}
11250d160211SJeremy Fitzhardinge 
1126900e1833SDavid Vrabel 		u64_stats_update_begin(&rx_stats->syncp);
1127900e1833SDavid Vrabel 		rx_stats->packets++;
1128900e1833SDavid Vrabel 		rx_stats->bytes += skb->len;
1129900e1833SDavid Vrabel 		u64_stats_update_end(&rx_stats->syncp);
11300d160211SJeremy Fitzhardinge 
11310d160211SJeremy Fitzhardinge 		/* Pass it up. */
11322688fcb7SAndrew J. Bennieston 		napi_gro_receive(&queue->napi, skb);
11330d160211SJeremy Fitzhardinge 	}
11340d160211SJeremy Fitzhardinge 
11350d160211SJeremy Fitzhardinge 	return packets_dropped;
11360d160211SJeremy Fitzhardinge }
11370d160211SJeremy Fitzhardinge 
1138bea3348eSStephen Hemminger static int xennet_poll(struct napi_struct *napi, int budget)
11390d160211SJeremy Fitzhardinge {
11402688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = container_of(napi, struct netfront_queue, napi);
11412688fcb7SAndrew J. Bennieston 	struct net_device *dev = queue->info->netdev;
11420d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
11430d160211SJeremy Fitzhardinge 	struct netfront_rx_info rinfo;
11440d160211SJeremy Fitzhardinge 	struct xen_netif_rx_response *rx = &rinfo.rx;
11450d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info *extras = rinfo.extras;
11460d160211SJeremy Fitzhardinge 	RING_IDX i, rp;
1147bea3348eSStephen Hemminger 	int work_done;
11480d160211SJeremy Fitzhardinge 	struct sk_buff_head rxq;
11490d160211SJeremy Fitzhardinge 	struct sk_buff_head errq;
11500d160211SJeremy Fitzhardinge 	struct sk_buff_head tmpq;
11510d160211SJeremy Fitzhardinge 	int err;
11526c5aa6fcSDenis Kirjanov 	bool need_xdp_flush = false;
11530d160211SJeremy Fitzhardinge 
11542688fcb7SAndrew J. Bennieston 	spin_lock(&queue->rx_lock);
11550d160211SJeremy Fitzhardinge 
11560d160211SJeremy Fitzhardinge 	skb_queue_head_init(&rxq);
11570d160211SJeremy Fitzhardinge 	skb_queue_head_init(&errq);
11580d160211SJeremy Fitzhardinge 	skb_queue_head_init(&tmpq);
11590d160211SJeremy Fitzhardinge 
11602688fcb7SAndrew J. Bennieston 	rp = queue->rx.sring->rsp_prod;
11610d160211SJeremy Fitzhardinge 	rmb(); /* Ensure we see queued responses up to 'rp'. */
11620d160211SJeremy Fitzhardinge 
11632688fcb7SAndrew J. Bennieston 	i = queue->rx.rsp_cons;
11640d160211SJeremy Fitzhardinge 	work_done = 0;
11650d160211SJeremy Fitzhardinge 	while ((i != rp) && (work_done < budget)) {
11662688fcb7SAndrew J. Bennieston 		memcpy(rx, RING_GET_RESPONSE(&queue->rx, i), sizeof(*rx));
11670d160211SJeremy Fitzhardinge 		memset(extras, 0, sizeof(rinfo.extras));
11680d160211SJeremy Fitzhardinge 
11696c5aa6fcSDenis Kirjanov 		err = xennet_get_responses(queue, &rinfo, rp, &tmpq,
11706c5aa6fcSDenis Kirjanov 					   &need_xdp_flush);
11710d160211SJeremy Fitzhardinge 
11720d160211SJeremy Fitzhardinge 		if (unlikely(err)) {
11730d160211SJeremy Fitzhardinge err:
11740d160211SJeremy Fitzhardinge 			while ((skb = __skb_dequeue(&tmpq)))
11750d160211SJeremy Fitzhardinge 				__skb_queue_tail(&errq, skb);
117609f75cd7SJeff Garzik 			dev->stats.rx_errors++;
11772688fcb7SAndrew J. Bennieston 			i = queue->rx.rsp_cons;
11780d160211SJeremy Fitzhardinge 			continue;
11790d160211SJeremy Fitzhardinge 		}
11800d160211SJeremy Fitzhardinge 
11810d160211SJeremy Fitzhardinge 		skb = __skb_dequeue(&tmpq);
11820d160211SJeremy Fitzhardinge 
11830d160211SJeremy Fitzhardinge 		if (extras[XEN_NETIF_EXTRA_TYPE_GSO - 1].type) {
11840d160211SJeremy Fitzhardinge 			struct xen_netif_extra_info *gso;
11850d160211SJeremy Fitzhardinge 			gso = &extras[XEN_NETIF_EXTRA_TYPE_GSO - 1];
11860d160211SJeremy Fitzhardinge 
11870d160211SJeremy Fitzhardinge 			if (unlikely(xennet_set_skb_gso(skb, gso))) {
11880d160211SJeremy Fitzhardinge 				__skb_queue_head(&tmpq, skb);
11892688fcb7SAndrew J. Bennieston 				queue->rx.rsp_cons += skb_queue_len(&tmpq);
11900d160211SJeremy Fitzhardinge 				goto err;
11910d160211SJeremy Fitzhardinge 			}
11920d160211SJeremy Fitzhardinge 		}
11930d160211SJeremy Fitzhardinge 
11943683243bSIan Campbell 		NETFRONT_SKB_CB(skb)->pull_to = rx->status;
11953683243bSIan Campbell 		if (NETFRONT_SKB_CB(skb)->pull_to > RX_COPY_THRESHOLD)
11963683243bSIan Campbell 			NETFRONT_SKB_CB(skb)->pull_to = RX_COPY_THRESHOLD;
11970d160211SJeremy Fitzhardinge 
1198b54c9d5bSJonathan Lemon 		skb_frag_off_set(&skb_shinfo(skb)->frags[0], rx->offset);
11993683243bSIan Campbell 		skb_frag_size_set(&skb_shinfo(skb)->frags[0], rx->status);
12003683243bSIan Campbell 		skb->data_len = rx->status;
1201093b9c71SJan Beulich 		skb->len += rx->status;
12020d160211SJeremy Fitzhardinge 
1203a761129eSDongli Zhang 		if (unlikely(xennet_fill_frags(queue, skb, &tmpq)))
1204ad4f15dcSJuergen Gross 			goto err;
12050d160211SJeremy Fitzhardinge 
1206f942dc25SIan Campbell 		if (rx->flags & XEN_NETRXF_csum_blank)
12070d160211SJeremy Fitzhardinge 			skb->ip_summed = CHECKSUM_PARTIAL;
1208f942dc25SIan Campbell 		else if (rx->flags & XEN_NETRXF_data_validated)
12090d160211SJeremy Fitzhardinge 			skb->ip_summed = CHECKSUM_UNNECESSARY;
12100d160211SJeremy Fitzhardinge 
12110d160211SJeremy Fitzhardinge 		__skb_queue_tail(&rxq, skb);
12120d160211SJeremy Fitzhardinge 
1213a761129eSDongli Zhang 		i = ++queue->rx.rsp_cons;
12140d160211SJeremy Fitzhardinge 		work_done++;
12150d160211SJeremy Fitzhardinge 	}
12166c5aa6fcSDenis Kirjanov 	if (need_xdp_flush)
12176c5aa6fcSDenis Kirjanov 		xdp_do_flush();
12180d160211SJeremy Fitzhardinge 
121956cfe5d0SWang Chen 	__skb_queue_purge(&errq);
12200d160211SJeremy Fitzhardinge 
12212688fcb7SAndrew J. Bennieston 	work_done -= handle_incoming_queue(queue, &rxq);
12220d160211SJeremy Fitzhardinge 
12232688fcb7SAndrew J. Bennieston 	xennet_alloc_rx_buffers(queue);
12240d160211SJeremy Fitzhardinge 
12250d160211SJeremy Fitzhardinge 	if (work_done < budget) {
1226bea3348eSStephen Hemminger 		int more_to_do = 0;
1227bea3348eSStephen Hemminger 
12286ad20165SEric Dumazet 		napi_complete_done(napi, work_done);
12290d160211SJeremy Fitzhardinge 
12302688fcb7SAndrew J. Bennieston 		RING_FINAL_CHECK_FOR_RESPONSES(&queue->rx, more_to_do);
12316a6dc08fSDavid Vrabel 		if (more_to_do)
12326a6dc08fSDavid Vrabel 			napi_schedule(napi);
12330d160211SJeremy Fitzhardinge 	}
12340d160211SJeremy Fitzhardinge 
12352688fcb7SAndrew J. Bennieston 	spin_unlock(&queue->rx_lock);
12360d160211SJeremy Fitzhardinge 
1237bea3348eSStephen Hemminger 	return work_done;
12380d160211SJeremy Fitzhardinge }
12390d160211SJeremy Fitzhardinge 
12400d160211SJeremy Fitzhardinge static int xennet_change_mtu(struct net_device *dev, int mtu)
12410d160211SJeremy Fitzhardinge {
12420c36820eSJonathan Davies 	int max = xennet_can_sg(dev) ? XEN_NETIF_MAX_TX_SIZE : ETH_DATA_LEN;
12430d160211SJeremy Fitzhardinge 
12440d160211SJeremy Fitzhardinge 	if (mtu > max)
12450d160211SJeremy Fitzhardinge 		return -EINVAL;
12460d160211SJeremy Fitzhardinge 	dev->mtu = mtu;
12470d160211SJeremy Fitzhardinge 	return 0;
12480d160211SJeremy Fitzhardinge }
12490d160211SJeremy Fitzhardinge 
1250bc1f4470Sstephen hemminger static void xennet_get_stats64(struct net_device *dev,
1251e00f85beSstephen hemminger 			       struct rtnl_link_stats64 *tot)
1252e00f85beSstephen hemminger {
1253e00f85beSstephen hemminger 	struct netfront_info *np = netdev_priv(dev);
1254e00f85beSstephen hemminger 	int cpu;
1255e00f85beSstephen hemminger 
1256e00f85beSstephen hemminger 	for_each_possible_cpu(cpu) {
1257900e1833SDavid Vrabel 		struct netfront_stats *rx_stats = per_cpu_ptr(np->rx_stats, cpu);
1258900e1833SDavid Vrabel 		struct netfront_stats *tx_stats = per_cpu_ptr(np->tx_stats, cpu);
1259e00f85beSstephen hemminger 		u64 rx_packets, rx_bytes, tx_packets, tx_bytes;
1260e00f85beSstephen hemminger 		unsigned int start;
1261e00f85beSstephen hemminger 
1262e00f85beSstephen hemminger 		do {
1263900e1833SDavid Vrabel 			start = u64_stats_fetch_begin_irq(&tx_stats->syncp);
1264900e1833SDavid Vrabel 			tx_packets = tx_stats->packets;
1265900e1833SDavid Vrabel 			tx_bytes = tx_stats->bytes;
1266900e1833SDavid Vrabel 		} while (u64_stats_fetch_retry_irq(&tx_stats->syncp, start));
1267e00f85beSstephen hemminger 
1268900e1833SDavid Vrabel 		do {
1269900e1833SDavid Vrabel 			start = u64_stats_fetch_begin_irq(&rx_stats->syncp);
1270900e1833SDavid Vrabel 			rx_packets = rx_stats->packets;
1271900e1833SDavid Vrabel 			rx_bytes = rx_stats->bytes;
1272900e1833SDavid Vrabel 		} while (u64_stats_fetch_retry_irq(&rx_stats->syncp, start));
1273e00f85beSstephen hemminger 
1274e00f85beSstephen hemminger 		tot->rx_packets += rx_packets;
1275e00f85beSstephen hemminger 		tot->tx_packets += tx_packets;
1276e00f85beSstephen hemminger 		tot->rx_bytes   += rx_bytes;
1277e00f85beSstephen hemminger 		tot->tx_bytes   += tx_bytes;
1278e00f85beSstephen hemminger 	}
1279e00f85beSstephen hemminger 
1280e00f85beSstephen hemminger 	tot->rx_errors  = dev->stats.rx_errors;
1281e00f85beSstephen hemminger 	tot->tx_dropped = dev->stats.tx_dropped;
1282e00f85beSstephen hemminger }
1283e00f85beSstephen hemminger 
12842688fcb7SAndrew J. Bennieston static void xennet_release_tx_bufs(struct netfront_queue *queue)
12850d160211SJeremy Fitzhardinge {
12860d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
12870d160211SJeremy Fitzhardinge 	int i;
12880d160211SJeremy Fitzhardinge 
12890d160211SJeremy Fitzhardinge 	for (i = 0; i < NET_TX_RING_SIZE; i++) {
12900d160211SJeremy Fitzhardinge 		/* Skip over entries which are actually freelist references */
12912688fcb7SAndrew J. Bennieston 		if (skb_entry_is_link(&queue->tx_skbs[i]))
12920d160211SJeremy Fitzhardinge 			continue;
12930d160211SJeremy Fitzhardinge 
12942688fcb7SAndrew J. Bennieston 		skb = queue->tx_skbs[i].skb;
12952688fcb7SAndrew J. Bennieston 		get_page(queue->grant_tx_page[i]);
12962688fcb7SAndrew J. Bennieston 		gnttab_end_foreign_access(queue->grant_tx_ref[i],
1297cefe0078SAnnie Li 					  GNTMAP_readonly,
12982688fcb7SAndrew J. Bennieston 					  (unsigned long)page_address(queue->grant_tx_page[i]));
12992688fcb7SAndrew J. Bennieston 		queue->grant_tx_page[i] = NULL;
13002688fcb7SAndrew J. Bennieston 		queue->grant_tx_ref[i] = GRANT_INVALID_REF;
13012688fcb7SAndrew J. Bennieston 		add_id_to_freelist(&queue->tx_skb_freelist, queue->tx_skbs, i);
13020d160211SJeremy Fitzhardinge 		dev_kfree_skb_irq(skb);
13030d160211SJeremy Fitzhardinge 	}
13040d160211SJeremy Fitzhardinge }
13050d160211SJeremy Fitzhardinge 
13062688fcb7SAndrew J. Bennieston static void xennet_release_rx_bufs(struct netfront_queue *queue)
13070d160211SJeremy Fitzhardinge {
13080d160211SJeremy Fitzhardinge 	int id, ref;
13090d160211SJeremy Fitzhardinge 
13102688fcb7SAndrew J. Bennieston 	spin_lock_bh(&queue->rx_lock);
13110d160211SJeremy Fitzhardinge 
13120d160211SJeremy Fitzhardinge 	for (id = 0; id < NET_RX_RING_SIZE; id++) {
1313cefe0078SAnnie Li 		struct sk_buff *skb;
1314cefe0078SAnnie Li 		struct page *page;
13150d160211SJeremy Fitzhardinge 
13162688fcb7SAndrew J. Bennieston 		skb = queue->rx_skbs[id];
1317cefe0078SAnnie Li 		if (!skb)
1318cefe0078SAnnie Li 			continue;
1319cefe0078SAnnie Li 
13202688fcb7SAndrew J. Bennieston 		ref = queue->grant_rx_ref[id];
1321cefe0078SAnnie Li 		if (ref == GRANT_INVALID_REF)
1322cefe0078SAnnie Li 			continue;
1323cefe0078SAnnie Li 
1324cefe0078SAnnie Li 		page = skb_frag_page(&skb_shinfo(skb)->frags[0]);
1325cefe0078SAnnie Li 
1326cefe0078SAnnie Li 		/* gnttab_end_foreign_access() needs a page ref until
1327cefe0078SAnnie Li 		 * foreign access is ended (which may be deferred).
1328cefe0078SAnnie Li 		 */
1329cefe0078SAnnie Li 		get_page(page);
1330cefe0078SAnnie Li 		gnttab_end_foreign_access(ref, 0,
1331cefe0078SAnnie Li 					  (unsigned long)page_address(page));
13322688fcb7SAndrew J. Bennieston 		queue->grant_rx_ref[id] = GRANT_INVALID_REF;
13330d160211SJeremy Fitzhardinge 
1334cefe0078SAnnie Li 		kfree_skb(skb);
13350d160211SJeremy Fitzhardinge 	}
13360d160211SJeremy Fitzhardinge 
13372688fcb7SAndrew J. Bennieston 	spin_unlock_bh(&queue->rx_lock);
13380d160211SJeremy Fitzhardinge }
13390d160211SJeremy Fitzhardinge 
1340c8f44affSMichał Mirosław static netdev_features_t xennet_fix_features(struct net_device *dev,
1341c8f44affSMichał Mirosław 	netdev_features_t features)
13428f7b01a1SEric Dumazet {
13438f7b01a1SEric Dumazet 	struct netfront_info *np = netdev_priv(dev);
13448f7b01a1SEric Dumazet 
13452890ea5cSJuergen Gross 	if (features & NETIF_F_SG &&
13462890ea5cSJuergen Gross 	    !xenbus_read_unsigned(np->xbdev->otherend, "feature-sg", 0))
13478f7b01a1SEric Dumazet 		features &= ~NETIF_F_SG;
13488f7b01a1SEric Dumazet 
13492890ea5cSJuergen Gross 	if (features & NETIF_F_IPV6_CSUM &&
13502890ea5cSJuergen Gross 	    !xenbus_read_unsigned(np->xbdev->otherend,
13512890ea5cSJuergen Gross 				  "feature-ipv6-csum-offload", 0))
13522c0057deSPaul Durrant 		features &= ~NETIF_F_IPV6_CSUM;
13532c0057deSPaul Durrant 
13542890ea5cSJuergen Gross 	if (features & NETIF_F_TSO &&
13552890ea5cSJuergen Gross 	    !xenbus_read_unsigned(np->xbdev->otherend, "feature-gso-tcpv4", 0))
13568f7b01a1SEric Dumazet 		features &= ~NETIF_F_TSO;
13578f7b01a1SEric Dumazet 
13582890ea5cSJuergen Gross 	if (features & NETIF_F_TSO6 &&
13592890ea5cSJuergen Gross 	    !xenbus_read_unsigned(np->xbdev->otherend, "feature-gso-tcpv6", 0))
13602c0057deSPaul Durrant 		features &= ~NETIF_F_TSO6;
13612c0057deSPaul Durrant 
13628f7b01a1SEric Dumazet 	return features;
13638f7b01a1SEric Dumazet }
13648f7b01a1SEric Dumazet 
1365c8f44affSMichał Mirosław static int xennet_set_features(struct net_device *dev,
1366c8f44affSMichał Mirosław 	netdev_features_t features)
13678f7b01a1SEric Dumazet {
13688f7b01a1SEric Dumazet 	if (!(features & NETIF_F_SG) && dev->mtu > ETH_DATA_LEN) {
13698f7b01a1SEric Dumazet 		netdev_info(dev, "Reducing MTU because no SG offload");
13708f7b01a1SEric Dumazet 		dev->mtu = ETH_DATA_LEN;
13718f7b01a1SEric Dumazet 	}
13728f7b01a1SEric Dumazet 
13738f7b01a1SEric Dumazet 	return 0;
13748f7b01a1SEric Dumazet }
13758f7b01a1SEric Dumazet 
1376d634bf2cSWei Liu static irqreturn_t xennet_tx_interrupt(int irq, void *dev_id)
1377cf66f9d4SKonrad Rzeszutek Wilk {
13782688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = dev_id;
1379cf66f9d4SKonrad Rzeszutek Wilk 	unsigned long flags;
1380cf66f9d4SKonrad Rzeszutek Wilk 
13812688fcb7SAndrew J. Bennieston 	spin_lock_irqsave(&queue->tx_lock, flags);
13822688fcb7SAndrew J. Bennieston 	xennet_tx_buf_gc(queue);
13832688fcb7SAndrew J. Bennieston 	spin_unlock_irqrestore(&queue->tx_lock, flags);
1384cf66f9d4SKonrad Rzeszutek Wilk 
1385cf66f9d4SKonrad Rzeszutek Wilk 	return IRQ_HANDLED;
1386cf66f9d4SKonrad Rzeszutek Wilk }
1387cf66f9d4SKonrad Rzeszutek Wilk 
1388d634bf2cSWei Liu static irqreturn_t xennet_rx_interrupt(int irq, void *dev_id)
1389d634bf2cSWei Liu {
13902688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = dev_id;
13912688fcb7SAndrew J. Bennieston 	struct net_device *dev = queue->info->netdev;
1392d634bf2cSWei Liu 
1393d634bf2cSWei Liu 	if (likely(netif_carrier_ok(dev) &&
13942688fcb7SAndrew J. Bennieston 		   RING_HAS_UNCONSUMED_RESPONSES(&queue->rx)))
13952688fcb7SAndrew J. Bennieston 		napi_schedule(&queue->napi);
1396d634bf2cSWei Liu 
1397d634bf2cSWei Liu 	return IRQ_HANDLED;
1398d634bf2cSWei Liu }
1399d634bf2cSWei Liu 
1400d634bf2cSWei Liu static irqreturn_t xennet_interrupt(int irq, void *dev_id)
1401d634bf2cSWei Liu {
1402d634bf2cSWei Liu 	xennet_tx_interrupt(irq, dev_id);
1403d634bf2cSWei Liu 	xennet_rx_interrupt(irq, dev_id);
1404d634bf2cSWei Liu 	return IRQ_HANDLED;
1405d634bf2cSWei Liu }
1406d634bf2cSWei Liu 
#ifdef CONFIG_NET_POLL_CONTROLLER
/*
 * Poll-controller hook: invoke the combined interrupt handler once for each
 * of the device's dev->real_num_tx_queues queues.
 */
static void xennet_poll_controller(struct net_device *dev)
{
	struct netfront_info *np = netdev_priv(dev);
	unsigned int nr_queues = dev->real_num_tx_queues;
	unsigned int q;

	for (q = 0; q < nr_queues; ++q)
		xennet_interrupt(0, &np->queues[q]);
}
#endif
1418cf66f9d4SKonrad Rzeszutek Wilk 
14196c5aa6fcSDenis Kirjanov #define NETBACK_XDP_HEADROOM_DISABLE	0
14206c5aa6fcSDenis Kirjanov #define NETBACK_XDP_HEADROOM_ENABLE	1
14216c5aa6fcSDenis Kirjanov 
14226c5aa6fcSDenis Kirjanov static int talk_to_netback_xdp(struct netfront_info *np, int xdp)
14236c5aa6fcSDenis Kirjanov {
14246c5aa6fcSDenis Kirjanov 	int err;
14256c5aa6fcSDenis Kirjanov 	unsigned short headroom;
14266c5aa6fcSDenis Kirjanov 
14276c5aa6fcSDenis Kirjanov 	headroom = xdp ? XDP_PACKET_HEADROOM : 0;
14286c5aa6fcSDenis Kirjanov 	err = xenbus_printf(XBT_NIL, np->xbdev->nodename,
14296c5aa6fcSDenis Kirjanov 			    "xdp-headroom", "%hu",
14306c5aa6fcSDenis Kirjanov 			    headroom);
14316c5aa6fcSDenis Kirjanov 	if (err)
14326c5aa6fcSDenis Kirjanov 		pr_warn("Error writing xdp-headroom\n");
14336c5aa6fcSDenis Kirjanov 
14346c5aa6fcSDenis Kirjanov 	return err;
14356c5aa6fcSDenis Kirjanov }
14366c5aa6fcSDenis Kirjanov 
14376c5aa6fcSDenis Kirjanov static int xennet_xdp_set(struct net_device *dev, struct bpf_prog *prog,
14386c5aa6fcSDenis Kirjanov 			  struct netlink_ext_ack *extack)
14396c5aa6fcSDenis Kirjanov {
14406c5aa6fcSDenis Kirjanov 	unsigned long max_mtu = XEN_PAGE_SIZE - XDP_PACKET_HEADROOM;
14416c5aa6fcSDenis Kirjanov 	struct netfront_info *np = netdev_priv(dev);
14426c5aa6fcSDenis Kirjanov 	struct bpf_prog *old_prog;
14436c5aa6fcSDenis Kirjanov 	unsigned int i, err;
14446c5aa6fcSDenis Kirjanov 
14456c5aa6fcSDenis Kirjanov 	if (dev->mtu > max_mtu) {
14466c5aa6fcSDenis Kirjanov 		netdev_warn(dev, "XDP requires MTU less than %lu\n", max_mtu);
14476c5aa6fcSDenis Kirjanov 		return -EINVAL;
14486c5aa6fcSDenis Kirjanov 	}
14496c5aa6fcSDenis Kirjanov 
14506c5aa6fcSDenis Kirjanov 	if (!np->netback_has_xdp_headroom)
14516c5aa6fcSDenis Kirjanov 		return 0;
14526c5aa6fcSDenis Kirjanov 
14536c5aa6fcSDenis Kirjanov 	xenbus_switch_state(np->xbdev, XenbusStateReconfiguring);
14546c5aa6fcSDenis Kirjanov 
14556c5aa6fcSDenis Kirjanov 	err = talk_to_netback_xdp(np, prog ? NETBACK_XDP_HEADROOM_ENABLE :
14566c5aa6fcSDenis Kirjanov 				  NETBACK_XDP_HEADROOM_DISABLE);
14576c5aa6fcSDenis Kirjanov 	if (err)
14586c5aa6fcSDenis Kirjanov 		return err;
14596c5aa6fcSDenis Kirjanov 
14606c5aa6fcSDenis Kirjanov 	/* avoid the race with XDP headroom adjustment */
14616c5aa6fcSDenis Kirjanov 	wait_event(module_wq,
14626c5aa6fcSDenis Kirjanov 		   xenbus_read_driver_state(np->xbdev->otherend) ==
14636c5aa6fcSDenis Kirjanov 		   XenbusStateReconfigured);
14646c5aa6fcSDenis Kirjanov 	np->netfront_xdp_enabled = true;
14656c5aa6fcSDenis Kirjanov 
14666c5aa6fcSDenis Kirjanov 	old_prog = rtnl_dereference(np->queues[0].xdp_prog);
14676c5aa6fcSDenis Kirjanov 
14686c5aa6fcSDenis Kirjanov 	if (prog)
14696c5aa6fcSDenis Kirjanov 		bpf_prog_add(prog, dev->real_num_tx_queues);
14706c5aa6fcSDenis Kirjanov 
14716c5aa6fcSDenis Kirjanov 	for (i = 0; i < dev->real_num_tx_queues; ++i)
14726c5aa6fcSDenis Kirjanov 		rcu_assign_pointer(np->queues[i].xdp_prog, prog);
14736c5aa6fcSDenis Kirjanov 
14746c5aa6fcSDenis Kirjanov 	if (old_prog)
14756c5aa6fcSDenis Kirjanov 		for (i = 0; i < dev->real_num_tx_queues; ++i)
14766c5aa6fcSDenis Kirjanov 			bpf_prog_put(old_prog);
14776c5aa6fcSDenis Kirjanov 
14786c5aa6fcSDenis Kirjanov 	xenbus_switch_state(np->xbdev, XenbusStateConnected);
14796c5aa6fcSDenis Kirjanov 
14806c5aa6fcSDenis Kirjanov 	return 0;
14816c5aa6fcSDenis Kirjanov }
14826c5aa6fcSDenis Kirjanov 
14836c5aa6fcSDenis Kirjanov static int xennet_xdp(struct net_device *dev, struct netdev_bpf *xdp)
14846c5aa6fcSDenis Kirjanov {
14856c5aa6fcSDenis Kirjanov 	switch (xdp->command) {
14866c5aa6fcSDenis Kirjanov 	case XDP_SETUP_PROG:
14876c5aa6fcSDenis Kirjanov 		return xennet_xdp_set(dev, xdp->prog, xdp->extack);
14886c5aa6fcSDenis Kirjanov 	default:
14896c5aa6fcSDenis Kirjanov 		return -EINVAL;
14906c5aa6fcSDenis Kirjanov 	}
14916c5aa6fcSDenis Kirjanov }
14926c5aa6fcSDenis Kirjanov 
14930a0b9d2eSStephen Hemminger static const struct net_device_ops xennet_netdev_ops = {
14940a0b9d2eSStephen Hemminger 	.ndo_open            = xennet_open,
14950a0b9d2eSStephen Hemminger 	.ndo_stop            = xennet_close,
14960a0b9d2eSStephen Hemminger 	.ndo_start_xmit      = xennet_start_xmit,
14970a0b9d2eSStephen Hemminger 	.ndo_change_mtu	     = xennet_change_mtu,
1498e00f85beSstephen hemminger 	.ndo_get_stats64     = xennet_get_stats64,
14990a0b9d2eSStephen Hemminger 	.ndo_set_mac_address = eth_mac_addr,
15000a0b9d2eSStephen Hemminger 	.ndo_validate_addr   = eth_validate_addr,
1501fb507934SMichał Mirosław 	.ndo_fix_features    = xennet_fix_features,
1502fb507934SMichał Mirosław 	.ndo_set_features    = xennet_set_features,
15032688fcb7SAndrew J. Bennieston 	.ndo_select_queue    = xennet_select_queue,
15046c5aa6fcSDenis Kirjanov 	.ndo_bpf            = xennet_xdp,
15056c5aa6fcSDenis Kirjanov 	.ndo_xdp_xmit	    = xennet_xdp_xmit,
1506cf66f9d4SKonrad Rzeszutek Wilk #ifdef CONFIG_NET_POLL_CONTROLLER
1507cf66f9d4SKonrad Rzeszutek Wilk 	.ndo_poll_controller = xennet_poll_controller,
1508cf66f9d4SKonrad Rzeszutek Wilk #endif
15090a0b9d2eSStephen Hemminger };
15100a0b9d2eSStephen Hemminger 
1511900e1833SDavid Vrabel static void xennet_free_netdev(struct net_device *netdev)
1512900e1833SDavid Vrabel {
1513900e1833SDavid Vrabel 	struct netfront_info *np = netdev_priv(netdev);
1514900e1833SDavid Vrabel 
1515900e1833SDavid Vrabel 	free_percpu(np->rx_stats);
1516900e1833SDavid Vrabel 	free_percpu(np->tx_stats);
1517900e1833SDavid Vrabel 	free_netdev(netdev);
1518900e1833SDavid Vrabel }
1519900e1833SDavid Vrabel 
15208e0e46bbSBill Pemberton static struct net_device *xennet_create_dev(struct xenbus_device *dev)
15210d160211SJeremy Fitzhardinge {
15222688fcb7SAndrew J. Bennieston 	int err;
15230d160211SJeremy Fitzhardinge 	struct net_device *netdev;
15240d160211SJeremy Fitzhardinge 	struct netfront_info *np;
15250d160211SJeremy Fitzhardinge 
152650ee6061SAndrew J. Bennieston 	netdev = alloc_etherdev_mq(sizeof(struct netfront_info), xennet_max_queues);
152741de8d4cSJoe Perches 	if (!netdev)
15280d160211SJeremy Fitzhardinge 		return ERR_PTR(-ENOMEM);
15290d160211SJeremy Fitzhardinge 
15300d160211SJeremy Fitzhardinge 	np                   = netdev_priv(netdev);
15310d160211SJeremy Fitzhardinge 	np->xbdev            = dev;
15320d160211SJeremy Fitzhardinge 
15332688fcb7SAndrew J. Bennieston 	np->queues = NULL;
15340d160211SJeremy Fitzhardinge 
1535e00f85beSstephen hemminger 	err = -ENOMEM;
1536900e1833SDavid Vrabel 	np->rx_stats = netdev_alloc_pcpu_stats(struct netfront_stats);
1537900e1833SDavid Vrabel 	if (np->rx_stats == NULL)
1538900e1833SDavid Vrabel 		goto exit;
1539900e1833SDavid Vrabel 	np->tx_stats = netdev_alloc_pcpu_stats(struct netfront_stats);
1540900e1833SDavid Vrabel 	if (np->tx_stats == NULL)
1541e00f85beSstephen hemminger 		goto exit;
1542e00f85beSstephen hemminger 
15430a0b9d2eSStephen Hemminger 	netdev->netdev_ops	= &xennet_netdev_ops;
15440a0b9d2eSStephen Hemminger 
1545fb507934SMichał Mirosław 	netdev->features        = NETIF_F_IP_CSUM | NETIF_F_RXCSUM |
1546fb507934SMichał Mirosław 				  NETIF_F_GSO_ROBUST;
15472c0057deSPaul Durrant 	netdev->hw_features	= NETIF_F_SG |
15482c0057deSPaul Durrant 				  NETIF_F_IPV6_CSUM |
15492c0057deSPaul Durrant 				  NETIF_F_TSO | NETIF_F_TSO6;
15500d160211SJeremy Fitzhardinge 
1551fc3e5941SIan Campbell 	/*
1552fc3e5941SIan Campbell          * Assume that all hw features are available for now. This set
1553fc3e5941SIan Campbell          * will be adjusted by the call to netdev_update_features() in
1554fc3e5941SIan Campbell          * xennet_connect() which is the earliest point where we can
1555fc3e5941SIan Campbell          * negotiate with the backend regarding supported features.
1556fc3e5941SIan Campbell          */
1557fc3e5941SIan Campbell 	netdev->features |= netdev->hw_features;
1558fc3e5941SIan Campbell 
15597ad24ea4SWilfried Klaebe 	netdev->ethtool_ops = &xennet_ethtool_ops;
1560e1043a4bSMohammed Gamal 	netdev->min_mtu = ETH_MIN_MTU;
1561d0c2c997SJarod Wilson 	netdev->max_mtu = XEN_NETIF_MAX_TX_SIZE;
15620d160211SJeremy Fitzhardinge 	SET_NETDEV_DEV(netdev, &dev->dev);
15630d160211SJeremy Fitzhardinge 
15640d160211SJeremy Fitzhardinge 	np->netdev = netdev;
15656c5aa6fcSDenis Kirjanov 	np->netfront_xdp_enabled = false;
15660d160211SJeremy Fitzhardinge 
15670d160211SJeremy Fitzhardinge 	netif_carrier_off(netdev);
15680d160211SJeremy Fitzhardinge 
1569c2c63310SAndrea Righi 	do {
1570b707fda2SEduardo Otubo 		xenbus_switch_state(dev, XenbusStateInitialising);
1571c2c63310SAndrea Righi 		err = wait_event_timeout(module_wq,
1572822fb18aSXiao Liang 				 xenbus_read_driver_state(dev->otherend) !=
1573822fb18aSXiao Liang 				 XenbusStateClosed &&
1574822fb18aSXiao Liang 				 xenbus_read_driver_state(dev->otherend) !=
1575c2c63310SAndrea Righi 				 XenbusStateUnknown, XENNET_TIMEOUT);
1576c2c63310SAndrea Righi 	} while (!err);
1577c2c63310SAndrea Righi 
15780d160211SJeremy Fitzhardinge 	return netdev;
15790d160211SJeremy Fitzhardinge 
15800d160211SJeremy Fitzhardinge  exit:
1581900e1833SDavid Vrabel 	xennet_free_netdev(netdev);
15820d160211SJeremy Fitzhardinge 	return ERR_PTR(err);
15830d160211SJeremy Fitzhardinge }
15840d160211SJeremy Fitzhardinge 
15850d160211SJeremy Fitzhardinge /**
15860d160211SJeremy Fitzhardinge  * Entry point to this code when a new device is created.  Allocate the basic
15870d160211SJeremy Fitzhardinge  * structures and the ring buffers for communication with the backend, and
15880d160211SJeremy Fitzhardinge  * inform the backend of the appropriate details for those.
15890d160211SJeremy Fitzhardinge  */
15908e0e46bbSBill Pemberton static int netfront_probe(struct xenbus_device *dev,
15910d160211SJeremy Fitzhardinge 			  const struct xenbus_device_id *id)
15920d160211SJeremy Fitzhardinge {
15930d160211SJeremy Fitzhardinge 	int err;
15940d160211SJeremy Fitzhardinge 	struct net_device *netdev;
15950d160211SJeremy Fitzhardinge 	struct netfront_info *info;
15960d160211SJeremy Fitzhardinge 
15970d160211SJeremy Fitzhardinge 	netdev = xennet_create_dev(dev);
15980d160211SJeremy Fitzhardinge 	if (IS_ERR(netdev)) {
15990d160211SJeremy Fitzhardinge 		err = PTR_ERR(netdev);
16000d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "creating netdev");
16010d160211SJeremy Fitzhardinge 		return err;
16020d160211SJeremy Fitzhardinge 	}
16030d160211SJeremy Fitzhardinge 
16040d160211SJeremy Fitzhardinge 	info = netdev_priv(netdev);
16051b713e00SGreg Kroah-Hartman 	dev_set_drvdata(&dev->dev, info);
160627b917e5STakashi Iwai #ifdef CONFIG_SYSFS
160727b917e5STakashi Iwai 	info->netdev->sysfs_groups[0] = &xennet_dev_group;
160827b917e5STakashi Iwai #endif
16090d160211SJeremy Fitzhardinge 
16100d160211SJeremy Fitzhardinge 	return 0;
16110d160211SJeremy Fitzhardinge }
16120d160211SJeremy Fitzhardinge 
16130d160211SJeremy Fitzhardinge static void xennet_end_access(int ref, void *page)
16140d160211SJeremy Fitzhardinge {
16150d160211SJeremy Fitzhardinge 	/* This frees the page as a side-effect */
16160d160211SJeremy Fitzhardinge 	if (ref != GRANT_INVALID_REF)
16170d160211SJeremy Fitzhardinge 		gnttab_end_foreign_access(ref, 0, (unsigned long)page);
16180d160211SJeremy Fitzhardinge }
16190d160211SJeremy Fitzhardinge 
16200d160211SJeremy Fitzhardinge static void xennet_disconnect_backend(struct netfront_info *info)
16210d160211SJeremy Fitzhardinge {
16222688fcb7SAndrew J. Bennieston 	unsigned int i = 0;
16232688fcb7SAndrew J. Bennieston 	unsigned int num_queues = info->netdev->real_num_tx_queues;
16240d160211SJeremy Fitzhardinge 
1625f9feb1e6SDavid Vrabel 	netif_carrier_off(info->netdev);
1626f9feb1e6SDavid Vrabel 
16279a873c71SChas Williams 	for (i = 0; i < num_queues && info->queues; ++i) {
162876541869SDavid Vrabel 		struct netfront_queue *queue = &info->queues[i];
162976541869SDavid Vrabel 
163074470954SBoris Ostrovsky 		del_timer_sync(&queue->rx_refill_timer);
163174470954SBoris Ostrovsky 
16322688fcb7SAndrew J. Bennieston 		if (queue->tx_irq && (queue->tx_irq == queue->rx_irq))
16332688fcb7SAndrew J. Bennieston 			unbind_from_irqhandler(queue->tx_irq, queue);
16342688fcb7SAndrew J. Bennieston 		if (queue->tx_irq && (queue->tx_irq != queue->rx_irq)) {
16352688fcb7SAndrew J. Bennieston 			unbind_from_irqhandler(queue->tx_irq, queue);
16362688fcb7SAndrew J. Bennieston 			unbind_from_irqhandler(queue->rx_irq, queue);
1637d634bf2cSWei Liu 		}
16382688fcb7SAndrew J. Bennieston 		queue->tx_evtchn = queue->rx_evtchn = 0;
16392688fcb7SAndrew J. Bennieston 		queue->tx_irq = queue->rx_irq = 0;
16400d160211SJeremy Fitzhardinge 
1641274b0455SChas Williams 		if (netif_running(info->netdev))
1642f9feb1e6SDavid Vrabel 			napi_synchronize(&queue->napi);
1643f9feb1e6SDavid Vrabel 
1644a5b5dc3cSDavid Vrabel 		xennet_release_tx_bufs(queue);
1645a5b5dc3cSDavid Vrabel 		xennet_release_rx_bufs(queue);
1646a5b5dc3cSDavid Vrabel 		gnttab_free_grant_references(queue->gref_tx_head);
1647a5b5dc3cSDavid Vrabel 		gnttab_free_grant_references(queue->gref_rx_head);
1648a5b5dc3cSDavid Vrabel 
16490d160211SJeremy Fitzhardinge 		/* End access and free the pages */
16502688fcb7SAndrew J. Bennieston 		xennet_end_access(queue->tx_ring_ref, queue->tx.sring);
16512688fcb7SAndrew J. Bennieston 		xennet_end_access(queue->rx_ring_ref, queue->rx.sring);
16520d160211SJeremy Fitzhardinge 
16532688fcb7SAndrew J. Bennieston 		queue->tx_ring_ref = GRANT_INVALID_REF;
16542688fcb7SAndrew J. Bennieston 		queue->rx_ring_ref = GRANT_INVALID_REF;
16552688fcb7SAndrew J. Bennieston 		queue->tx.sring = NULL;
16562688fcb7SAndrew J. Bennieston 		queue->rx.sring = NULL;
16576c5aa6fcSDenis Kirjanov 
16586c5aa6fcSDenis Kirjanov 		page_pool_destroy(queue->page_pool);
16592688fcb7SAndrew J. Bennieston 	}
16600d160211SJeremy Fitzhardinge }
16610d160211SJeremy Fitzhardinge 
16620d160211SJeremy Fitzhardinge /**
16630d160211SJeremy Fitzhardinge  * We are reconnecting to the backend, due to a suspend/resume, or a backend
16640d160211SJeremy Fitzhardinge  * driver restart.  We tear down our netif structure and recreate it, but
16650d160211SJeremy Fitzhardinge  * leave the device-layer structures intact so that this is transparent to the
16660d160211SJeremy Fitzhardinge  * rest of the kernel.
16670d160211SJeremy Fitzhardinge  */
16680d160211SJeremy Fitzhardinge static int netfront_resume(struct xenbus_device *dev)
16690d160211SJeremy Fitzhardinge {
16701b713e00SGreg Kroah-Hartman 	struct netfront_info *info = dev_get_drvdata(&dev->dev);
16710d160211SJeremy Fitzhardinge 
16720d160211SJeremy Fitzhardinge 	dev_dbg(&dev->dev, "%s\n", dev->nodename);
16730d160211SJeremy Fitzhardinge 
16740d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
16750d160211SJeremy Fitzhardinge 	return 0;
16760d160211SJeremy Fitzhardinge }
16770d160211SJeremy Fitzhardinge 
16780d160211SJeremy Fitzhardinge static int xen_net_read_mac(struct xenbus_device *dev, u8 mac[])
16790d160211SJeremy Fitzhardinge {
16800d160211SJeremy Fitzhardinge 	char *s, *e, *macstr;
16810d160211SJeremy Fitzhardinge 	int i;
16820d160211SJeremy Fitzhardinge 
16830d160211SJeremy Fitzhardinge 	macstr = s = xenbus_read(XBT_NIL, dev->nodename, "mac", NULL);
16840d160211SJeremy Fitzhardinge 	if (IS_ERR(macstr))
16850d160211SJeremy Fitzhardinge 		return PTR_ERR(macstr);
16860d160211SJeremy Fitzhardinge 
16870d160211SJeremy Fitzhardinge 	for (i = 0; i < ETH_ALEN; i++) {
16880d160211SJeremy Fitzhardinge 		mac[i] = simple_strtoul(s, &e, 16);
16890d160211SJeremy Fitzhardinge 		if ((s == e) || (*e != ((i == ETH_ALEN-1) ? '\0' : ':'))) {
16900d160211SJeremy Fitzhardinge 			kfree(macstr);
16910d160211SJeremy Fitzhardinge 			return -ENOENT;
16920d160211SJeremy Fitzhardinge 		}
16930d160211SJeremy Fitzhardinge 		s = e+1;
16940d160211SJeremy Fitzhardinge 	}
16950d160211SJeremy Fitzhardinge 
16960d160211SJeremy Fitzhardinge 	kfree(macstr);
16970d160211SJeremy Fitzhardinge 	return 0;
16980d160211SJeremy Fitzhardinge }
16990d160211SJeremy Fitzhardinge 
17002688fcb7SAndrew J. Bennieston static int setup_netfront_single(struct netfront_queue *queue)
1701d634bf2cSWei Liu {
1702d634bf2cSWei Liu 	int err;
1703d634bf2cSWei Liu 
17042688fcb7SAndrew J. Bennieston 	err = xenbus_alloc_evtchn(queue->info->xbdev, &queue->tx_evtchn);
1705d634bf2cSWei Liu 	if (err < 0)
1706d634bf2cSWei Liu 		goto fail;
1707d634bf2cSWei Liu 
17082688fcb7SAndrew J. Bennieston 	err = bind_evtchn_to_irqhandler(queue->tx_evtchn,
1709d634bf2cSWei Liu 					xennet_interrupt,
17102688fcb7SAndrew J. Bennieston 					0, queue->info->netdev->name, queue);
1711d634bf2cSWei Liu 	if (err < 0)
1712d634bf2cSWei Liu 		goto bind_fail;
17132688fcb7SAndrew J. Bennieston 	queue->rx_evtchn = queue->tx_evtchn;
17142688fcb7SAndrew J. Bennieston 	queue->rx_irq = queue->tx_irq = err;
1715d634bf2cSWei Liu 
1716d634bf2cSWei Liu 	return 0;
1717d634bf2cSWei Liu 
1718d634bf2cSWei Liu bind_fail:
17192688fcb7SAndrew J. Bennieston 	xenbus_free_evtchn(queue->info->xbdev, queue->tx_evtchn);
17202688fcb7SAndrew J. Bennieston 	queue->tx_evtchn = 0;
1721d634bf2cSWei Liu fail:
1722d634bf2cSWei Liu 	return err;
1723d634bf2cSWei Liu }
1724d634bf2cSWei Liu 
17252688fcb7SAndrew J. Bennieston static int setup_netfront_split(struct netfront_queue *queue)
1726d634bf2cSWei Liu {
1727d634bf2cSWei Liu 	int err;
1728d634bf2cSWei Liu 
17292688fcb7SAndrew J. Bennieston 	err = xenbus_alloc_evtchn(queue->info->xbdev, &queue->tx_evtchn);
1730d634bf2cSWei Liu 	if (err < 0)
1731d634bf2cSWei Liu 		goto fail;
17322688fcb7SAndrew J. Bennieston 	err = xenbus_alloc_evtchn(queue->info->xbdev, &queue->rx_evtchn);
1733d634bf2cSWei Liu 	if (err < 0)
1734d634bf2cSWei Liu 		goto alloc_rx_evtchn_fail;
1735d634bf2cSWei Liu 
17362688fcb7SAndrew J. Bennieston 	snprintf(queue->tx_irq_name, sizeof(queue->tx_irq_name),
17372688fcb7SAndrew J. Bennieston 		 "%s-tx", queue->name);
17382688fcb7SAndrew J. Bennieston 	err = bind_evtchn_to_irqhandler(queue->tx_evtchn,
1739d634bf2cSWei Liu 					xennet_tx_interrupt,
17402688fcb7SAndrew J. Bennieston 					0, queue->tx_irq_name, queue);
1741d634bf2cSWei Liu 	if (err < 0)
1742d634bf2cSWei Liu 		goto bind_tx_fail;
17432688fcb7SAndrew J. Bennieston 	queue->tx_irq = err;
1744d634bf2cSWei Liu 
17452688fcb7SAndrew J. Bennieston 	snprintf(queue->rx_irq_name, sizeof(queue->rx_irq_name),
17462688fcb7SAndrew J. Bennieston 		 "%s-rx", queue->name);
17472688fcb7SAndrew J. Bennieston 	err = bind_evtchn_to_irqhandler(queue->rx_evtchn,
1748d634bf2cSWei Liu 					xennet_rx_interrupt,
17492688fcb7SAndrew J. Bennieston 					0, queue->rx_irq_name, queue);
1750d634bf2cSWei Liu 	if (err < 0)
1751d634bf2cSWei Liu 		goto bind_rx_fail;
17522688fcb7SAndrew J. Bennieston 	queue->rx_irq = err;
1753d634bf2cSWei Liu 
1754d634bf2cSWei Liu 	return 0;
1755d634bf2cSWei Liu 
1756d634bf2cSWei Liu bind_rx_fail:
17572688fcb7SAndrew J. Bennieston 	unbind_from_irqhandler(queue->tx_irq, queue);
17582688fcb7SAndrew J. Bennieston 	queue->tx_irq = 0;
1759d634bf2cSWei Liu bind_tx_fail:
17602688fcb7SAndrew J. Bennieston 	xenbus_free_evtchn(queue->info->xbdev, queue->rx_evtchn);
17612688fcb7SAndrew J. Bennieston 	queue->rx_evtchn = 0;
1762d634bf2cSWei Liu alloc_rx_evtchn_fail:
17632688fcb7SAndrew J. Bennieston 	xenbus_free_evtchn(queue->info->xbdev, queue->tx_evtchn);
17642688fcb7SAndrew J. Bennieston 	queue->tx_evtchn = 0;
1765d634bf2cSWei Liu fail:
1766d634bf2cSWei Liu 	return err;
1767d634bf2cSWei Liu }
1768d634bf2cSWei Liu 
17692688fcb7SAndrew J. Bennieston static int setup_netfront(struct xenbus_device *dev,
17702688fcb7SAndrew J. Bennieston 			struct netfront_queue *queue, unsigned int feature_split_evtchn)
17710d160211SJeremy Fitzhardinge {
17720d160211SJeremy Fitzhardinge 	struct xen_netif_tx_sring *txs;
17730d160211SJeremy Fitzhardinge 	struct xen_netif_rx_sring *rxs;
1774ccc9d90aSWei Liu 	grant_ref_t gref;
17750d160211SJeremy Fitzhardinge 	int err;
17760d160211SJeremy Fitzhardinge 
17772688fcb7SAndrew J. Bennieston 	queue->tx_ring_ref = GRANT_INVALID_REF;
17782688fcb7SAndrew J. Bennieston 	queue->rx_ring_ref = GRANT_INVALID_REF;
17792688fcb7SAndrew J. Bennieston 	queue->rx.sring = NULL;
17802688fcb7SAndrew J. Bennieston 	queue->tx.sring = NULL;
17810d160211SJeremy Fitzhardinge 
1782a144ff09SIan Campbell 	txs = (struct xen_netif_tx_sring *)get_zeroed_page(GFP_NOIO | __GFP_HIGH);
17830d160211SJeremy Fitzhardinge 	if (!txs) {
17840d160211SJeremy Fitzhardinge 		err = -ENOMEM;
17850d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "allocating tx ring page");
17860d160211SJeremy Fitzhardinge 		goto fail;
17870d160211SJeremy Fitzhardinge 	}
17880d160211SJeremy Fitzhardinge 	SHARED_RING_INIT(txs);
178930c5d7f0SJulien Grall 	FRONT_RING_INIT(&queue->tx, txs, XEN_PAGE_SIZE);
17900d160211SJeremy Fitzhardinge 
1791ccc9d90aSWei Liu 	err = xenbus_grant_ring(dev, txs, 1, &gref);
17921ca2983aSWei Liu 	if (err < 0)
17931ca2983aSWei Liu 		goto grant_tx_ring_fail;
1794ccc9d90aSWei Liu 	queue->tx_ring_ref = gref;
17950d160211SJeremy Fitzhardinge 
1796a144ff09SIan Campbell 	rxs = (struct xen_netif_rx_sring *)get_zeroed_page(GFP_NOIO | __GFP_HIGH);
17970d160211SJeremy Fitzhardinge 	if (!rxs) {
17980d160211SJeremy Fitzhardinge 		err = -ENOMEM;
17990d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "allocating rx ring page");
18001ca2983aSWei Liu 		goto alloc_rx_ring_fail;
18010d160211SJeremy Fitzhardinge 	}
18020d160211SJeremy Fitzhardinge 	SHARED_RING_INIT(rxs);
180330c5d7f0SJulien Grall 	FRONT_RING_INIT(&queue->rx, rxs, XEN_PAGE_SIZE);
18040d160211SJeremy Fitzhardinge 
1805ccc9d90aSWei Liu 	err = xenbus_grant_ring(dev, rxs, 1, &gref);
18061ca2983aSWei Liu 	if (err < 0)
18071ca2983aSWei Liu 		goto grant_rx_ring_fail;
1808ccc9d90aSWei Liu 	queue->rx_ring_ref = gref;
18090d160211SJeremy Fitzhardinge 
1810d634bf2cSWei Liu 	if (feature_split_evtchn)
18112688fcb7SAndrew J. Bennieston 		err = setup_netfront_split(queue);
1812d634bf2cSWei Liu 	/* setup single event channel if
1813d634bf2cSWei Liu 	 *  a) feature-split-event-channels == 0
1814d634bf2cSWei Liu 	 *  b) feature-split-event-channels == 1 but failed to setup
1815d634bf2cSWei Liu 	 */
1816d634bf2cSWei Liu 	if (!feature_split_evtchn || (feature_split_evtchn && err))
18172688fcb7SAndrew J. Bennieston 		err = setup_netfront_single(queue);
1818d634bf2cSWei Liu 
18190d160211SJeremy Fitzhardinge 	if (err)
18201ca2983aSWei Liu 		goto alloc_evtchn_fail;
18210d160211SJeremy Fitzhardinge 
18220d160211SJeremy Fitzhardinge 	return 0;
18230d160211SJeremy Fitzhardinge 
18241ca2983aSWei Liu 	/* If we fail to setup netfront, it is safe to just revoke access to
18251ca2983aSWei Liu 	 * granted pages because backend is not accessing it at this point.
18261ca2983aSWei Liu 	 */
18271ca2983aSWei Liu alloc_evtchn_fail:
18282688fcb7SAndrew J. Bennieston 	gnttab_end_foreign_access_ref(queue->rx_ring_ref, 0);
18291ca2983aSWei Liu grant_rx_ring_fail:
18301ca2983aSWei Liu 	free_page((unsigned long)rxs);
18311ca2983aSWei Liu alloc_rx_ring_fail:
18322688fcb7SAndrew J. Bennieston 	gnttab_end_foreign_access_ref(queue->tx_ring_ref, 0);
18331ca2983aSWei Liu grant_tx_ring_fail:
18341ca2983aSWei Liu 	free_page((unsigned long)txs);
18350d160211SJeremy Fitzhardinge fail:
18360d160211SJeremy Fitzhardinge 	return err;
18370d160211SJeremy Fitzhardinge }
18380d160211SJeremy Fitzhardinge 
18392688fcb7SAndrew J. Bennieston /* Queue-specific initialisation
18402688fcb7SAndrew J. Bennieston  * This used to be done in xennet_create_dev() but must now
18412688fcb7SAndrew J. Bennieston  * be run per-queue.
18422688fcb7SAndrew J. Bennieston  */
18432688fcb7SAndrew J. Bennieston static int xennet_init_queue(struct netfront_queue *queue)
18442688fcb7SAndrew J. Bennieston {
18452688fcb7SAndrew J. Bennieston 	unsigned short i;
18462688fcb7SAndrew J. Bennieston 	int err = 0;
184721f2706bSXiao Liang 	char *devid;
18482688fcb7SAndrew J. Bennieston 
18492688fcb7SAndrew J. Bennieston 	spin_lock_init(&queue->tx_lock);
18502688fcb7SAndrew J. Bennieston 	spin_lock_init(&queue->rx_lock);
18512688fcb7SAndrew J. Bennieston 
1852e99e88a9SKees Cook 	timer_setup(&queue->rx_refill_timer, rx_refill_timeout, 0);
18532688fcb7SAndrew J. Bennieston 
185421f2706bSXiao Liang 	devid = strrchr(queue->info->xbdev->nodename, '/') + 1;
185521f2706bSXiao Liang 	snprintf(queue->name, sizeof(queue->name), "vif%s-q%u",
185621f2706bSXiao Liang 		 devid, queue->id);
18578b715010SWei Liu 
18582688fcb7SAndrew J. Bennieston 	/* Initialise tx_skbs as a free chain containing every entry. */
18592688fcb7SAndrew J. Bennieston 	queue->tx_skb_freelist = 0;
18602688fcb7SAndrew J. Bennieston 	for (i = 0; i < NET_TX_RING_SIZE; i++) {
18612688fcb7SAndrew J. Bennieston 		skb_entry_set_link(&queue->tx_skbs[i], i+1);
18622688fcb7SAndrew J. Bennieston 		queue->grant_tx_ref[i] = GRANT_INVALID_REF;
18632688fcb7SAndrew J. Bennieston 		queue->grant_tx_page[i] = NULL;
18642688fcb7SAndrew J. Bennieston 	}
18652688fcb7SAndrew J. Bennieston 
18662688fcb7SAndrew J. Bennieston 	/* Clear out rx_skbs */
18672688fcb7SAndrew J. Bennieston 	for (i = 0; i < NET_RX_RING_SIZE; i++) {
18682688fcb7SAndrew J. Bennieston 		queue->rx_skbs[i] = NULL;
18692688fcb7SAndrew J. Bennieston 		queue->grant_rx_ref[i] = GRANT_INVALID_REF;
18702688fcb7SAndrew J. Bennieston 	}
18712688fcb7SAndrew J. Bennieston 
18722688fcb7SAndrew J. Bennieston 	/* A grant for every tx ring slot */
18731f3c2ebaSDavid Vrabel 	if (gnttab_alloc_grant_references(NET_TX_RING_SIZE,
18742688fcb7SAndrew J. Bennieston 					  &queue->gref_tx_head) < 0) {
18752688fcb7SAndrew J. Bennieston 		pr_alert("can't alloc tx grant refs\n");
18762688fcb7SAndrew J. Bennieston 		err = -ENOMEM;
18772688fcb7SAndrew J. Bennieston 		goto exit;
18782688fcb7SAndrew J. Bennieston 	}
18792688fcb7SAndrew J. Bennieston 
18802688fcb7SAndrew J. Bennieston 	/* A grant for every rx ring slot */
18811f3c2ebaSDavid Vrabel 	if (gnttab_alloc_grant_references(NET_RX_RING_SIZE,
18822688fcb7SAndrew J. Bennieston 					  &queue->gref_rx_head) < 0) {
18832688fcb7SAndrew J. Bennieston 		pr_alert("can't alloc rx grant refs\n");
18842688fcb7SAndrew J. Bennieston 		err = -ENOMEM;
18852688fcb7SAndrew J. Bennieston 		goto exit_free_tx;
18862688fcb7SAndrew J. Bennieston 	}
18872688fcb7SAndrew J. Bennieston 
18882688fcb7SAndrew J. Bennieston 	return 0;
18892688fcb7SAndrew J. Bennieston 
18902688fcb7SAndrew J. Bennieston  exit_free_tx:
18912688fcb7SAndrew J. Bennieston 	gnttab_free_grant_references(queue->gref_tx_head);
18922688fcb7SAndrew J. Bennieston  exit:
18932688fcb7SAndrew J. Bennieston 	return err;
18942688fcb7SAndrew J. Bennieston }
18952688fcb7SAndrew J. Bennieston 
189650ee6061SAndrew J. Bennieston static int write_queue_xenstore_keys(struct netfront_queue *queue,
189750ee6061SAndrew J. Bennieston 			   struct xenbus_transaction *xbt, int write_hierarchical)
189850ee6061SAndrew J. Bennieston {
189950ee6061SAndrew J. Bennieston 	/* Write the queue-specific keys into XenStore in the traditional
190050ee6061SAndrew J. Bennieston 	 * way for a single queue, or in a queue subkeys for multiple
190150ee6061SAndrew J. Bennieston 	 * queues.
190250ee6061SAndrew J. Bennieston 	 */
190350ee6061SAndrew J. Bennieston 	struct xenbus_device *dev = queue->info->xbdev;
190450ee6061SAndrew J. Bennieston 	int err;
190550ee6061SAndrew J. Bennieston 	const char *message;
190650ee6061SAndrew J. Bennieston 	char *path;
190750ee6061SAndrew J. Bennieston 	size_t pathsize;
190850ee6061SAndrew J. Bennieston 
190950ee6061SAndrew J. Bennieston 	/* Choose the correct place to write the keys */
191050ee6061SAndrew J. Bennieston 	if (write_hierarchical) {
191150ee6061SAndrew J. Bennieston 		pathsize = strlen(dev->nodename) + 10;
191250ee6061SAndrew J. Bennieston 		path = kzalloc(pathsize, GFP_KERNEL);
191350ee6061SAndrew J. Bennieston 		if (!path) {
191450ee6061SAndrew J. Bennieston 			err = -ENOMEM;
191550ee6061SAndrew J. Bennieston 			message = "out of memory while writing ring references";
191650ee6061SAndrew J. Bennieston 			goto error;
191750ee6061SAndrew J. Bennieston 		}
191850ee6061SAndrew J. Bennieston 		snprintf(path, pathsize, "%s/queue-%u",
191950ee6061SAndrew J. Bennieston 				dev->nodename, queue->id);
192050ee6061SAndrew J. Bennieston 	} else {
192150ee6061SAndrew J. Bennieston 		path = (char *)dev->nodename;
192250ee6061SAndrew J. Bennieston 	}
192350ee6061SAndrew J. Bennieston 
192450ee6061SAndrew J. Bennieston 	/* Write ring references */
192550ee6061SAndrew J. Bennieston 	err = xenbus_printf(*xbt, path, "tx-ring-ref", "%u",
192650ee6061SAndrew J. Bennieston 			queue->tx_ring_ref);
192750ee6061SAndrew J. Bennieston 	if (err) {
192850ee6061SAndrew J. Bennieston 		message = "writing tx-ring-ref";
192950ee6061SAndrew J. Bennieston 		goto error;
193050ee6061SAndrew J. Bennieston 	}
193150ee6061SAndrew J. Bennieston 
193250ee6061SAndrew J. Bennieston 	err = xenbus_printf(*xbt, path, "rx-ring-ref", "%u",
193350ee6061SAndrew J. Bennieston 			queue->rx_ring_ref);
193450ee6061SAndrew J. Bennieston 	if (err) {
193550ee6061SAndrew J. Bennieston 		message = "writing rx-ring-ref";
193650ee6061SAndrew J. Bennieston 		goto error;
193750ee6061SAndrew J. Bennieston 	}
193850ee6061SAndrew J. Bennieston 
193950ee6061SAndrew J. Bennieston 	/* Write event channels; taking into account both shared
194050ee6061SAndrew J. Bennieston 	 * and split event channel scenarios.
194150ee6061SAndrew J. Bennieston 	 */
194250ee6061SAndrew J. Bennieston 	if (queue->tx_evtchn == queue->rx_evtchn) {
194350ee6061SAndrew J. Bennieston 		/* Shared event channel */
194450ee6061SAndrew J. Bennieston 		err = xenbus_printf(*xbt, path,
194550ee6061SAndrew J. Bennieston 				"event-channel", "%u", queue->tx_evtchn);
194650ee6061SAndrew J. Bennieston 		if (err) {
194750ee6061SAndrew J. Bennieston 			message = "writing event-channel";
194850ee6061SAndrew J. Bennieston 			goto error;
194950ee6061SAndrew J. Bennieston 		}
195050ee6061SAndrew J. Bennieston 	} else {
195150ee6061SAndrew J. Bennieston 		/* Split event channels */
195250ee6061SAndrew J. Bennieston 		err = xenbus_printf(*xbt, path,
195350ee6061SAndrew J. Bennieston 				"event-channel-tx", "%u", queue->tx_evtchn);
195450ee6061SAndrew J. Bennieston 		if (err) {
195550ee6061SAndrew J. Bennieston 			message = "writing event-channel-tx";
195650ee6061SAndrew J. Bennieston 			goto error;
195750ee6061SAndrew J. Bennieston 		}
195850ee6061SAndrew J. Bennieston 
195950ee6061SAndrew J. Bennieston 		err = xenbus_printf(*xbt, path,
196050ee6061SAndrew J. Bennieston 				"event-channel-rx", "%u", queue->rx_evtchn);
196150ee6061SAndrew J. Bennieston 		if (err) {
196250ee6061SAndrew J. Bennieston 			message = "writing event-channel-rx";
196350ee6061SAndrew J. Bennieston 			goto error;
196450ee6061SAndrew J. Bennieston 		}
196550ee6061SAndrew J. Bennieston 	}
196650ee6061SAndrew J. Bennieston 
196750ee6061SAndrew J. Bennieston 	if (write_hierarchical)
196850ee6061SAndrew J. Bennieston 		kfree(path);
196950ee6061SAndrew J. Bennieston 	return 0;
197050ee6061SAndrew J. Bennieston 
197150ee6061SAndrew J. Bennieston error:
197250ee6061SAndrew J. Bennieston 	if (write_hierarchical)
197350ee6061SAndrew J. Bennieston 		kfree(path);
197450ee6061SAndrew J. Bennieston 	xenbus_dev_fatal(dev, err, "%s", message);
197550ee6061SAndrew J. Bennieston 	return err;
197650ee6061SAndrew J. Bennieston }
197750ee6061SAndrew J. Bennieston 
1978ce58725fSDavid Vrabel static void xennet_destroy_queues(struct netfront_info *info)
1979ce58725fSDavid Vrabel {
1980ce58725fSDavid Vrabel 	unsigned int i;
1981ce58725fSDavid Vrabel 
1982ce58725fSDavid Vrabel 	for (i = 0; i < info->netdev->real_num_tx_queues; i++) {
1983ce58725fSDavid Vrabel 		struct netfront_queue *queue = &info->queues[i];
1984ce58725fSDavid Vrabel 
1985ce58725fSDavid Vrabel 		if (netif_running(info->netdev))
1986ce58725fSDavid Vrabel 			napi_disable(&queue->napi);
1987ce58725fSDavid Vrabel 		netif_napi_del(&queue->napi);
1988ce58725fSDavid Vrabel 	}
1989ce58725fSDavid Vrabel 
1990ce58725fSDavid Vrabel 	kfree(info->queues);
1991ce58725fSDavid Vrabel 	info->queues = NULL;
1992ce58725fSDavid Vrabel }
1993ce58725fSDavid Vrabel 
19946c5aa6fcSDenis Kirjanov 
19956c5aa6fcSDenis Kirjanov 
19966c5aa6fcSDenis Kirjanov static int xennet_create_page_pool(struct netfront_queue *queue)
19976c5aa6fcSDenis Kirjanov {
19986c5aa6fcSDenis Kirjanov 	int err;
19996c5aa6fcSDenis Kirjanov 	struct page_pool_params pp_params = {
20006c5aa6fcSDenis Kirjanov 		.order = 0,
20016c5aa6fcSDenis Kirjanov 		.flags = 0,
20026c5aa6fcSDenis Kirjanov 		.pool_size = NET_RX_RING_SIZE,
20036c5aa6fcSDenis Kirjanov 		.nid = NUMA_NO_NODE,
20046c5aa6fcSDenis Kirjanov 		.dev = &queue->info->netdev->dev,
20056c5aa6fcSDenis Kirjanov 		.offset = XDP_PACKET_HEADROOM,
20066c5aa6fcSDenis Kirjanov 		.max_len = XEN_PAGE_SIZE - XDP_PACKET_HEADROOM,
20076c5aa6fcSDenis Kirjanov 	};
20086c5aa6fcSDenis Kirjanov 
20096c5aa6fcSDenis Kirjanov 	queue->page_pool = page_pool_create(&pp_params);
20106c5aa6fcSDenis Kirjanov 	if (IS_ERR(queue->page_pool)) {
20116c5aa6fcSDenis Kirjanov 		err = PTR_ERR(queue->page_pool);
20126c5aa6fcSDenis Kirjanov 		queue->page_pool = NULL;
20136c5aa6fcSDenis Kirjanov 		return err;
20146c5aa6fcSDenis Kirjanov 	}
20156c5aa6fcSDenis Kirjanov 
20166c5aa6fcSDenis Kirjanov 	err = xdp_rxq_info_reg(&queue->xdp_rxq, queue->info->netdev,
2017b02e5a0eSBjörn Töpel 			       queue->id, 0);
20186c5aa6fcSDenis Kirjanov 	if (err) {
20196c5aa6fcSDenis Kirjanov 		netdev_err(queue->info->netdev, "xdp_rxq_info_reg failed\n");
20206c5aa6fcSDenis Kirjanov 		goto err_free_pp;
20216c5aa6fcSDenis Kirjanov 	}
20226c5aa6fcSDenis Kirjanov 
20236c5aa6fcSDenis Kirjanov 	err = xdp_rxq_info_reg_mem_model(&queue->xdp_rxq,
20246c5aa6fcSDenis Kirjanov 					 MEM_TYPE_PAGE_POOL, queue->page_pool);
20256c5aa6fcSDenis Kirjanov 	if (err) {
20266c5aa6fcSDenis Kirjanov 		netdev_err(queue->info->netdev, "xdp_rxq_info_reg_mem_model failed\n");
20276c5aa6fcSDenis Kirjanov 		goto err_unregister_rxq;
20286c5aa6fcSDenis Kirjanov 	}
20296c5aa6fcSDenis Kirjanov 	return 0;
20306c5aa6fcSDenis Kirjanov 
20316c5aa6fcSDenis Kirjanov err_unregister_rxq:
20326c5aa6fcSDenis Kirjanov 	xdp_rxq_info_unreg(&queue->xdp_rxq);
20336c5aa6fcSDenis Kirjanov err_free_pp:
20346c5aa6fcSDenis Kirjanov 	page_pool_destroy(queue->page_pool);
20356c5aa6fcSDenis Kirjanov 	queue->page_pool = NULL;
20366c5aa6fcSDenis Kirjanov 	return err;
20376c5aa6fcSDenis Kirjanov }
20386c5aa6fcSDenis Kirjanov 
2039ce58725fSDavid Vrabel static int xennet_create_queues(struct netfront_info *info,
2040ca88ea12SJoe Jin 				unsigned int *num_queues)
2041ce58725fSDavid Vrabel {
2042ce58725fSDavid Vrabel 	unsigned int i;
2043ce58725fSDavid Vrabel 	int ret;
2044ce58725fSDavid Vrabel 
2045ca88ea12SJoe Jin 	info->queues = kcalloc(*num_queues, sizeof(struct netfront_queue),
2046ce58725fSDavid Vrabel 			       GFP_KERNEL);
2047ce58725fSDavid Vrabel 	if (!info->queues)
2048ce58725fSDavid Vrabel 		return -ENOMEM;
2049ce58725fSDavid Vrabel 
2050ca88ea12SJoe Jin 	for (i = 0; i < *num_queues; i++) {
2051ce58725fSDavid Vrabel 		struct netfront_queue *queue = &info->queues[i];
2052ce58725fSDavid Vrabel 
2053ce58725fSDavid Vrabel 		queue->id = i;
2054ce58725fSDavid Vrabel 		queue->info = info;
2055ce58725fSDavid Vrabel 
2056ce58725fSDavid Vrabel 		ret = xennet_init_queue(queue);
2057ce58725fSDavid Vrabel 		if (ret < 0) {
2058f599c64fSRoss Lagerwall 			dev_warn(&info->xbdev->dev,
205969cb8524SDavid Vrabel 				 "only created %d queues\n", i);
2060ca88ea12SJoe Jin 			*num_queues = i;
2061ce58725fSDavid Vrabel 			break;
2062ce58725fSDavid Vrabel 		}
2063ce58725fSDavid Vrabel 
20646c5aa6fcSDenis Kirjanov 		/* use page pool recycling instead of buddy allocator */
20656c5aa6fcSDenis Kirjanov 		ret = xennet_create_page_pool(queue);
20666c5aa6fcSDenis Kirjanov 		if (ret < 0) {
20676c5aa6fcSDenis Kirjanov 			dev_err(&info->xbdev->dev, "can't allocate page pool\n");
20686c5aa6fcSDenis Kirjanov 			*num_queues = i;
20696c5aa6fcSDenis Kirjanov 			return ret;
20706c5aa6fcSDenis Kirjanov 		}
20716c5aa6fcSDenis Kirjanov 
2072ce58725fSDavid Vrabel 		netif_napi_add(queue->info->netdev, &queue->napi,
2073ce58725fSDavid Vrabel 			       xennet_poll, 64);
2074ce58725fSDavid Vrabel 		if (netif_running(info->netdev))
2075ce58725fSDavid Vrabel 			napi_enable(&queue->napi);
2076ce58725fSDavid Vrabel 	}
2077ce58725fSDavid Vrabel 
2078ca88ea12SJoe Jin 	netif_set_real_num_tx_queues(info->netdev, *num_queues);
2079ce58725fSDavid Vrabel 
2080ca88ea12SJoe Jin 	if (*num_queues == 0) {
2081f599c64fSRoss Lagerwall 		dev_err(&info->xbdev->dev, "no queues\n");
2082ce58725fSDavid Vrabel 		return -EINVAL;
2083ce58725fSDavid Vrabel 	}
2084ce58725fSDavid Vrabel 	return 0;
2085ce58725fSDavid Vrabel }
2086ce58725fSDavid Vrabel 
20870d160211SJeremy Fitzhardinge /* Common code used when first setting up, and when resuming. */
2088f502bf2bSIan Campbell static int talk_to_netback(struct xenbus_device *dev,
20890d160211SJeremy Fitzhardinge 			   struct netfront_info *info)
20900d160211SJeremy Fitzhardinge {
20910d160211SJeremy Fitzhardinge 	const char *message;
20920d160211SJeremy Fitzhardinge 	struct xenbus_transaction xbt;
20930d160211SJeremy Fitzhardinge 	int err;
20942688fcb7SAndrew J. Bennieston 	unsigned int feature_split_evtchn;
20952688fcb7SAndrew J. Bennieston 	unsigned int i = 0;
209650ee6061SAndrew J. Bennieston 	unsigned int max_queues = 0;
20972688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = NULL;
20982688fcb7SAndrew J. Bennieston 	unsigned int num_queues = 1;
20990d160211SJeremy Fitzhardinge 
21002688fcb7SAndrew J. Bennieston 	info->netdev->irq = 0;
21012688fcb7SAndrew J. Bennieston 
210250ee6061SAndrew J. Bennieston 	/* Check if backend supports multiple queues */
21032890ea5cSJuergen Gross 	max_queues = xenbus_read_unsigned(info->xbdev->otherend,
21042890ea5cSJuergen Gross 					  "multi-queue-max-queues", 1);
210550ee6061SAndrew J. Bennieston 	num_queues = min(max_queues, xennet_max_queues);
210650ee6061SAndrew J. Bennieston 
21072688fcb7SAndrew J. Bennieston 	/* Check feature-split-event-channels */
21082890ea5cSJuergen Gross 	feature_split_evtchn = xenbus_read_unsigned(info->xbdev->otherend,
21092890ea5cSJuergen Gross 					"feature-split-event-channels", 0);
21102688fcb7SAndrew J. Bennieston 
21112688fcb7SAndrew J. Bennieston 	/* Read mac addr. */
21122688fcb7SAndrew J. Bennieston 	err = xen_net_read_mac(dev, info->netdev->dev_addr);
21132688fcb7SAndrew J. Bennieston 	if (err) {
21142688fcb7SAndrew J. Bennieston 		xenbus_dev_fatal(dev, err, "parsing %s/mac", dev->nodename);
2115cb257783SRoss Lagerwall 		goto out_unlocked;
21162688fcb7SAndrew J. Bennieston 	}
21172688fcb7SAndrew J. Bennieston 
21186c5aa6fcSDenis Kirjanov 	info->netback_has_xdp_headroom = xenbus_read_unsigned(info->xbdev->otherend,
21196c5aa6fcSDenis Kirjanov 							      "feature-xdp-headroom", 0);
21206c5aa6fcSDenis Kirjanov 	if (info->netback_has_xdp_headroom) {
21216c5aa6fcSDenis Kirjanov 		/* set the current xen-netfront xdp state */
21226c5aa6fcSDenis Kirjanov 		err = talk_to_netback_xdp(info, info->netfront_xdp_enabled ?
21236c5aa6fcSDenis Kirjanov 					  NETBACK_XDP_HEADROOM_ENABLE :
21246c5aa6fcSDenis Kirjanov 					  NETBACK_XDP_HEADROOM_DISABLE);
21256c5aa6fcSDenis Kirjanov 		if (err)
21266c5aa6fcSDenis Kirjanov 			goto out_unlocked;
21276c5aa6fcSDenis Kirjanov 	}
21286c5aa6fcSDenis Kirjanov 
2129f599c64fSRoss Lagerwall 	rtnl_lock();
2130ce58725fSDavid Vrabel 	if (info->queues)
2131ce58725fSDavid Vrabel 		xennet_destroy_queues(info);
2132ce58725fSDavid Vrabel 
2133ca88ea12SJoe Jin 	err = xennet_create_queues(info, &num_queues);
2134e2e004acSRoss Lagerwall 	if (err < 0) {
2135e2e004acSRoss Lagerwall 		xenbus_dev_fatal(dev, err, "creating queues");
2136e2e004acSRoss Lagerwall 		kfree(info->queues);
2137e2e004acSRoss Lagerwall 		info->queues = NULL;
2138e2e004acSRoss Lagerwall 		goto out;
2139e2e004acSRoss Lagerwall 	}
2140f599c64fSRoss Lagerwall 	rtnl_unlock();
21412688fcb7SAndrew J. Bennieston 
21422688fcb7SAndrew J. Bennieston 	/* Create shared ring, alloc event channel -- for each queue */
21432688fcb7SAndrew J. Bennieston 	for (i = 0; i < num_queues; ++i) {
21442688fcb7SAndrew J. Bennieston 		queue = &info->queues[i];
21452688fcb7SAndrew J. Bennieston 		err = setup_netfront(dev, queue, feature_split_evtchn);
2146e2e004acSRoss Lagerwall 		if (err)
21472688fcb7SAndrew J. Bennieston 			goto destroy_ring;
21482688fcb7SAndrew J. Bennieston 	}
21490d160211SJeremy Fitzhardinge 
21500d160211SJeremy Fitzhardinge again:
21510d160211SJeremy Fitzhardinge 	err = xenbus_transaction_start(&xbt);
21520d160211SJeremy Fitzhardinge 	if (err) {
21530d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "starting transaction");
21540d160211SJeremy Fitzhardinge 		goto destroy_ring;
21550d160211SJeremy Fitzhardinge 	}
21560d160211SJeremy Fitzhardinge 
2157812494d9Schas williams 	if (xenbus_exists(XBT_NIL,
2158812494d9Schas williams 			  info->xbdev->otherend, "multi-queue-max-queues")) {
2159812494d9Schas williams 		/* Write the number of queues */
2160812494d9Schas williams 		err = xenbus_printf(xbt, dev->nodename,
2161812494d9Schas williams 				    "multi-queue-num-queues", "%u", num_queues);
2162812494d9Schas williams 		if (err) {
2163812494d9Schas williams 			message = "writing multi-queue-num-queues";
2164812494d9Schas williams 			goto abort_transaction_no_dev_fatal;
2165812494d9Schas williams 		}
2166812494d9Schas williams 	}
2167812494d9Schas williams 
216850ee6061SAndrew J. Bennieston 	if (num_queues == 1) {
216950ee6061SAndrew J. Bennieston 		err = write_queue_xenstore_keys(&info->queues[0], &xbt, 0); /* flat */
217050ee6061SAndrew J. Bennieston 		if (err)
217150ee6061SAndrew J. Bennieston 			goto abort_transaction_no_dev_fatal;
2172d634bf2cSWei Liu 	} else {
217350ee6061SAndrew J. Bennieston 		/* Write the keys for each queue */
217450ee6061SAndrew J. Bennieston 		for (i = 0; i < num_queues; ++i) {
217550ee6061SAndrew J. Bennieston 			queue = &info->queues[i];
217650ee6061SAndrew J. Bennieston 			err = write_queue_xenstore_keys(queue, &xbt, 1); /* hierarchical */
217750ee6061SAndrew J. Bennieston 			if (err)
217850ee6061SAndrew J. Bennieston 				goto abort_transaction_no_dev_fatal;
2179d634bf2cSWei Liu 		}
2180d634bf2cSWei Liu 	}
21810d160211SJeremy Fitzhardinge 
218250ee6061SAndrew J. Bennieston 	/* The remaining keys are not queue-specific */
21830d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "request-rx-copy", "%u",
21840d160211SJeremy Fitzhardinge 			    1);
21850d160211SJeremy Fitzhardinge 	if (err) {
21860d160211SJeremy Fitzhardinge 		message = "writing request-rx-copy";
21870d160211SJeremy Fitzhardinge 		goto abort_transaction;
21880d160211SJeremy Fitzhardinge 	}
21890d160211SJeremy Fitzhardinge 
21900d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-rx-notify", "%d", 1);
21910d160211SJeremy Fitzhardinge 	if (err) {
21920d160211SJeremy Fitzhardinge 		message = "writing feature-rx-notify";
21930d160211SJeremy Fitzhardinge 		goto abort_transaction;
21940d160211SJeremy Fitzhardinge 	}
21950d160211SJeremy Fitzhardinge 
21960d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-sg", "%d", 1);
21970d160211SJeremy Fitzhardinge 	if (err) {
21980d160211SJeremy Fitzhardinge 		message = "writing feature-sg";
21990d160211SJeremy Fitzhardinge 		goto abort_transaction;
22000d160211SJeremy Fitzhardinge 	}
22010d160211SJeremy Fitzhardinge 
22020d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-gso-tcpv4", "%d", 1);
22030d160211SJeremy Fitzhardinge 	if (err) {
22040d160211SJeremy Fitzhardinge 		message = "writing feature-gso-tcpv4";
22050d160211SJeremy Fitzhardinge 		goto abort_transaction;
22060d160211SJeremy Fitzhardinge 	}
22070d160211SJeremy Fitzhardinge 
22082c0057deSPaul Durrant 	err = xenbus_write(xbt, dev->nodename, "feature-gso-tcpv6", "1");
22092c0057deSPaul Durrant 	if (err) {
22102c0057deSPaul Durrant 		message = "writing feature-gso-tcpv6";
22112c0057deSPaul Durrant 		goto abort_transaction;
22122c0057deSPaul Durrant 	}
22132c0057deSPaul Durrant 
22142c0057deSPaul Durrant 	err = xenbus_write(xbt, dev->nodename, "feature-ipv6-csum-offload",
22152c0057deSPaul Durrant 			   "1");
22162c0057deSPaul Durrant 	if (err) {
22172c0057deSPaul Durrant 		message = "writing feature-ipv6-csum-offload";
22182c0057deSPaul Durrant 		goto abort_transaction;
22192c0057deSPaul Durrant 	}
22202c0057deSPaul Durrant 
22210d160211SJeremy Fitzhardinge 	err = xenbus_transaction_end(xbt, 0);
22220d160211SJeremy Fitzhardinge 	if (err) {
22230d160211SJeremy Fitzhardinge 		if (err == -EAGAIN)
22240d160211SJeremy Fitzhardinge 			goto again;
22250d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "completing transaction");
22260d160211SJeremy Fitzhardinge 		goto destroy_ring;
22270d160211SJeremy Fitzhardinge 	}
22280d160211SJeremy Fitzhardinge 
22290d160211SJeremy Fitzhardinge 	return 0;
22300d160211SJeremy Fitzhardinge 
22310d160211SJeremy Fitzhardinge  abort_transaction:
22320d160211SJeremy Fitzhardinge 	xenbus_dev_fatal(dev, err, "%s", message);
223350ee6061SAndrew J. Bennieston abort_transaction_no_dev_fatal:
223450ee6061SAndrew J. Bennieston 	xenbus_transaction_end(xbt, 1);
22350d160211SJeremy Fitzhardinge  destroy_ring:
22360d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
2237f599c64fSRoss Lagerwall 	rtnl_lock();
2238e2e004acSRoss Lagerwall 	xennet_destroy_queues(info);
22390d160211SJeremy Fitzhardinge  out:
2240f599c64fSRoss Lagerwall 	rtnl_unlock();
2241cb257783SRoss Lagerwall out_unlocked:
2242d86b5672SVitaly Kuznetsov 	device_unregister(&dev->dev);
22430d160211SJeremy Fitzhardinge 	return err;
22440d160211SJeremy Fitzhardinge }
22450d160211SJeremy Fitzhardinge 
22460d160211SJeremy Fitzhardinge static int xennet_connect(struct net_device *dev)
22470d160211SJeremy Fitzhardinge {
22480d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
22492688fcb7SAndrew J. Bennieston 	unsigned int num_queues = 0;
2250a5b5dc3cSDavid Vrabel 	int err;
22512688fcb7SAndrew J. Bennieston 	unsigned int j = 0;
22522688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = NULL;
22530d160211SJeremy Fitzhardinge 
22542890ea5cSJuergen Gross 	if (!xenbus_read_unsigned(np->xbdev->otherend, "feature-rx-copy", 0)) {
22550d160211SJeremy Fitzhardinge 		dev_info(&dev->dev,
2256898eb71cSJoe Perches 			 "backend does not support copying receive path\n");
22570d160211SJeremy Fitzhardinge 		return -ENODEV;
22580d160211SJeremy Fitzhardinge 	}
22590d160211SJeremy Fitzhardinge 
2260f502bf2bSIan Campbell 	err = talk_to_netback(np->xbdev, np);
22610d160211SJeremy Fitzhardinge 	if (err)
22620d160211SJeremy Fitzhardinge 		return err;
22636c5aa6fcSDenis Kirjanov 	if (np->netback_has_xdp_headroom)
22646c5aa6fcSDenis Kirjanov 		pr_info("backend supports XDP headroom\n");
22650d160211SJeremy Fitzhardinge 
22662688fcb7SAndrew J. Bennieston 	/* talk_to_netback() sets the correct number of queues */
22672688fcb7SAndrew J. Bennieston 	num_queues = dev->real_num_tx_queues;
22682688fcb7SAndrew J. Bennieston 
2269f599c64fSRoss Lagerwall 	if (dev->reg_state == NETREG_UNINITIALIZED) {
2270f599c64fSRoss Lagerwall 		err = register_netdev(dev);
2271f599c64fSRoss Lagerwall 		if (err) {
2272f599c64fSRoss Lagerwall 			pr_warn("%s: register_netdev err=%d\n", __func__, err);
2273f599c64fSRoss Lagerwall 			device_unregister(&np->xbdev->dev);
2274f599c64fSRoss Lagerwall 			return err;
2275f599c64fSRoss Lagerwall 		}
2276f599c64fSRoss Lagerwall 	}
2277f599c64fSRoss Lagerwall 
227845c8184cSRoss Lagerwall 	rtnl_lock();
227945c8184cSRoss Lagerwall 	netdev_update_features(dev);
228045c8184cSRoss Lagerwall 	rtnl_unlock();
228145c8184cSRoss Lagerwall 
22820d160211SJeremy Fitzhardinge 	/*
2283a5b5dc3cSDavid Vrabel 	 * All public and private state should now be sane.  Get
22840d160211SJeremy Fitzhardinge 	 * ready to start sending and receiving packets and give the driver
22850d160211SJeremy Fitzhardinge 	 * domain a kick because we've probably just requeued some
22860d160211SJeremy Fitzhardinge 	 * packets.
22870d160211SJeremy Fitzhardinge 	 */
22880d160211SJeremy Fitzhardinge 	netif_carrier_on(np->netdev);
22892688fcb7SAndrew J. Bennieston 	for (j = 0; j < num_queues; ++j) {
22902688fcb7SAndrew J. Bennieston 		queue = &np->queues[j];
2291f50b4076SDavid Vrabel 
22922688fcb7SAndrew J. Bennieston 		notify_remote_via_irq(queue->tx_irq);
22932688fcb7SAndrew J. Bennieston 		if (queue->tx_irq != queue->rx_irq)
22942688fcb7SAndrew J. Bennieston 			notify_remote_via_irq(queue->rx_irq);
22950d160211SJeremy Fitzhardinge 
2296f50b4076SDavid Vrabel 		spin_lock_irq(&queue->tx_lock);
2297f50b4076SDavid Vrabel 		xennet_tx_buf_gc(queue);
22982688fcb7SAndrew J. Bennieston 		spin_unlock_irq(&queue->tx_lock);
2299f50b4076SDavid Vrabel 
2300f50b4076SDavid Vrabel 		spin_lock_bh(&queue->rx_lock);
2301f50b4076SDavid Vrabel 		xennet_alloc_rx_buffers(queue);
23022688fcb7SAndrew J. Bennieston 		spin_unlock_bh(&queue->rx_lock);
23032688fcb7SAndrew J. Bennieston 	}
23040d160211SJeremy Fitzhardinge 
23050d160211SJeremy Fitzhardinge 	return 0;
23060d160211SJeremy Fitzhardinge }
23070d160211SJeremy Fitzhardinge 
23080d160211SJeremy Fitzhardinge /**
23090d160211SJeremy Fitzhardinge  * Callback received when the backend's state changes.
23100d160211SJeremy Fitzhardinge  */
2311f502bf2bSIan Campbell static void netback_changed(struct xenbus_device *dev,
23120d160211SJeremy Fitzhardinge 			    enum xenbus_state backend_state)
23130d160211SJeremy Fitzhardinge {
23141b713e00SGreg Kroah-Hartman 	struct netfront_info *np = dev_get_drvdata(&dev->dev);
23150d160211SJeremy Fitzhardinge 	struct net_device *netdev = np->netdev;
23160d160211SJeremy Fitzhardinge 
23170d160211SJeremy Fitzhardinge 	dev_dbg(&dev->dev, "%s\n", xenbus_strstate(backend_state));
23180d160211SJeremy Fitzhardinge 
23198edfe2e9SJuergen Gross 	wake_up_all(&module_wq);
23208edfe2e9SJuergen Gross 
23210d160211SJeremy Fitzhardinge 	switch (backend_state) {
23220d160211SJeremy Fitzhardinge 	case XenbusStateInitialising:
23230d160211SJeremy Fitzhardinge 	case XenbusStateInitialised:
2324b78c9512SNoboru Iwamatsu 	case XenbusStateReconfiguring:
2325b78c9512SNoboru Iwamatsu 	case XenbusStateReconfigured:
23260d160211SJeremy Fitzhardinge 	case XenbusStateUnknown:
23270d160211SJeremy Fitzhardinge 		break;
23280d160211SJeremy Fitzhardinge 
23290d160211SJeremy Fitzhardinge 	case XenbusStateInitWait:
23300d160211SJeremy Fitzhardinge 		if (dev->state != XenbusStateInitialising)
23310d160211SJeremy Fitzhardinge 			break;
23320d160211SJeremy Fitzhardinge 		if (xennet_connect(netdev) != 0)
23330d160211SJeremy Fitzhardinge 			break;
23340d160211SJeremy Fitzhardinge 		xenbus_switch_state(dev, XenbusStateConnected);
233508e34eb1SLaszlo Ersek 		break;
233608e34eb1SLaszlo Ersek 
233708e34eb1SLaszlo Ersek 	case XenbusStateConnected:
2338ee89bab1SAmerigo Wang 		netdev_notify_peers(netdev);
23390d160211SJeremy Fitzhardinge 		break;
23400d160211SJeremy Fitzhardinge 
2341bce3ea81SDavid Vrabel 	case XenbusStateClosed:
2342bce3ea81SDavid Vrabel 		if (dev->state == XenbusStateClosed)
2343bce3ea81SDavid Vrabel 			break;
2344df561f66SGustavo A. R. Silva 		fallthrough;	/* Missed the backend's CLOSING state */
23450d160211SJeremy Fitzhardinge 	case XenbusStateClosing:
23460d160211SJeremy Fitzhardinge 		xenbus_frontend_closed(dev);
23470d160211SJeremy Fitzhardinge 		break;
23480d160211SJeremy Fitzhardinge 	}
23490d160211SJeremy Fitzhardinge }
23500d160211SJeremy Fitzhardinge 
2351e0ce4af9SIan Campbell static const struct xennet_stat {
2352e0ce4af9SIan Campbell 	char name[ETH_GSTRING_LEN];
2353e0ce4af9SIan Campbell 	u16 offset;
2354e0ce4af9SIan Campbell } xennet_stats[] = {
2355e0ce4af9SIan Campbell 	{
2356e0ce4af9SIan Campbell 		"rx_gso_checksum_fixup",
2357e0ce4af9SIan Campbell 		offsetof(struct netfront_info, rx_gso_checksum_fixup)
2358e0ce4af9SIan Campbell 	},
2359e0ce4af9SIan Campbell };
2360e0ce4af9SIan Campbell 
2361e0ce4af9SIan Campbell static int xennet_get_sset_count(struct net_device *dev, int string_set)
2362e0ce4af9SIan Campbell {
2363e0ce4af9SIan Campbell 	switch (string_set) {
2364e0ce4af9SIan Campbell 	case ETH_SS_STATS:
2365e0ce4af9SIan Campbell 		return ARRAY_SIZE(xennet_stats);
2366e0ce4af9SIan Campbell 	default:
2367e0ce4af9SIan Campbell 		return -EINVAL;
2368e0ce4af9SIan Campbell 	}
2369e0ce4af9SIan Campbell }
2370e0ce4af9SIan Campbell 
2371e0ce4af9SIan Campbell static void xennet_get_ethtool_stats(struct net_device *dev,
2372e0ce4af9SIan Campbell 				     struct ethtool_stats *stats, u64 * data)
2373e0ce4af9SIan Campbell {
2374e0ce4af9SIan Campbell 	void *np = netdev_priv(dev);
2375e0ce4af9SIan Campbell 	int i;
2376e0ce4af9SIan Campbell 
2377e0ce4af9SIan Campbell 	for (i = 0; i < ARRAY_SIZE(xennet_stats); i++)
23782688fcb7SAndrew J. Bennieston 		data[i] = atomic_read((atomic_t *)(np + xennet_stats[i].offset));
2379e0ce4af9SIan Campbell }
2380e0ce4af9SIan Campbell 
2381e0ce4af9SIan Campbell static void xennet_get_strings(struct net_device *dev, u32 stringset, u8 * data)
2382e0ce4af9SIan Campbell {
2383e0ce4af9SIan Campbell 	int i;
2384e0ce4af9SIan Campbell 
2385e0ce4af9SIan Campbell 	switch (stringset) {
2386e0ce4af9SIan Campbell 	case ETH_SS_STATS:
2387e0ce4af9SIan Campbell 		for (i = 0; i < ARRAY_SIZE(xennet_stats); i++)
2388e0ce4af9SIan Campbell 			memcpy(data + i * ETH_GSTRING_LEN,
2389e0ce4af9SIan Campbell 			       xennet_stats[i].name, ETH_GSTRING_LEN);
2390e0ce4af9SIan Campbell 		break;
2391e0ce4af9SIan Campbell 	}
2392e0ce4af9SIan Campbell }
2393e0ce4af9SIan Campbell 
23940fc0b732SStephen Hemminger static const struct ethtool_ops xennet_ethtool_ops =
23950d160211SJeremy Fitzhardinge {
23960d160211SJeremy Fitzhardinge 	.get_link = ethtool_op_get_link,
2397e0ce4af9SIan Campbell 
2398e0ce4af9SIan Campbell 	.get_sset_count = xennet_get_sset_count,
2399e0ce4af9SIan Campbell 	.get_ethtool_stats = xennet_get_ethtool_stats,
2400e0ce4af9SIan Campbell 	.get_strings = xennet_get_strings,
240191ffb9d3SDaniel Drown 	.get_ts_info = ethtool_op_get_ts_info,
24020d160211SJeremy Fitzhardinge };
24030d160211SJeremy Fitzhardinge 
24040d160211SJeremy Fitzhardinge #ifdef CONFIG_SYSFS
24051f3c2ebaSDavid Vrabel static ssize_t show_rxbuf(struct device *dev,
24060d160211SJeremy Fitzhardinge 			  struct device_attribute *attr, char *buf)
24070d160211SJeremy Fitzhardinge {
24081f3c2ebaSDavid Vrabel 	return sprintf(buf, "%lu\n", NET_RX_RING_SIZE);
24090d160211SJeremy Fitzhardinge }
24100d160211SJeremy Fitzhardinge 
24111f3c2ebaSDavid Vrabel static ssize_t store_rxbuf(struct device *dev,
24120d160211SJeremy Fitzhardinge 			   struct device_attribute *attr,
24130d160211SJeremy Fitzhardinge 			   const char *buf, size_t len)
24140d160211SJeremy Fitzhardinge {
24150d160211SJeremy Fitzhardinge 	char *endp;
24160d160211SJeremy Fitzhardinge 
24170d160211SJeremy Fitzhardinge 	if (!capable(CAP_NET_ADMIN))
24180d160211SJeremy Fitzhardinge 		return -EPERM;
24190d160211SJeremy Fitzhardinge 
24208ed7ec13SAndrew Lunn 	simple_strtoul(buf, &endp, 0);
24210d160211SJeremy Fitzhardinge 	if (endp == buf)
24220d160211SJeremy Fitzhardinge 		return -EBADMSG;
24230d160211SJeremy Fitzhardinge 
24241f3c2ebaSDavid Vrabel 	/* rxbuf_min and rxbuf_max are no longer configurable. */
24250d160211SJeremy Fitzhardinge 
24260d160211SJeremy Fitzhardinge 	return len;
24270d160211SJeremy Fitzhardinge }
24280d160211SJeremy Fitzhardinge 
2429d61e4038SJoe Perches static DEVICE_ATTR(rxbuf_min, 0644, show_rxbuf, store_rxbuf);
2430d61e4038SJoe Perches static DEVICE_ATTR(rxbuf_max, 0644, show_rxbuf, store_rxbuf);
2431d61e4038SJoe Perches static DEVICE_ATTR(rxbuf_cur, 0444, show_rxbuf, NULL);
243227b917e5STakashi Iwai 
243327b917e5STakashi Iwai static struct attribute *xennet_dev_attrs[] = {
243427b917e5STakashi Iwai 	&dev_attr_rxbuf_min.attr,
243527b917e5STakashi Iwai 	&dev_attr_rxbuf_max.attr,
243627b917e5STakashi Iwai 	&dev_attr_rxbuf_cur.attr,
243727b917e5STakashi Iwai 	NULL
24380d160211SJeremy Fitzhardinge };
24390d160211SJeremy Fitzhardinge 
244027b917e5STakashi Iwai static const struct attribute_group xennet_dev_group = {
244127b917e5STakashi Iwai 	.attrs = xennet_dev_attrs
244227b917e5STakashi Iwai };
24430d160211SJeremy Fitzhardinge #endif /* CONFIG_SYSFS */
24440d160211SJeremy Fitzhardinge 
2445c2c63310SAndrea Righi static void xennet_bus_close(struct xenbus_device *dev)
2446c2c63310SAndrea Righi {
2447c2c63310SAndrea Righi 	int ret;
2448c2c63310SAndrea Righi 
2449c2c63310SAndrea Righi 	if (xenbus_read_driver_state(dev->otherend) == XenbusStateClosed)
2450c2c63310SAndrea Righi 		return;
2451c2c63310SAndrea Righi 	do {
2452c2c63310SAndrea Righi 		xenbus_switch_state(dev, XenbusStateClosing);
2453c2c63310SAndrea Righi 		ret = wait_event_timeout(module_wq,
2454c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2455c2c63310SAndrea Righi 				   XenbusStateClosing ||
2456c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2457c2c63310SAndrea Righi 				   XenbusStateClosed ||
2458c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2459c2c63310SAndrea Righi 				   XenbusStateUnknown,
2460c2c63310SAndrea Righi 				   XENNET_TIMEOUT);
2461c2c63310SAndrea Righi 	} while (!ret);
2462c2c63310SAndrea Righi 
2463c2c63310SAndrea Righi 	if (xenbus_read_driver_state(dev->otherend) == XenbusStateClosed)
2464c2c63310SAndrea Righi 		return;
2465c2c63310SAndrea Righi 
2466c2c63310SAndrea Righi 	do {
2467c2c63310SAndrea Righi 		xenbus_switch_state(dev, XenbusStateClosed);
2468c2c63310SAndrea Righi 		ret = wait_event_timeout(module_wq,
2469c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2470c2c63310SAndrea Righi 				   XenbusStateClosed ||
2471c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2472c2c63310SAndrea Righi 				   XenbusStateUnknown,
2473c2c63310SAndrea Righi 				   XENNET_TIMEOUT);
2474c2c63310SAndrea Righi 	} while (!ret);
2475c2c63310SAndrea Righi }
2476c2c63310SAndrea Righi 
24778e0e46bbSBill Pemberton static int xennet_remove(struct xenbus_device *dev)
24780d160211SJeremy Fitzhardinge {
24791b713e00SGreg Kroah-Hartman 	struct netfront_info *info = dev_get_drvdata(&dev->dev);
24800d160211SJeremy Fitzhardinge 
2481c2c63310SAndrea Righi 	xennet_bus_close(dev);
24820d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
24830d160211SJeremy Fitzhardinge 
2484f599c64fSRoss Lagerwall 	if (info->netdev->reg_state == NETREG_REGISTERED)
24856bc96d04SIan Campbell 		unregister_netdev(info->netdev);
24866bc96d04SIan Campbell 
2487f599c64fSRoss Lagerwall 	if (info->queues) {
2488f599c64fSRoss Lagerwall 		rtnl_lock();
2489ad068118SDavid Vrabel 		xennet_destroy_queues(info);
2490f599c64fSRoss Lagerwall 		rtnl_unlock();
2491f599c64fSRoss Lagerwall 	}
2492900e1833SDavid Vrabel 	xennet_free_netdev(info->netdev);
24930d160211SJeremy Fitzhardinge 
24940d160211SJeremy Fitzhardinge 	return 0;
24950d160211SJeremy Fitzhardinge }
24960d160211SJeremy Fitzhardinge 
249795afae48SDavid Vrabel static const struct xenbus_device_id netfront_ids[] = {
249895afae48SDavid Vrabel 	{ "vif" },
249995afae48SDavid Vrabel 	{ "" }
250095afae48SDavid Vrabel };
250195afae48SDavid Vrabel 
250295afae48SDavid Vrabel static struct xenbus_driver netfront_driver = {
250395afae48SDavid Vrabel 	.ids = netfront_ids,
25040d160211SJeremy Fitzhardinge 	.probe = netfront_probe,
25058e0e46bbSBill Pemberton 	.remove = xennet_remove,
25060d160211SJeremy Fitzhardinge 	.resume = netfront_resume,
2507f502bf2bSIan Campbell 	.otherend_changed = netback_changed,
250895afae48SDavid Vrabel };
25090d160211SJeremy Fitzhardinge 
25100d160211SJeremy Fitzhardinge static int __init netif_init(void)
25110d160211SJeremy Fitzhardinge {
25126e833587SJeremy Fitzhardinge 	if (!xen_domain())
25130d160211SJeremy Fitzhardinge 		return -ENODEV;
25140d160211SJeremy Fitzhardinge 
251551c71a3bSKonrad Rzeszutek Wilk 	if (!xen_has_pv_nic_devices())
2516b9136d20SIgor Mammedov 		return -ENODEV;
2517b9136d20SIgor Mammedov 
2518383eda32SJoe Perches 	pr_info("Initialising Xen virtual ethernet driver\n");
25190d160211SJeremy Fitzhardinge 
2520034702a6SJuergen Gross 	/* Allow as many queues as there are CPUs inut max. 8 if user has not
252132a84405SWei Liu 	 * specified a value.
252232a84405SWei Liu 	 */
252332a84405SWei Liu 	if (xennet_max_queues == 0)
2524034702a6SJuergen Gross 		xennet_max_queues = min_t(unsigned int, MAX_QUEUES_DEFAULT,
2525034702a6SJuergen Gross 					  num_online_cpus());
252650ee6061SAndrew J. Bennieston 
2527ffb78a26SAl Viro 	return xenbus_register_frontend(&netfront_driver);
25280d160211SJeremy Fitzhardinge }
25290d160211SJeremy Fitzhardinge module_init(netif_init);
25300d160211SJeremy Fitzhardinge 
25310d160211SJeremy Fitzhardinge 
25320d160211SJeremy Fitzhardinge static void __exit netif_exit(void)
25330d160211SJeremy Fitzhardinge {
2534ffb78a26SAl Viro 	xenbus_unregister_driver(&netfront_driver);
25350d160211SJeremy Fitzhardinge }
25360d160211SJeremy Fitzhardinge module_exit(netif_exit);
25370d160211SJeremy Fitzhardinge 
25380d160211SJeremy Fitzhardinge MODULE_DESCRIPTION("Xen virtual network device frontend");
25390d160211SJeremy Fitzhardinge MODULE_LICENSE("GPL");
2540d2f0c52bSMark McLoughlin MODULE_ALIAS("xen:vif");
25414f93f09bSMark McLoughlin MODULE_ALIAS("xennet");
2542