xref: /openbmc/linux/drivers/net/xen-netfront.c (revision fdc13979)
10d160211SJeremy Fitzhardinge /*
20d160211SJeremy Fitzhardinge  * Virtual network driver for conversing with remote driver backends.
30d160211SJeremy Fitzhardinge  *
40d160211SJeremy Fitzhardinge  * Copyright (c) 2002-2005, K A Fraser
50d160211SJeremy Fitzhardinge  * Copyright (c) 2005, XenSource Ltd
60d160211SJeremy Fitzhardinge  *
70d160211SJeremy Fitzhardinge  * This program is free software; you can redistribute it and/or
80d160211SJeremy Fitzhardinge  * modify it under the terms of the GNU General Public License version 2
90d160211SJeremy Fitzhardinge  * as published by the Free Software Foundation; or, when distributed
100d160211SJeremy Fitzhardinge  * separately from the Linux kernel or incorporated into other
110d160211SJeremy Fitzhardinge  * software packages, subject to the following license:
120d160211SJeremy Fitzhardinge  *
130d160211SJeremy Fitzhardinge  * Permission is hereby granted, free of charge, to any person obtaining a copy
140d160211SJeremy Fitzhardinge  * of this source file (the "Software"), to deal in the Software without
150d160211SJeremy Fitzhardinge  * restriction, including without limitation the rights to use, copy, modify,
160d160211SJeremy Fitzhardinge  * merge, publish, distribute, sublicense, and/or sell copies of the Software,
170d160211SJeremy Fitzhardinge  * and to permit persons to whom the Software is furnished to do so, subject to
180d160211SJeremy Fitzhardinge  * the following conditions:
190d160211SJeremy Fitzhardinge  *
200d160211SJeremy Fitzhardinge  * The above copyright notice and this permission notice shall be included in
210d160211SJeremy Fitzhardinge  * all copies or substantial portions of the Software.
220d160211SJeremy Fitzhardinge  *
230d160211SJeremy Fitzhardinge  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
240d160211SJeremy Fitzhardinge  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
250d160211SJeremy Fitzhardinge  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
260d160211SJeremy Fitzhardinge  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
270d160211SJeremy Fitzhardinge  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
280d160211SJeremy Fitzhardinge  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
290d160211SJeremy Fitzhardinge  * IN THE SOFTWARE.
300d160211SJeremy Fitzhardinge  */
310d160211SJeremy Fitzhardinge 
32383eda32SJoe Perches #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
33383eda32SJoe Perches 
340d160211SJeremy Fitzhardinge #include <linux/module.h>
350d160211SJeremy Fitzhardinge #include <linux/kernel.h>
360d160211SJeremy Fitzhardinge #include <linux/netdevice.h>
370d160211SJeremy Fitzhardinge #include <linux/etherdevice.h>
380d160211SJeremy Fitzhardinge #include <linux/skbuff.h>
390d160211SJeremy Fitzhardinge #include <linux/ethtool.h>
400d160211SJeremy Fitzhardinge #include <linux/if_ether.h>
419ecd1a75SWei Liu #include <net/tcp.h>
420d160211SJeremy Fitzhardinge #include <linux/udp.h>
430d160211SJeremy Fitzhardinge #include <linux/moduleparam.h>
440d160211SJeremy Fitzhardinge #include <linux/mm.h>
455a0e3ad6STejun Heo #include <linux/slab.h>
460d160211SJeremy Fitzhardinge #include <net/ip.h>
476c5aa6fcSDenis Kirjanov #include <linux/bpf.h>
486c5aa6fcSDenis Kirjanov #include <net/page_pool.h>
496c5aa6fcSDenis Kirjanov #include <linux/bpf_trace.h>
500d160211SJeremy Fitzhardinge 
511ccbf534SJeremy Fitzhardinge #include <xen/xen.h>
520d160211SJeremy Fitzhardinge #include <xen/xenbus.h>
530d160211SJeremy Fitzhardinge #include <xen/events.h>
540d160211SJeremy Fitzhardinge #include <xen/page.h>
55b9136d20SIgor Mammedov #include <xen/platform_pci.h>
560d160211SJeremy Fitzhardinge #include <xen/grant_table.h>
570d160211SJeremy Fitzhardinge 
580d160211SJeremy Fitzhardinge #include <xen/interface/io/netif.h>
590d160211SJeremy Fitzhardinge #include <xen/interface/memory.h>
600d160211SJeremy Fitzhardinge #include <xen/interface/grant_table.h>
610d160211SJeremy Fitzhardinge 
6250ee6061SAndrew J. Bennieston /* Module parameters */
63034702a6SJuergen Gross #define MAX_QUEUES_DEFAULT 8
6450ee6061SAndrew J. Bennieston static unsigned int xennet_max_queues;
6550ee6061SAndrew J. Bennieston module_param_named(max_queues, xennet_max_queues, uint, 0644);
6650ee6061SAndrew J. Bennieston MODULE_PARM_DESC(max_queues,
6750ee6061SAndrew J. Bennieston 		 "Maximum number of queues per virtual interface");
6850ee6061SAndrew J. Bennieston 
69c2c63310SAndrea Righi #define XENNET_TIMEOUT  (5 * HZ)
70c2c63310SAndrea Righi 
710fc0b732SStephen Hemminger static const struct ethtool_ops xennet_ethtool_ops;
720d160211SJeremy Fitzhardinge 
/*
 * Driver-private data kept in the control buffer (skb->cb) of an skb.
 *
 * NOTE(review): pull_to presumably records how many bytes should end up in
 * the linear area of a received skb -- confirm against the rx path.
 */
struct netfront_cb {
	int pull_to;
};

/* View the control buffer of @skb as a struct netfront_cb. */
#define NETFRONT_SKB_CB(skb)	((struct netfront_cb *)((skb)->cb))
780d160211SJeremy Fitzhardinge 
/* Size of the linear area requested for each rx skb (before NET_IP_ALIGN). */
#define RX_COPY_THRESHOLD 256

/* Value stored in a grant_{tx,rx}_ref[] slot that holds no grant. */
#define GRANT_INVALID_REF	0

/* Number of entries in a tx/rx ring that occupies one XEN_PAGE_SIZE page. */
#define NET_TX_RING_SIZE __CONST_RING_SIZE(xen_netif_tx, XEN_PAGE_SIZE)
#define NET_RX_RING_SIZE __CONST_RING_SIZE(xen_netif_rx, XEN_PAGE_SIZE)

/* Minimum number of Rx slots (includes slot for GSO metadata). */
#define NET_RX_SLOTS_MIN (XEN_NETIF_NR_SLOTS_MIN + 1)

/* A queue name is the interface name with "-qNNN" appended. */
#define QUEUE_NAME_SIZE (IFNAMSIZ + 6)

/* An IRQ name is the queue name with "-tx" or "-rx" appended. */
#define IRQ_NAME_SIZE (QUEUE_NAME_SIZE + 3)

/* Module-wide wait queue; its waiters and wakers are outside this excerpt. */
static DECLARE_WAIT_QUEUE_HEAD(module_wq);
965b5971dfSEduardo Otubo 
97e00f85beSstephen hemminger struct netfront_stats {
98900e1833SDavid Vrabel 	u64			packets;
99900e1833SDavid Vrabel 	u64			bytes;
100e00f85beSstephen hemminger 	struct u64_stats_sync	syncp;
101e00f85beSstephen hemminger };
102e00f85beSstephen hemminger 
1032688fcb7SAndrew J. Bennieston struct netfront_info;
1042688fcb7SAndrew J. Bennieston 
1052688fcb7SAndrew J. Bennieston struct netfront_queue {
1062688fcb7SAndrew J. Bennieston 	unsigned int id; /* Queue ID, 0-based */
1072688fcb7SAndrew J. Bennieston 	char name[QUEUE_NAME_SIZE]; /* DEVNAME-qN */
1082688fcb7SAndrew J. Bennieston 	struct netfront_info *info;
1090d160211SJeremy Fitzhardinge 
1106c5aa6fcSDenis Kirjanov 	struct bpf_prog __rcu *xdp_prog;
1116c5aa6fcSDenis Kirjanov 
112bea3348eSStephen Hemminger 	struct napi_struct napi;
1130d160211SJeremy Fitzhardinge 
114d634bf2cSWei Liu 	/* Split event channels support, tx_* == rx_* when using
115d634bf2cSWei Liu 	 * single event channel.
116d634bf2cSWei Liu 	 */
117d634bf2cSWei Liu 	unsigned int tx_evtchn, rx_evtchn;
118d634bf2cSWei Liu 	unsigned int tx_irq, rx_irq;
119d634bf2cSWei Liu 	/* Only used when split event channels support is enabled */
1202688fcb7SAndrew J. Bennieston 	char tx_irq_name[IRQ_NAME_SIZE]; /* DEVNAME-qN-tx */
1212688fcb7SAndrew J. Bennieston 	char rx_irq_name[IRQ_NAME_SIZE]; /* DEVNAME-qN-rx */
1220d160211SJeremy Fitzhardinge 
1230d160211SJeremy Fitzhardinge 	spinlock_t   tx_lock;
12484284d3cSJeremy Fitzhardinge 	struct xen_netif_tx_front_ring tx;
12584284d3cSJeremy Fitzhardinge 	int tx_ring_ref;
1260d160211SJeremy Fitzhardinge 
1270d160211SJeremy Fitzhardinge 	/*
1280d160211SJeremy Fitzhardinge 	 * {tx,rx}_skbs store outstanding skbuffs. Free tx_skb entries
1290d160211SJeremy Fitzhardinge 	 * are linked from tx_skb_freelist through skb_entry.link.
1300d160211SJeremy Fitzhardinge 	 *
1310d160211SJeremy Fitzhardinge 	 *  NB. Freelist index entries are always going to be less than
1320d160211SJeremy Fitzhardinge 	 *  PAGE_OFFSET, whereas pointers to skbs will always be equal or
1330d160211SJeremy Fitzhardinge 	 *  greater than PAGE_OFFSET: we use this property to distinguish
1340d160211SJeremy Fitzhardinge 	 *  them.
1350d160211SJeremy Fitzhardinge 	 */
1360d160211SJeremy Fitzhardinge 	union skb_entry {
1370d160211SJeremy Fitzhardinge 		struct sk_buff *skb;
1381ffb40b8SIsaku Yamahata 		unsigned long link;
1390d160211SJeremy Fitzhardinge 	} tx_skbs[NET_TX_RING_SIZE];
1400d160211SJeremy Fitzhardinge 	grant_ref_t gref_tx_head;
1410d160211SJeremy Fitzhardinge 	grant_ref_t grant_tx_ref[NET_TX_RING_SIZE];
142cefe0078SAnnie Li 	struct page *grant_tx_page[NET_TX_RING_SIZE];
1430d160211SJeremy Fitzhardinge 	unsigned tx_skb_freelist;
1440d160211SJeremy Fitzhardinge 
14584284d3cSJeremy Fitzhardinge 	spinlock_t   rx_lock ____cacheline_aligned_in_smp;
14684284d3cSJeremy Fitzhardinge 	struct xen_netif_rx_front_ring rx;
14784284d3cSJeremy Fitzhardinge 	int rx_ring_ref;
14884284d3cSJeremy Fitzhardinge 
14984284d3cSJeremy Fitzhardinge 	struct timer_list rx_refill_timer;
15084284d3cSJeremy Fitzhardinge 
1510d160211SJeremy Fitzhardinge 	struct sk_buff *rx_skbs[NET_RX_RING_SIZE];
1520d160211SJeremy Fitzhardinge 	grant_ref_t gref_rx_head;
1530d160211SJeremy Fitzhardinge 	grant_ref_t grant_rx_ref[NET_RX_RING_SIZE];
1546c5aa6fcSDenis Kirjanov 
1556c5aa6fcSDenis Kirjanov 	struct page_pool *page_pool;
1566c5aa6fcSDenis Kirjanov 	struct xdp_rxq_info xdp_rxq;
1572688fcb7SAndrew J. Bennieston };
1582688fcb7SAndrew J. Bennieston 
1592688fcb7SAndrew J. Bennieston struct netfront_info {
1602688fcb7SAndrew J. Bennieston 	struct list_head list;
1612688fcb7SAndrew J. Bennieston 	struct net_device *netdev;
1622688fcb7SAndrew J. Bennieston 
1632688fcb7SAndrew J. Bennieston 	struct xenbus_device *xbdev;
1642688fcb7SAndrew J. Bennieston 
1652688fcb7SAndrew J. Bennieston 	/* Multi-queue support */
1662688fcb7SAndrew J. Bennieston 	struct netfront_queue *queues;
167e0ce4af9SIan Campbell 
168e0ce4af9SIan Campbell 	/* Statistics */
169900e1833SDavid Vrabel 	struct netfront_stats __percpu *rx_stats;
170900e1833SDavid Vrabel 	struct netfront_stats __percpu *tx_stats;
171e00f85beSstephen hemminger 
1726c5aa6fcSDenis Kirjanov 	/* XDP state */
1736c5aa6fcSDenis Kirjanov 	bool netback_has_xdp_headroom;
1746c5aa6fcSDenis Kirjanov 	bool netfront_xdp_enabled;
1756c5aa6fcSDenis Kirjanov 
1762688fcb7SAndrew J. Bennieston 	atomic_t rx_gso_checksum_fixup;
1770d160211SJeremy Fitzhardinge };
1780d160211SJeremy Fitzhardinge 
1790d160211SJeremy Fitzhardinge struct netfront_rx_info {
1800d160211SJeremy Fitzhardinge 	struct xen_netif_rx_response rx;
1810d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info extras[XEN_NETIF_EXTRA_TYPE_MAX - 1];
1820d160211SJeremy Fitzhardinge };
1830d160211SJeremy Fitzhardinge 
1841ffb40b8SIsaku Yamahata static void skb_entry_set_link(union skb_entry *list, unsigned short id)
1851ffb40b8SIsaku Yamahata {
1861ffb40b8SIsaku Yamahata 	list->link = id;
1871ffb40b8SIsaku Yamahata }
1881ffb40b8SIsaku Yamahata 
1891ffb40b8SIsaku Yamahata static int skb_entry_is_link(const union skb_entry *list)
1901ffb40b8SIsaku Yamahata {
1911ffb40b8SIsaku Yamahata 	BUILD_BUG_ON(sizeof(list->skb) != sizeof(list->link));
192807540baSEric Dumazet 	return (unsigned long)list->skb < PAGE_OFFSET;
1931ffb40b8SIsaku Yamahata }
1941ffb40b8SIsaku Yamahata 
1950d160211SJeremy Fitzhardinge /*
1960d160211SJeremy Fitzhardinge  * Access macros for acquiring freeing slots in tx_skbs[].
1970d160211SJeremy Fitzhardinge  */
1980d160211SJeremy Fitzhardinge 
1990d160211SJeremy Fitzhardinge static void add_id_to_freelist(unsigned *head, union skb_entry *list,
2000d160211SJeremy Fitzhardinge 			       unsigned short id)
2010d160211SJeremy Fitzhardinge {
2021ffb40b8SIsaku Yamahata 	skb_entry_set_link(&list[id], *head);
2030d160211SJeremy Fitzhardinge 	*head = id;
2040d160211SJeremy Fitzhardinge }
2050d160211SJeremy Fitzhardinge 
2060d160211SJeremy Fitzhardinge static unsigned short get_id_from_freelist(unsigned *head,
2070d160211SJeremy Fitzhardinge 					   union skb_entry *list)
2080d160211SJeremy Fitzhardinge {
2090d160211SJeremy Fitzhardinge 	unsigned int id = *head;
2100d160211SJeremy Fitzhardinge 	*head = list[id].link;
2110d160211SJeremy Fitzhardinge 	return id;
2120d160211SJeremy Fitzhardinge }
2130d160211SJeremy Fitzhardinge 
2140d160211SJeremy Fitzhardinge static int xennet_rxidx(RING_IDX idx)
2150d160211SJeremy Fitzhardinge {
2160d160211SJeremy Fitzhardinge 	return idx & (NET_RX_RING_SIZE - 1);
2170d160211SJeremy Fitzhardinge }
2180d160211SJeremy Fitzhardinge 
2192688fcb7SAndrew J. Bennieston static struct sk_buff *xennet_get_rx_skb(struct netfront_queue *queue,
2200d160211SJeremy Fitzhardinge 					 RING_IDX ri)
2210d160211SJeremy Fitzhardinge {
2220d160211SJeremy Fitzhardinge 	int i = xennet_rxidx(ri);
2232688fcb7SAndrew J. Bennieston 	struct sk_buff *skb = queue->rx_skbs[i];
2242688fcb7SAndrew J. Bennieston 	queue->rx_skbs[i] = NULL;
2250d160211SJeremy Fitzhardinge 	return skb;
2260d160211SJeremy Fitzhardinge }
2270d160211SJeremy Fitzhardinge 
2282688fcb7SAndrew J. Bennieston static grant_ref_t xennet_get_rx_ref(struct netfront_queue *queue,
2290d160211SJeremy Fitzhardinge 					    RING_IDX ri)
2300d160211SJeremy Fitzhardinge {
2310d160211SJeremy Fitzhardinge 	int i = xennet_rxidx(ri);
2322688fcb7SAndrew J. Bennieston 	grant_ref_t ref = queue->grant_rx_ref[i];
2332688fcb7SAndrew J. Bennieston 	queue->grant_rx_ref[i] = GRANT_INVALID_REF;
2340d160211SJeremy Fitzhardinge 	return ref;
2350d160211SJeremy Fitzhardinge }
2360d160211SJeremy Fitzhardinge 
2370d160211SJeremy Fitzhardinge #ifdef CONFIG_SYSFS
23827b917e5STakashi Iwai static const struct attribute_group xennet_dev_group;
2390d160211SJeremy Fitzhardinge #endif
2400d160211SJeremy Fitzhardinge 
2413ad9b358SMichał Mirosław static bool xennet_can_sg(struct net_device *dev)
2420d160211SJeremy Fitzhardinge {
2433ad9b358SMichał Mirosław 	return dev->features & NETIF_F_SG;
2440d160211SJeremy Fitzhardinge }
2450d160211SJeremy Fitzhardinge 
2460d160211SJeremy Fitzhardinge 
247e99e88a9SKees Cook static void rx_refill_timeout(struct timer_list *t)
2480d160211SJeremy Fitzhardinge {
249e99e88a9SKees Cook 	struct netfront_queue *queue = from_timer(queue, t, rx_refill_timer);
2502688fcb7SAndrew J. Bennieston 	napi_schedule(&queue->napi);
2510d160211SJeremy Fitzhardinge }
2520d160211SJeremy Fitzhardinge 
2532688fcb7SAndrew J. Bennieston static int netfront_tx_slot_available(struct netfront_queue *queue)
2540d160211SJeremy Fitzhardinge {
2552688fcb7SAndrew J. Bennieston 	return (queue->tx.req_prod_pvt - queue->tx.rsp_cons) <
25657f230abSJuergen Gross 		(NET_TX_RING_SIZE - XEN_NETIF_NR_SLOTS_MIN - 1);
2570d160211SJeremy Fitzhardinge }
2580d160211SJeremy Fitzhardinge 
2592688fcb7SAndrew J. Bennieston static void xennet_maybe_wake_tx(struct netfront_queue *queue)
2600d160211SJeremy Fitzhardinge {
2612688fcb7SAndrew J. Bennieston 	struct net_device *dev = queue->info->netdev;
2622688fcb7SAndrew J. Bennieston 	struct netdev_queue *dev_queue = netdev_get_tx_queue(dev, queue->id);
2630d160211SJeremy Fitzhardinge 
2642688fcb7SAndrew J. Bennieston 	if (unlikely(netif_tx_queue_stopped(dev_queue)) &&
2652688fcb7SAndrew J. Bennieston 	    netfront_tx_slot_available(queue) &&
2660d160211SJeremy Fitzhardinge 	    likely(netif_running(dev)))
2672688fcb7SAndrew J. Bennieston 		netif_tx_wake_queue(netdev_get_tx_queue(dev, queue->id));
2680d160211SJeremy Fitzhardinge }
2690d160211SJeremy Fitzhardinge 
2701f3c2ebaSDavid Vrabel 
2711f3c2ebaSDavid Vrabel static struct sk_buff *xennet_alloc_one_rx_buffer(struct netfront_queue *queue)
2720d160211SJeremy Fitzhardinge {
2730d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
2740d160211SJeremy Fitzhardinge 	struct page *page;
2750d160211SJeremy Fitzhardinge 
2762688fcb7SAndrew J. Bennieston 	skb = __netdev_alloc_skb(queue->info->netdev,
2772688fcb7SAndrew J. Bennieston 				 RX_COPY_THRESHOLD + NET_IP_ALIGN,
2780d160211SJeremy Fitzhardinge 				 GFP_ATOMIC | __GFP_NOWARN);
2790d160211SJeremy Fitzhardinge 	if (unlikely(!skb))
2801f3c2ebaSDavid Vrabel 		return NULL;
281617a20bbSIsaku Yamahata 
2826c5aa6fcSDenis Kirjanov 	page = page_pool_dev_alloc_pages(queue->page_pool);
2836c5aa6fcSDenis Kirjanov 	if (unlikely(!page)) {
2840d160211SJeremy Fitzhardinge 		kfree_skb(skb);
2851f3c2ebaSDavid Vrabel 		return NULL;
2860d160211SJeremy Fitzhardinge 	}
287093b9c71SJan Beulich 	skb_add_rx_frag(skb, 0, page, 0, 0, PAGE_SIZE);
2880d160211SJeremy Fitzhardinge 
2891f3c2ebaSDavid Vrabel 	/* Align ip header to a 16 bytes boundary */
2901f3c2ebaSDavid Vrabel 	skb_reserve(skb, NET_IP_ALIGN);
2912688fcb7SAndrew J. Bennieston 	skb->dev = queue->info->netdev;
2920d160211SJeremy Fitzhardinge 
2931f3c2ebaSDavid Vrabel 	return skb;
2941f3c2ebaSDavid Vrabel }
2951f3c2ebaSDavid Vrabel 
2961f3c2ebaSDavid Vrabel 
2971f3c2ebaSDavid Vrabel static void xennet_alloc_rx_buffers(struct netfront_queue *queue)
2981f3c2ebaSDavid Vrabel {
2991f3c2ebaSDavid Vrabel 	RING_IDX req_prod = queue->rx.req_prod_pvt;
3001f3c2ebaSDavid Vrabel 	int notify;
301538d9291SVineeth Remanan Pillai 	int err = 0;
3021f3c2ebaSDavid Vrabel 
3031f3c2ebaSDavid Vrabel 	if (unlikely(!netif_carrier_ok(queue->info->netdev)))
3041f3c2ebaSDavid Vrabel 		return;
3051f3c2ebaSDavid Vrabel 
3061f3c2ebaSDavid Vrabel 	for (req_prod = queue->rx.req_prod_pvt;
3071f3c2ebaSDavid Vrabel 	     req_prod - queue->rx.rsp_cons < NET_RX_RING_SIZE;
3081f3c2ebaSDavid Vrabel 	     req_prod++) {
3091f3c2ebaSDavid Vrabel 		struct sk_buff *skb;
3101f3c2ebaSDavid Vrabel 		unsigned short id;
3111f3c2ebaSDavid Vrabel 		grant_ref_t ref;
31230c5d7f0SJulien Grall 		struct page *page;
3131f3c2ebaSDavid Vrabel 		struct xen_netif_rx_request *req;
3141f3c2ebaSDavid Vrabel 
3151f3c2ebaSDavid Vrabel 		skb = xennet_alloc_one_rx_buffer(queue);
316538d9291SVineeth Remanan Pillai 		if (!skb) {
317538d9291SVineeth Remanan Pillai 			err = -ENOMEM;
3181f3c2ebaSDavid Vrabel 			break;
319538d9291SVineeth Remanan Pillai 		}
3201f3c2ebaSDavid Vrabel 
3211f3c2ebaSDavid Vrabel 		id = xennet_rxidx(req_prod);
3220d160211SJeremy Fitzhardinge 
3232688fcb7SAndrew J. Bennieston 		BUG_ON(queue->rx_skbs[id]);
3242688fcb7SAndrew J. Bennieston 		queue->rx_skbs[id] = skb;
3250d160211SJeremy Fitzhardinge 
3262688fcb7SAndrew J. Bennieston 		ref = gnttab_claim_grant_reference(&queue->gref_rx_head);
327269ebce4SDongli Zhang 		WARN_ON_ONCE(IS_ERR_VALUE((unsigned long)(int)ref));
3282688fcb7SAndrew J. Bennieston 		queue->grant_rx_ref[id] = ref;
3290d160211SJeremy Fitzhardinge 
33030c5d7f0SJulien Grall 		page = skb_frag_page(&skb_shinfo(skb)->frags[0]);
3310d160211SJeremy Fitzhardinge 
3321f3c2ebaSDavid Vrabel 		req = RING_GET_REQUEST(&queue->rx, req_prod);
33330c5d7f0SJulien Grall 		gnttab_page_grant_foreign_access_ref_one(ref,
3342688fcb7SAndrew J. Bennieston 							 queue->info->xbdev->otherend_id,
33530c5d7f0SJulien Grall 							 page,
3360d160211SJeremy Fitzhardinge 							 0);
3370d160211SJeremy Fitzhardinge 		req->id = id;
3380d160211SJeremy Fitzhardinge 		req->gref = ref;
3390d160211SJeremy Fitzhardinge 	}
3400d160211SJeremy Fitzhardinge 
3411f3c2ebaSDavid Vrabel 	queue->rx.req_prod_pvt = req_prod;
3421f3c2ebaSDavid Vrabel 
343538d9291SVineeth Remanan Pillai 	/* Try again later if there are not enough requests or skb allocation
344538d9291SVineeth Remanan Pillai 	 * failed.
345538d9291SVineeth Remanan Pillai 	 * Enough requests is quantified as the sum of newly created slots and
346538d9291SVineeth Remanan Pillai 	 * the unconsumed slots at the backend.
347538d9291SVineeth Remanan Pillai 	 */
348538d9291SVineeth Remanan Pillai 	if (req_prod - queue->rx.rsp_cons < NET_RX_SLOTS_MIN ||
349538d9291SVineeth Remanan Pillai 	    unlikely(err)) {
3501f3c2ebaSDavid Vrabel 		mod_timer(&queue->rx_refill_timer, jiffies + (HZ/10));
3511f3c2ebaSDavid Vrabel 		return;
3521f3c2ebaSDavid Vrabel 	}
3531f3c2ebaSDavid Vrabel 
3542688fcb7SAndrew J. Bennieston 	RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&queue->rx, notify);
3550d160211SJeremy Fitzhardinge 	if (notify)
3562688fcb7SAndrew J. Bennieston 		notify_remote_via_irq(queue->rx_irq);
3570d160211SJeremy Fitzhardinge }
3580d160211SJeremy Fitzhardinge 
3590d160211SJeremy Fitzhardinge static int xennet_open(struct net_device *dev)
3600d160211SJeremy Fitzhardinge {
3610d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
3622688fcb7SAndrew J. Bennieston 	unsigned int num_queues = dev->real_num_tx_queues;
3632688fcb7SAndrew J. Bennieston 	unsigned int i = 0;
3642688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = NULL;
3650d160211SJeremy Fitzhardinge 
366f599c64fSRoss Lagerwall 	if (!np->queues)
367f599c64fSRoss Lagerwall 		return -ENODEV;
368f599c64fSRoss Lagerwall 
3692688fcb7SAndrew J. Bennieston 	for (i = 0; i < num_queues; ++i) {
3702688fcb7SAndrew J. Bennieston 		queue = &np->queues[i];
3712688fcb7SAndrew J. Bennieston 		napi_enable(&queue->napi);
372bea3348eSStephen Hemminger 
3732688fcb7SAndrew J. Bennieston 		spin_lock_bh(&queue->rx_lock);
3740d160211SJeremy Fitzhardinge 		if (netif_carrier_ok(dev)) {
3752688fcb7SAndrew J. Bennieston 			xennet_alloc_rx_buffers(queue);
3762688fcb7SAndrew J. Bennieston 			queue->rx.sring->rsp_event = queue->rx.rsp_cons + 1;
3772688fcb7SAndrew J. Bennieston 			if (RING_HAS_UNCONSUMED_RESPONSES(&queue->rx))
3782688fcb7SAndrew J. Bennieston 				napi_schedule(&queue->napi);
3790d160211SJeremy Fitzhardinge 		}
3802688fcb7SAndrew J. Bennieston 		spin_unlock_bh(&queue->rx_lock);
3812688fcb7SAndrew J. Bennieston 	}
3820d160211SJeremy Fitzhardinge 
3832688fcb7SAndrew J. Bennieston 	netif_tx_start_all_queues(dev);
3840d160211SJeremy Fitzhardinge 
3850d160211SJeremy Fitzhardinge 	return 0;
3860d160211SJeremy Fitzhardinge }
3870d160211SJeremy Fitzhardinge 
3882688fcb7SAndrew J. Bennieston static void xennet_tx_buf_gc(struct netfront_queue *queue)
3890d160211SJeremy Fitzhardinge {
3900d160211SJeremy Fitzhardinge 	RING_IDX cons, prod;
3910d160211SJeremy Fitzhardinge 	unsigned short id;
3920d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
3937d0105b5SMalcolm Crossley 	bool more_to_do;
3940d160211SJeremy Fitzhardinge 
3952688fcb7SAndrew J. Bennieston 	BUG_ON(!netif_carrier_ok(queue->info->netdev));
3960d160211SJeremy Fitzhardinge 
3970d160211SJeremy Fitzhardinge 	do {
3982688fcb7SAndrew J. Bennieston 		prod = queue->tx.sring->rsp_prod;
3990d160211SJeremy Fitzhardinge 		rmb(); /* Ensure we see responses up to 'rp'. */
4000d160211SJeremy Fitzhardinge 
4012688fcb7SAndrew J. Bennieston 		for (cons = queue->tx.rsp_cons; cons != prod; cons++) {
4020d160211SJeremy Fitzhardinge 			struct xen_netif_tx_response *txrsp;
4030d160211SJeremy Fitzhardinge 
4042688fcb7SAndrew J. Bennieston 			txrsp = RING_GET_RESPONSE(&queue->tx, cons);
405f942dc25SIan Campbell 			if (txrsp->status == XEN_NETIF_RSP_NULL)
4060d160211SJeremy Fitzhardinge 				continue;
4070d160211SJeremy Fitzhardinge 
4080d160211SJeremy Fitzhardinge 			id  = txrsp->id;
4092688fcb7SAndrew J. Bennieston 			skb = queue->tx_skbs[id].skb;
4100d160211SJeremy Fitzhardinge 			if (unlikely(gnttab_query_foreign_access(
4112688fcb7SAndrew J. Bennieston 				queue->grant_tx_ref[id]) != 0)) {
412383eda32SJoe Perches 				pr_alert("%s: warning -- grant still in use by backend domain\n",
413383eda32SJoe Perches 					 __func__);
4140d160211SJeremy Fitzhardinge 				BUG();
4150d160211SJeremy Fitzhardinge 			}
4160d160211SJeremy Fitzhardinge 			gnttab_end_foreign_access_ref(
4172688fcb7SAndrew J. Bennieston 				queue->grant_tx_ref[id], GNTMAP_readonly);
4180d160211SJeremy Fitzhardinge 			gnttab_release_grant_reference(
4192688fcb7SAndrew J. Bennieston 				&queue->gref_tx_head, queue->grant_tx_ref[id]);
4202688fcb7SAndrew J. Bennieston 			queue->grant_tx_ref[id] = GRANT_INVALID_REF;
4212688fcb7SAndrew J. Bennieston 			queue->grant_tx_page[id] = NULL;
4222688fcb7SAndrew J. Bennieston 			add_id_to_freelist(&queue->tx_skb_freelist, queue->tx_skbs, id);
4230d160211SJeremy Fitzhardinge 			dev_kfree_skb_irq(skb);
4240d160211SJeremy Fitzhardinge 		}
4250d160211SJeremy Fitzhardinge 
4262688fcb7SAndrew J. Bennieston 		queue->tx.rsp_cons = prod;
4270d160211SJeremy Fitzhardinge 
4287d0105b5SMalcolm Crossley 		RING_FINAL_CHECK_FOR_RESPONSES(&queue->tx, more_to_do);
4297d0105b5SMalcolm Crossley 	} while (more_to_do);
4300d160211SJeremy Fitzhardinge 
4312688fcb7SAndrew J. Bennieston 	xennet_maybe_wake_tx(queue);
4320d160211SJeremy Fitzhardinge }
4330d160211SJeremy Fitzhardinge 
/*
 * Context handed through the gnttab_*grant* iterators to the callbacks that
 * build tx requests (xennet_tx_setup_grant(), xennet_make_one_txreq()).
 */
struct xennet_gnttab_make_txreq {
	struct netfront_queue *queue;	 /* Queue whose tx ring is filled */
	struct sk_buff *skb;		 /* Recorded as owner of each slot */
	struct page *page;		 /* Page recorded for each slot */
	struct xen_netif_tx_request *tx; /* Last request */
	unsigned int size;		 /* Running total of request sizes */
};
44130c5d7f0SJulien Grall 
44230c5d7f0SJulien Grall static void xennet_tx_setup_grant(unsigned long gfn, unsigned int offset,
44330c5d7f0SJulien Grall 				  unsigned int len, void *data)
4440d160211SJeremy Fitzhardinge {
44530c5d7f0SJulien Grall 	struct xennet_gnttab_make_txreq *info = data;
4460d160211SJeremy Fitzhardinge 	unsigned int id;
447a55e8bb8SDavid Vrabel 	struct xen_netif_tx_request *tx;
4480d160211SJeremy Fitzhardinge 	grant_ref_t ref;
44930c5d7f0SJulien Grall 	/* convenient aliases */
45030c5d7f0SJulien Grall 	struct page *page = info->page;
45130c5d7f0SJulien Grall 	struct netfront_queue *queue = info->queue;
45230c5d7f0SJulien Grall 	struct sk_buff *skb = info->skb;
4530d160211SJeremy Fitzhardinge 
4542688fcb7SAndrew J. Bennieston 	id = get_id_from_freelist(&queue->tx_skb_freelist, queue->tx_skbs);
455a55e8bb8SDavid Vrabel 	tx = RING_GET_REQUEST(&queue->tx, queue->tx.req_prod_pvt++);
4562688fcb7SAndrew J. Bennieston 	ref = gnttab_claim_grant_reference(&queue->gref_tx_head);
457269ebce4SDongli Zhang 	WARN_ON_ONCE(IS_ERR_VALUE((unsigned long)(int)ref));
4580d160211SJeremy Fitzhardinge 
45930c5d7f0SJulien Grall 	gnttab_grant_foreign_access_ref(ref, queue->info->xbdev->otherend_id,
46030c5d7f0SJulien Grall 					gfn, GNTMAP_readonly);
4610d160211SJeremy Fitzhardinge 
462a55e8bb8SDavid Vrabel 	queue->tx_skbs[id].skb = skb;
463a55e8bb8SDavid Vrabel 	queue->grant_tx_page[id] = page;
464a55e8bb8SDavid Vrabel 	queue->grant_tx_ref[id] = ref;
465a55e8bb8SDavid Vrabel 
466a55e8bb8SDavid Vrabel 	tx->id = id;
467a55e8bb8SDavid Vrabel 	tx->gref = ref;
4680d160211SJeremy Fitzhardinge 	tx->offset = offset;
4690d160211SJeremy Fitzhardinge 	tx->size = len;
4700d160211SJeremy Fitzhardinge 	tx->flags = 0;
471a55e8bb8SDavid Vrabel 
47230c5d7f0SJulien Grall 	info->tx = tx;
47330c5d7f0SJulien Grall 	info->size += tx->size;
47430c5d7f0SJulien Grall }
47530c5d7f0SJulien Grall 
47630c5d7f0SJulien Grall static struct xen_netif_tx_request *xennet_make_first_txreq(
47730c5d7f0SJulien Grall 	struct netfront_queue *queue, struct sk_buff *skb,
47830c5d7f0SJulien Grall 	struct page *page, unsigned int offset, unsigned int len)
47930c5d7f0SJulien Grall {
48030c5d7f0SJulien Grall 	struct xennet_gnttab_make_txreq info = {
48130c5d7f0SJulien Grall 		.queue = queue,
48230c5d7f0SJulien Grall 		.skb = skb,
48330c5d7f0SJulien Grall 		.page = page,
48430c5d7f0SJulien Grall 		.size = 0,
48530c5d7f0SJulien Grall 	};
48630c5d7f0SJulien Grall 
48730c5d7f0SJulien Grall 	gnttab_for_one_grant(page, offset, len, xennet_tx_setup_grant, &info);
48830c5d7f0SJulien Grall 
48930c5d7f0SJulien Grall 	return info.tx;
49030c5d7f0SJulien Grall }
49130c5d7f0SJulien Grall 
49230c5d7f0SJulien Grall static void xennet_make_one_txreq(unsigned long gfn, unsigned int offset,
49330c5d7f0SJulien Grall 				  unsigned int len, void *data)
49430c5d7f0SJulien Grall {
49530c5d7f0SJulien Grall 	struct xennet_gnttab_make_txreq *info = data;
49630c5d7f0SJulien Grall 
49730c5d7f0SJulien Grall 	info->tx->flags |= XEN_NETTXF_more_data;
49830c5d7f0SJulien Grall 	skb_get(info->skb);
49930c5d7f0SJulien Grall 	xennet_tx_setup_grant(gfn, offset, len, data);
5000d160211SJeremy Fitzhardinge }
5010d160211SJeremy Fitzhardinge 
502a55e8bb8SDavid Vrabel static struct xen_netif_tx_request *xennet_make_txreqs(
503a55e8bb8SDavid Vrabel 	struct netfront_queue *queue, struct xen_netif_tx_request *tx,
504a55e8bb8SDavid Vrabel 	struct sk_buff *skb, struct page *page,
505a55e8bb8SDavid Vrabel 	unsigned int offset, unsigned int len)
506a55e8bb8SDavid Vrabel {
50730c5d7f0SJulien Grall 	struct xennet_gnttab_make_txreq info = {
50830c5d7f0SJulien Grall 		.queue = queue,
50930c5d7f0SJulien Grall 		.skb = skb,
51030c5d7f0SJulien Grall 		.tx = tx,
51130c5d7f0SJulien Grall 	};
51230c5d7f0SJulien Grall 
513f36c3747SIan Campbell 	/* Skip unused frames from start of page */
514f36c3747SIan Campbell 	page += offset >> PAGE_SHIFT;
515f36c3747SIan Campbell 	offset &= ~PAGE_MASK;
516f36c3747SIan Campbell 
517a55e8bb8SDavid Vrabel 	while (len) {
51830c5d7f0SJulien Grall 		info.page = page;
51930c5d7f0SJulien Grall 		info.size = 0;
52030c5d7f0SJulien Grall 
52130c5d7f0SJulien Grall 		gnttab_foreach_grant_in_range(page, offset, len,
52230c5d7f0SJulien Grall 					      xennet_make_one_txreq,
52330c5d7f0SJulien Grall 					      &info);
52430c5d7f0SJulien Grall 
525f36c3747SIan Campbell 		page++;
526f36c3747SIan Campbell 		offset = 0;
52730c5d7f0SJulien Grall 		len -= info.size;
5280d160211SJeremy Fitzhardinge 	}
5290d160211SJeremy Fitzhardinge 
53030c5d7f0SJulien Grall 	return info.tx;
5310d160211SJeremy Fitzhardinge }
5320d160211SJeremy Fitzhardinge 
533f36c3747SIan Campbell /*
534e84448d5SDavid Vrabel  * Count how many ring slots are required to send this skb. Each frag
535e84448d5SDavid Vrabel  * might be a compound page.
536f36c3747SIan Campbell  */
537e84448d5SDavid Vrabel static int xennet_count_skb_slots(struct sk_buff *skb)
538f36c3747SIan Campbell {
539f36c3747SIan Campbell 	int i, frags = skb_shinfo(skb)->nr_frags;
54030c5d7f0SJulien Grall 	int slots;
541e84448d5SDavid Vrabel 
54230c5d7f0SJulien Grall 	slots = gnttab_count_grant(offset_in_page(skb->data),
54330c5d7f0SJulien Grall 				   skb_headlen(skb));
544f36c3747SIan Campbell 
545f36c3747SIan Campbell 	for (i = 0; i < frags; i++) {
546f36c3747SIan Campbell 		skb_frag_t *frag = skb_shinfo(skb)->frags + i;
547f36c3747SIan Campbell 		unsigned long size = skb_frag_size(frag);
548b54c9d5bSJonathan Lemon 		unsigned long offset = skb_frag_off(frag);
549f36c3747SIan Campbell 
550f36c3747SIan Campbell 		/* Skip unused frames from start of page */
551f36c3747SIan Campbell 		offset &= ~PAGE_MASK;
552f36c3747SIan Campbell 
55330c5d7f0SJulien Grall 		slots += gnttab_count_grant(offset, size);
554f36c3747SIan Campbell 	}
555f36c3747SIan Campbell 
55630c5d7f0SJulien Grall 	return slots;
557f36c3747SIan Campbell }
558f36c3747SIan Campbell 
55950ee6061SAndrew J. Bennieston static u16 xennet_select_queue(struct net_device *dev, struct sk_buff *skb,
560a350ecceSPaolo Abeni 			       struct net_device *sb_dev)
5612688fcb7SAndrew J. Bennieston {
56250ee6061SAndrew J. Bennieston 	unsigned int num_queues = dev->real_num_tx_queues;
56350ee6061SAndrew J. Bennieston 	u32 hash;
56450ee6061SAndrew J. Bennieston 	u16 queue_idx;
56550ee6061SAndrew J. Bennieston 
56650ee6061SAndrew J. Bennieston 	/* First, check if there is only one queue */
56750ee6061SAndrew J. Bennieston 	if (num_queues == 1) {
56850ee6061SAndrew J. Bennieston 		queue_idx = 0;
56950ee6061SAndrew J. Bennieston 	} else {
57050ee6061SAndrew J. Bennieston 		hash = skb_get_hash(skb);
57150ee6061SAndrew J. Bennieston 		queue_idx = hash % num_queues;
57250ee6061SAndrew J. Bennieston 	}
57350ee6061SAndrew J. Bennieston 
57450ee6061SAndrew J. Bennieston 	return queue_idx;
5752688fcb7SAndrew J. Bennieston }
5762688fcb7SAndrew J. Bennieston 
5776c5aa6fcSDenis Kirjanov static int xennet_xdp_xmit_one(struct net_device *dev,
5786c5aa6fcSDenis Kirjanov 			       struct netfront_queue *queue,
5796c5aa6fcSDenis Kirjanov 			       struct xdp_frame *xdpf)
5806c5aa6fcSDenis Kirjanov {
5816c5aa6fcSDenis Kirjanov 	struct netfront_info *np = netdev_priv(dev);
5826c5aa6fcSDenis Kirjanov 	struct netfront_stats *tx_stats = this_cpu_ptr(np->tx_stats);
5836c5aa6fcSDenis Kirjanov 	int notify;
5846c5aa6fcSDenis Kirjanov 
5856c5aa6fcSDenis Kirjanov 	xennet_make_first_txreq(queue, NULL,
5866c5aa6fcSDenis Kirjanov 				virt_to_page(xdpf->data),
5876c5aa6fcSDenis Kirjanov 				offset_in_page(xdpf->data),
5886c5aa6fcSDenis Kirjanov 				xdpf->len);
5896c5aa6fcSDenis Kirjanov 
5906c5aa6fcSDenis Kirjanov 	RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&queue->tx, notify);
5916c5aa6fcSDenis Kirjanov 	if (notify)
5926c5aa6fcSDenis Kirjanov 		notify_remote_via_irq(queue->tx_irq);
5936c5aa6fcSDenis Kirjanov 
5946c5aa6fcSDenis Kirjanov 	u64_stats_update_begin(&tx_stats->syncp);
5956c5aa6fcSDenis Kirjanov 	tx_stats->bytes += xdpf->len;
5966c5aa6fcSDenis Kirjanov 	tx_stats->packets++;
5976c5aa6fcSDenis Kirjanov 	u64_stats_update_end(&tx_stats->syncp);
5986c5aa6fcSDenis Kirjanov 
5996c5aa6fcSDenis Kirjanov 	xennet_tx_buf_gc(queue);
6006c5aa6fcSDenis Kirjanov 
6016c5aa6fcSDenis Kirjanov 	return 0;
6026c5aa6fcSDenis Kirjanov }
6036c5aa6fcSDenis Kirjanov 
6046c5aa6fcSDenis Kirjanov static int xennet_xdp_xmit(struct net_device *dev, int n,
6056c5aa6fcSDenis Kirjanov 			   struct xdp_frame **frames, u32 flags)
6066c5aa6fcSDenis Kirjanov {
6076c5aa6fcSDenis Kirjanov 	unsigned int num_queues = dev->real_num_tx_queues;
6086c5aa6fcSDenis Kirjanov 	struct netfront_info *np = netdev_priv(dev);
6096c5aa6fcSDenis Kirjanov 	struct netfront_queue *queue = NULL;
6106c5aa6fcSDenis Kirjanov 	unsigned long irq_flags;
611*fdc13979SLorenzo Bianconi 	int nxmit = 0;
612*fdc13979SLorenzo Bianconi 	int i;
6136c5aa6fcSDenis Kirjanov 
6146c5aa6fcSDenis Kirjanov 	if (unlikely(flags & ~XDP_XMIT_FLAGS_MASK))
6156c5aa6fcSDenis Kirjanov 		return -EINVAL;
6166c5aa6fcSDenis Kirjanov 
6176c5aa6fcSDenis Kirjanov 	queue = &np->queues[smp_processor_id() % num_queues];
6186c5aa6fcSDenis Kirjanov 
6196c5aa6fcSDenis Kirjanov 	spin_lock_irqsave(&queue->tx_lock, irq_flags);
6206c5aa6fcSDenis Kirjanov 	for (i = 0; i < n; i++) {
6216c5aa6fcSDenis Kirjanov 		struct xdp_frame *xdpf = frames[i];
6226c5aa6fcSDenis Kirjanov 
6236c5aa6fcSDenis Kirjanov 		if (!xdpf)
6246c5aa6fcSDenis Kirjanov 			continue;
625*fdc13979SLorenzo Bianconi 		if (xennet_xdp_xmit_one(dev, queue, xdpf))
626*fdc13979SLorenzo Bianconi 			break;
627*fdc13979SLorenzo Bianconi 		nxmit++;
6286c5aa6fcSDenis Kirjanov 	}
6296c5aa6fcSDenis Kirjanov 	spin_unlock_irqrestore(&queue->tx_lock, irq_flags);
6306c5aa6fcSDenis Kirjanov 
631*fdc13979SLorenzo Bianconi 	return nxmit;
6326c5aa6fcSDenis Kirjanov }
6336c5aa6fcSDenis Kirjanov 
6346c5aa6fcSDenis Kirjanov 
63530c5d7f0SJulien Grall #define MAX_XEN_SKB_FRAGS (65536 / XEN_PAGE_SIZE + 1)
63630c5d7f0SJulien Grall 
63724a94b3cSLuc Van Oostenryck static netdev_tx_t xennet_start_xmit(struct sk_buff *skb, struct net_device *dev)
6380d160211SJeremy Fitzhardinge {
6390d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
640900e1833SDavid Vrabel 	struct netfront_stats *tx_stats = this_cpu_ptr(np->tx_stats);
641a55e8bb8SDavid Vrabel 	struct xen_netif_tx_request *tx, *first_tx;
642a55e8bb8SDavid Vrabel 	unsigned int i;
6430d160211SJeremy Fitzhardinge 	int notify;
644f36c3747SIan Campbell 	int slots;
645a55e8bb8SDavid Vrabel 	struct page *page;
646a55e8bb8SDavid Vrabel 	unsigned int offset;
647a55e8bb8SDavid Vrabel 	unsigned int len;
648cf66f9d4SKonrad Rzeszutek Wilk 	unsigned long flags;
6492688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = NULL;
6502688fcb7SAndrew J. Bennieston 	unsigned int num_queues = dev->real_num_tx_queues;
6512688fcb7SAndrew J. Bennieston 	u16 queue_index;
652fd07160bSVitaly Kuznetsov 	struct sk_buff *nskb;
6532688fcb7SAndrew J. Bennieston 
6542688fcb7SAndrew J. Bennieston 	/* Drop the packet if no queues are set up */
6552688fcb7SAndrew J. Bennieston 	if (num_queues < 1)
6562688fcb7SAndrew J. Bennieston 		goto drop;
6572688fcb7SAndrew J. Bennieston 	/* Determine which queue to transmit this SKB on */
6582688fcb7SAndrew J. Bennieston 	queue_index = skb_get_queue_mapping(skb);
6592688fcb7SAndrew J. Bennieston 	queue = &np->queues[queue_index];
6600d160211SJeremy Fitzhardinge 
6619ecd1a75SWei Liu 	/* If skb->len is too big for wire format, drop skb and alert
6629ecd1a75SWei Liu 	 * user about misconfiguration.
6639ecd1a75SWei Liu 	 */
6649ecd1a75SWei Liu 	if (unlikely(skb->len > XEN_NETIF_MAX_TX_SIZE)) {
6659ecd1a75SWei Liu 		net_alert_ratelimited(
6669ecd1a75SWei Liu 			"xennet: skb->len = %u, too big for wire format\n",
6679ecd1a75SWei Liu 			skb->len);
6689ecd1a75SWei Liu 		goto drop;
6699ecd1a75SWei Liu 	}
6709ecd1a75SWei Liu 
671e84448d5SDavid Vrabel 	slots = xennet_count_skb_slots(skb);
67230c5d7f0SJulien Grall 	if (unlikely(slots > MAX_XEN_SKB_FRAGS + 1)) {
67397a6d1bbSZoltan Kiss 		net_dbg_ratelimited("xennet: skb rides the rocket: %d slots, %d bytes\n",
67497a6d1bbSZoltan Kiss 				    slots, skb->len);
67597a6d1bbSZoltan Kiss 		if (skb_linearize(skb))
6760d160211SJeremy Fitzhardinge 			goto drop;
6770d160211SJeremy Fitzhardinge 	}
6780d160211SJeremy Fitzhardinge 
679a55e8bb8SDavid Vrabel 	page = virt_to_page(skb->data);
680a55e8bb8SDavid Vrabel 	offset = offset_in_page(skb->data);
681fd07160bSVitaly Kuznetsov 
682fd07160bSVitaly Kuznetsov 	/* The first req should be at least ETH_HLEN size or the packet will be
683fd07160bSVitaly Kuznetsov 	 * dropped by netback.
684fd07160bSVitaly Kuznetsov 	 */
685fd07160bSVitaly Kuznetsov 	if (unlikely(PAGE_SIZE - offset < ETH_HLEN)) {
686fd07160bSVitaly Kuznetsov 		nskb = skb_copy(skb, GFP_ATOMIC);
687fd07160bSVitaly Kuznetsov 		if (!nskb)
688fd07160bSVitaly Kuznetsov 			goto drop;
68962f3250fSEric Dumazet 		dev_consume_skb_any(skb);
690fd07160bSVitaly Kuznetsov 		skb = nskb;
691fd07160bSVitaly Kuznetsov 		page = virt_to_page(skb->data);
692fd07160bSVitaly Kuznetsov 		offset = offset_in_page(skb->data);
693fd07160bSVitaly Kuznetsov 	}
694fd07160bSVitaly Kuznetsov 
695a55e8bb8SDavid Vrabel 	len = skb_headlen(skb);
696a55e8bb8SDavid Vrabel 
6972688fcb7SAndrew J. Bennieston 	spin_lock_irqsave(&queue->tx_lock, flags);
6980d160211SJeremy Fitzhardinge 
6990d160211SJeremy Fitzhardinge 	if (unlikely(!netif_carrier_ok(dev) ||
700f36c3747SIan Campbell 		     (slots > 1 && !xennet_can_sg(dev)) ||
7018b86a61dSJohannes Berg 		     netif_needs_gso(skb, netif_skb_features(skb)))) {
7022688fcb7SAndrew J. Bennieston 		spin_unlock_irqrestore(&queue->tx_lock, flags);
7030d160211SJeremy Fitzhardinge 		goto drop;
7040d160211SJeremy Fitzhardinge 	}
7050d160211SJeremy Fitzhardinge 
706a55e8bb8SDavid Vrabel 	/* First request for the linear area. */
70730c5d7f0SJulien Grall 	first_tx = tx = xennet_make_first_txreq(queue, skb,
708a55e8bb8SDavid Vrabel 						page, offset, len);
70930c5d7f0SJulien Grall 	offset += tx->size;
71030c5d7f0SJulien Grall 	if (offset == PAGE_SIZE) {
711a55e8bb8SDavid Vrabel 		page++;
712a55e8bb8SDavid Vrabel 		offset = 0;
71330c5d7f0SJulien Grall 	}
714a55e8bb8SDavid Vrabel 	len -= tx->size;
7150d160211SJeremy Fitzhardinge 
7160d160211SJeremy Fitzhardinge 	if (skb->ip_summed == CHECKSUM_PARTIAL)
7170d160211SJeremy Fitzhardinge 		/* local packet? */
718f942dc25SIan Campbell 		tx->flags |= XEN_NETTXF_csum_blank | XEN_NETTXF_data_validated;
7190d160211SJeremy Fitzhardinge 	else if (skb->ip_summed == CHECKSUM_UNNECESSARY)
7200d160211SJeremy Fitzhardinge 		/* remote but checksummed. */
721f942dc25SIan Campbell 		tx->flags |= XEN_NETTXF_data_validated;
7220d160211SJeremy Fitzhardinge 
723a55e8bb8SDavid Vrabel 	/* Optional extra info after the first request. */
7240d160211SJeremy Fitzhardinge 	if (skb_shinfo(skb)->gso_size) {
7250d160211SJeremy Fitzhardinge 		struct xen_netif_extra_info *gso;
7260d160211SJeremy Fitzhardinge 
7270d160211SJeremy Fitzhardinge 		gso = (struct xen_netif_extra_info *)
728a55e8bb8SDavid Vrabel 			RING_GET_REQUEST(&queue->tx, queue->tx.req_prod_pvt++);
7290d160211SJeremy Fitzhardinge 
730f942dc25SIan Campbell 		tx->flags |= XEN_NETTXF_extra_info;
7310d160211SJeremy Fitzhardinge 
7320d160211SJeremy Fitzhardinge 		gso->u.gso.size = skb_shinfo(skb)->gso_size;
7332c0057deSPaul Durrant 		gso->u.gso.type = (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV6) ?
7342c0057deSPaul Durrant 			XEN_NETIF_GSO_TYPE_TCPV6 :
7352c0057deSPaul Durrant 			XEN_NETIF_GSO_TYPE_TCPV4;
7360d160211SJeremy Fitzhardinge 		gso->u.gso.pad = 0;
7370d160211SJeremy Fitzhardinge 		gso->u.gso.features = 0;
7380d160211SJeremy Fitzhardinge 
7390d160211SJeremy Fitzhardinge 		gso->type = XEN_NETIF_EXTRA_TYPE_GSO;
7400d160211SJeremy Fitzhardinge 		gso->flags = 0;
7410d160211SJeremy Fitzhardinge 	}
7420d160211SJeremy Fitzhardinge 
743a55e8bb8SDavid Vrabel 	/* Requests for the rest of the linear area. */
744a55e8bb8SDavid Vrabel 	tx = xennet_make_txreqs(queue, tx, skb, page, offset, len);
7450d160211SJeremy Fitzhardinge 
746a55e8bb8SDavid Vrabel 	/* Requests for all the frags. */
747a55e8bb8SDavid Vrabel 	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
748a55e8bb8SDavid Vrabel 		skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
749b54c9d5bSJonathan Lemon 		tx = xennet_make_txreqs(queue, tx, skb, skb_frag_page(frag),
750b54c9d5bSJonathan Lemon 					skb_frag_off(frag),
751a55e8bb8SDavid Vrabel 					skb_frag_size(frag));
752a55e8bb8SDavid Vrabel 	}
753a55e8bb8SDavid Vrabel 
754a55e8bb8SDavid Vrabel 	/* First request has the packet length. */
755a55e8bb8SDavid Vrabel 	first_tx->size = skb->len;
7560d160211SJeremy Fitzhardinge 
75791ffb9d3SDaniel Drown 	/* timestamp packet in software */
75891ffb9d3SDaniel Drown 	skb_tx_timestamp(skb);
75991ffb9d3SDaniel Drown 
7602688fcb7SAndrew J. Bennieston 	RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&queue->tx, notify);
7610d160211SJeremy Fitzhardinge 	if (notify)
7622688fcb7SAndrew J. Bennieston 		notify_remote_via_irq(queue->tx_irq);
7630d160211SJeremy Fitzhardinge 
764900e1833SDavid Vrabel 	u64_stats_update_begin(&tx_stats->syncp);
765900e1833SDavid Vrabel 	tx_stats->bytes += skb->len;
766900e1833SDavid Vrabel 	tx_stats->packets++;
767900e1833SDavid Vrabel 	u64_stats_update_end(&tx_stats->syncp);
76810a273a6SJeremy Fitzhardinge 
76910a273a6SJeremy Fitzhardinge 	/* Note: It is not safe to access skb after xennet_tx_buf_gc()! */
7702688fcb7SAndrew J. Bennieston 	xennet_tx_buf_gc(queue);
7710d160211SJeremy Fitzhardinge 
7722688fcb7SAndrew J. Bennieston 	if (!netfront_tx_slot_available(queue))
7732688fcb7SAndrew J. Bennieston 		netif_tx_stop_queue(netdev_get_tx_queue(dev, queue->id));
7740d160211SJeremy Fitzhardinge 
7752688fcb7SAndrew J. Bennieston 	spin_unlock_irqrestore(&queue->tx_lock, flags);
7760d160211SJeremy Fitzhardinge 
7776ed10654SPatrick McHardy 	return NETDEV_TX_OK;
7780d160211SJeremy Fitzhardinge 
7790d160211SJeremy Fitzhardinge  drop:
78009f75cd7SJeff Garzik 	dev->stats.tx_dropped++;
781979de8a0SEric W. Biederman 	dev_kfree_skb_any(skb);
7826ed10654SPatrick McHardy 	return NETDEV_TX_OK;
7830d160211SJeremy Fitzhardinge }
7840d160211SJeremy Fitzhardinge 
7850d160211SJeremy Fitzhardinge static int xennet_close(struct net_device *dev)
7860d160211SJeremy Fitzhardinge {
7870d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
7882688fcb7SAndrew J. Bennieston 	unsigned int num_queues = dev->real_num_tx_queues;
7892688fcb7SAndrew J. Bennieston 	unsigned int i;
7902688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue;
7912688fcb7SAndrew J. Bennieston 	netif_tx_stop_all_queues(np->netdev);
7922688fcb7SAndrew J. Bennieston 	for (i = 0; i < num_queues; ++i) {
7932688fcb7SAndrew J. Bennieston 		queue = &np->queues[i];
7942688fcb7SAndrew J. Bennieston 		napi_disable(&queue->napi);
7952688fcb7SAndrew J. Bennieston 	}
7960d160211SJeremy Fitzhardinge 	return 0;
7970d160211SJeremy Fitzhardinge }
7980d160211SJeremy Fitzhardinge 
7992688fcb7SAndrew J. Bennieston static void xennet_move_rx_slot(struct netfront_queue *queue, struct sk_buff *skb,
8000d160211SJeremy Fitzhardinge 				grant_ref_t ref)
8010d160211SJeremy Fitzhardinge {
8022688fcb7SAndrew J. Bennieston 	int new = xennet_rxidx(queue->rx.req_prod_pvt);
8030d160211SJeremy Fitzhardinge 
8042688fcb7SAndrew J. Bennieston 	BUG_ON(queue->rx_skbs[new]);
8052688fcb7SAndrew J. Bennieston 	queue->rx_skbs[new] = skb;
8062688fcb7SAndrew J. Bennieston 	queue->grant_rx_ref[new] = ref;
8072688fcb7SAndrew J. Bennieston 	RING_GET_REQUEST(&queue->rx, queue->rx.req_prod_pvt)->id = new;
8082688fcb7SAndrew J. Bennieston 	RING_GET_REQUEST(&queue->rx, queue->rx.req_prod_pvt)->gref = ref;
8092688fcb7SAndrew J. Bennieston 	queue->rx.req_prod_pvt++;
8100d160211SJeremy Fitzhardinge }
8110d160211SJeremy Fitzhardinge 
8122688fcb7SAndrew J. Bennieston static int xennet_get_extras(struct netfront_queue *queue,
8130d160211SJeremy Fitzhardinge 			     struct xen_netif_extra_info *extras,
8140d160211SJeremy Fitzhardinge 			     RING_IDX rp)
8150d160211SJeremy Fitzhardinge 
8160d160211SJeremy Fitzhardinge {
8170d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info *extra;
8182688fcb7SAndrew J. Bennieston 	struct device *dev = &queue->info->netdev->dev;
8192688fcb7SAndrew J. Bennieston 	RING_IDX cons = queue->rx.rsp_cons;
8200d160211SJeremy Fitzhardinge 	int err = 0;
8210d160211SJeremy Fitzhardinge 
8220d160211SJeremy Fitzhardinge 	do {
8230d160211SJeremy Fitzhardinge 		struct sk_buff *skb;
8240d160211SJeremy Fitzhardinge 		grant_ref_t ref;
8250d160211SJeremy Fitzhardinge 
8260d160211SJeremy Fitzhardinge 		if (unlikely(cons + 1 == rp)) {
8270d160211SJeremy Fitzhardinge 			if (net_ratelimit())
8280d160211SJeremy Fitzhardinge 				dev_warn(dev, "Missing extra info\n");
8290d160211SJeremy Fitzhardinge 			err = -EBADR;
8300d160211SJeremy Fitzhardinge 			break;
8310d160211SJeremy Fitzhardinge 		}
8320d160211SJeremy Fitzhardinge 
8330d160211SJeremy Fitzhardinge 		extra = (struct xen_netif_extra_info *)
8342688fcb7SAndrew J. Bennieston 			RING_GET_RESPONSE(&queue->rx, ++cons);
8350d160211SJeremy Fitzhardinge 
8360d160211SJeremy Fitzhardinge 		if (unlikely(!extra->type ||
8370d160211SJeremy Fitzhardinge 			     extra->type >= XEN_NETIF_EXTRA_TYPE_MAX)) {
8380d160211SJeremy Fitzhardinge 			if (net_ratelimit())
8390d160211SJeremy Fitzhardinge 				dev_warn(dev, "Invalid extra type: %d\n",
8400d160211SJeremy Fitzhardinge 					extra->type);
8410d160211SJeremy Fitzhardinge 			err = -EINVAL;
8420d160211SJeremy Fitzhardinge 		} else {
8430d160211SJeremy Fitzhardinge 			memcpy(&extras[extra->type - 1], extra,
8440d160211SJeremy Fitzhardinge 			       sizeof(*extra));
8450d160211SJeremy Fitzhardinge 		}
8460d160211SJeremy Fitzhardinge 
8472688fcb7SAndrew J. Bennieston 		skb = xennet_get_rx_skb(queue, cons);
8482688fcb7SAndrew J. Bennieston 		ref = xennet_get_rx_ref(queue, cons);
8492688fcb7SAndrew J. Bennieston 		xennet_move_rx_slot(queue, skb, ref);
8500d160211SJeremy Fitzhardinge 	} while (extra->flags & XEN_NETIF_EXTRA_FLAG_MORE);
8510d160211SJeremy Fitzhardinge 
8522688fcb7SAndrew J. Bennieston 	queue->rx.rsp_cons = cons;
8530d160211SJeremy Fitzhardinge 	return err;
8540d160211SJeremy Fitzhardinge }
8550d160211SJeremy Fitzhardinge 
8566c5aa6fcSDenis Kirjanov static u32 xennet_run_xdp(struct netfront_queue *queue, struct page *pdata,
8576c5aa6fcSDenis Kirjanov 		   struct xen_netif_rx_response *rx, struct bpf_prog *prog,
8586c5aa6fcSDenis Kirjanov 		   struct xdp_buff *xdp, bool *need_xdp_flush)
8596c5aa6fcSDenis Kirjanov {
8606c5aa6fcSDenis Kirjanov 	struct xdp_frame *xdpf;
8616c5aa6fcSDenis Kirjanov 	u32 len = rx->status;
862e44f65fdSColin Ian King 	u32 act;
8636c5aa6fcSDenis Kirjanov 	int err;
8646c5aa6fcSDenis Kirjanov 
86543b5169dSLorenzo Bianconi 	xdp_init_buff(xdp, XEN_PAGE_SIZE - XDP_PACKET_HEADROOM,
86643b5169dSLorenzo Bianconi 		      &queue->xdp_rxq);
867be9df4afSLorenzo Bianconi 	xdp_prepare_buff(xdp, page_address(pdata), XDP_PACKET_HEADROOM,
868be9df4afSLorenzo Bianconi 			 len, false);
8696c5aa6fcSDenis Kirjanov 
8706c5aa6fcSDenis Kirjanov 	act = bpf_prog_run_xdp(prog, xdp);
8716c5aa6fcSDenis Kirjanov 	switch (act) {
8726c5aa6fcSDenis Kirjanov 	case XDP_TX:
8736c5aa6fcSDenis Kirjanov 		get_page(pdata);
8746c5aa6fcSDenis Kirjanov 		xdpf = xdp_convert_buff_to_frame(xdp);
8756c5aa6fcSDenis Kirjanov 		err = xennet_xdp_xmit(queue->info->netdev, 1, &xdpf, 0);
876*fdc13979SLorenzo Bianconi 		if (unlikely(!err))
877*fdc13979SLorenzo Bianconi 			xdp_return_frame_rx_napi(xdpf);
878*fdc13979SLorenzo Bianconi 		else if (unlikely(err < 0))
8796c5aa6fcSDenis Kirjanov 			trace_xdp_exception(queue->info->netdev, prog, act);
8806c5aa6fcSDenis Kirjanov 		break;
8816c5aa6fcSDenis Kirjanov 	case XDP_REDIRECT:
8826c5aa6fcSDenis Kirjanov 		get_page(pdata);
8836c5aa6fcSDenis Kirjanov 		err = xdp_do_redirect(queue->info->netdev, xdp, prog);
8846c5aa6fcSDenis Kirjanov 		*need_xdp_flush = true;
8856c5aa6fcSDenis Kirjanov 		if (unlikely(err))
8866c5aa6fcSDenis Kirjanov 			trace_xdp_exception(queue->info->netdev, prog, act);
8876c5aa6fcSDenis Kirjanov 		break;
8886c5aa6fcSDenis Kirjanov 	case XDP_PASS:
8896c5aa6fcSDenis Kirjanov 	case XDP_DROP:
8906c5aa6fcSDenis Kirjanov 		break;
8916c5aa6fcSDenis Kirjanov 
8926c5aa6fcSDenis Kirjanov 	case XDP_ABORTED:
8936c5aa6fcSDenis Kirjanov 		trace_xdp_exception(queue->info->netdev, prog, act);
8946c5aa6fcSDenis Kirjanov 		break;
8956c5aa6fcSDenis Kirjanov 
8966c5aa6fcSDenis Kirjanov 	default:
8976c5aa6fcSDenis Kirjanov 		bpf_warn_invalid_xdp_action(act);
8986c5aa6fcSDenis Kirjanov 	}
8996c5aa6fcSDenis Kirjanov 
9006c5aa6fcSDenis Kirjanov 	return act;
9016c5aa6fcSDenis Kirjanov }
9026c5aa6fcSDenis Kirjanov 
9032688fcb7SAndrew J. Bennieston static int xennet_get_responses(struct netfront_queue *queue,
9040d160211SJeremy Fitzhardinge 				struct netfront_rx_info *rinfo, RING_IDX rp,
9056c5aa6fcSDenis Kirjanov 				struct sk_buff_head *list,
9066c5aa6fcSDenis Kirjanov 				bool *need_xdp_flush)
9070d160211SJeremy Fitzhardinge {
9080d160211SJeremy Fitzhardinge 	struct xen_netif_rx_response *rx = &rinfo->rx;
9096c5aa6fcSDenis Kirjanov 	int max = XEN_NETIF_NR_SLOTS_MIN + (rx->status <= RX_COPY_THRESHOLD);
9102688fcb7SAndrew J. Bennieston 	RING_IDX cons = queue->rx.rsp_cons;
9112688fcb7SAndrew J. Bennieston 	struct sk_buff *skb = xennet_get_rx_skb(queue, cons);
9126c5aa6fcSDenis Kirjanov 	struct xen_netif_extra_info *extras = rinfo->extras;
9132688fcb7SAndrew J. Bennieston 	grant_ref_t ref = xennet_get_rx_ref(queue, cons);
9146c5aa6fcSDenis Kirjanov 	struct device *dev = &queue->info->netdev->dev;
9156c5aa6fcSDenis Kirjanov 	struct bpf_prog *xdp_prog;
9166c5aa6fcSDenis Kirjanov 	struct xdp_buff xdp;
9176c5aa6fcSDenis Kirjanov 	unsigned long ret;
9187158ff6dSWei Liu 	int slots = 1;
9190d160211SJeremy Fitzhardinge 	int err = 0;
9206c5aa6fcSDenis Kirjanov 	u32 verdict;
9210d160211SJeremy Fitzhardinge 
922f942dc25SIan Campbell 	if (rx->flags & XEN_NETRXF_extra_info) {
9232688fcb7SAndrew J. Bennieston 		err = xennet_get_extras(queue, extras, rp);
9246c5aa6fcSDenis Kirjanov 		if (!err) {
9256c5aa6fcSDenis Kirjanov 			if (extras[XEN_NETIF_EXTRA_TYPE_XDP - 1].type) {
9266c5aa6fcSDenis Kirjanov 				struct xen_netif_extra_info *xdp;
9276c5aa6fcSDenis Kirjanov 
9286c5aa6fcSDenis Kirjanov 				xdp = &extras[XEN_NETIF_EXTRA_TYPE_XDP - 1];
9296c5aa6fcSDenis Kirjanov 				rx->offset = xdp->u.xdp.headroom;
9306c5aa6fcSDenis Kirjanov 			}
9316c5aa6fcSDenis Kirjanov 		}
9322688fcb7SAndrew J. Bennieston 		cons = queue->rx.rsp_cons;
9330d160211SJeremy Fitzhardinge 	}
9340d160211SJeremy Fitzhardinge 
9350d160211SJeremy Fitzhardinge 	for (;;) {
9360d160211SJeremy Fitzhardinge 		if (unlikely(rx->status < 0 ||
93730c5d7f0SJulien Grall 			     rx->offset + rx->status > XEN_PAGE_SIZE)) {
9380d160211SJeremy Fitzhardinge 			if (net_ratelimit())
9396c10127dSJulien Grall 				dev_warn(dev, "rx->offset: %u, size: %d\n",
9400d160211SJeremy Fitzhardinge 					 rx->offset, rx->status);
9412688fcb7SAndrew J. Bennieston 			xennet_move_rx_slot(queue, skb, ref);
9420d160211SJeremy Fitzhardinge 			err = -EINVAL;
9430d160211SJeremy Fitzhardinge 			goto next;
9440d160211SJeremy Fitzhardinge 		}
9450d160211SJeremy Fitzhardinge 
9460d160211SJeremy Fitzhardinge 		/*
9470d160211SJeremy Fitzhardinge 		 * This definitely indicates a bug, either in this driver or in
9480d160211SJeremy Fitzhardinge 		 * the backend driver. In future this should flag the bad
949697089dcSWei Liu 		 * situation to the system controller to reboot the backend.
9500d160211SJeremy Fitzhardinge 		 */
9510d160211SJeremy Fitzhardinge 		if (ref == GRANT_INVALID_REF) {
9520d160211SJeremy Fitzhardinge 			if (net_ratelimit())
9530d160211SJeremy Fitzhardinge 				dev_warn(dev, "Bad rx response id %d.\n",
9540d160211SJeremy Fitzhardinge 					 rx->id);
9550d160211SJeremy Fitzhardinge 			err = -EINVAL;
9560d160211SJeremy Fitzhardinge 			goto next;
9570d160211SJeremy Fitzhardinge 		}
9580d160211SJeremy Fitzhardinge 
9590d160211SJeremy Fitzhardinge 		ret = gnttab_end_foreign_access_ref(ref, 0);
9600d160211SJeremy Fitzhardinge 		BUG_ON(!ret);
9610d160211SJeremy Fitzhardinge 
9622688fcb7SAndrew J. Bennieston 		gnttab_release_grant_reference(&queue->gref_rx_head, ref);
9630d160211SJeremy Fitzhardinge 
9646c5aa6fcSDenis Kirjanov 		rcu_read_lock();
9656c5aa6fcSDenis Kirjanov 		xdp_prog = rcu_dereference(queue->xdp_prog);
9666c5aa6fcSDenis Kirjanov 		if (xdp_prog) {
9676c5aa6fcSDenis Kirjanov 			if (!(rx->flags & XEN_NETRXF_more_data)) {
9686c5aa6fcSDenis Kirjanov 				/* currently only a single page contains data */
9696c5aa6fcSDenis Kirjanov 				verdict = xennet_run_xdp(queue,
9706c5aa6fcSDenis Kirjanov 							 skb_frag_page(&skb_shinfo(skb)->frags[0]),
9716c5aa6fcSDenis Kirjanov 							 rx, xdp_prog, &xdp, need_xdp_flush);
9726c5aa6fcSDenis Kirjanov 				if (verdict != XDP_PASS)
9736c5aa6fcSDenis Kirjanov 					err = -EINVAL;
9746c5aa6fcSDenis Kirjanov 			} else {
9756c5aa6fcSDenis Kirjanov 				/* drop the frame */
9766c5aa6fcSDenis Kirjanov 				err = -EINVAL;
9776c5aa6fcSDenis Kirjanov 			}
9786c5aa6fcSDenis Kirjanov 		}
9796c5aa6fcSDenis Kirjanov 		rcu_read_unlock();
9800d160211SJeremy Fitzhardinge next:
9816c5aa6fcSDenis Kirjanov 		__skb_queue_tail(list, skb);
982f942dc25SIan Campbell 		if (!(rx->flags & XEN_NETRXF_more_data))
9830d160211SJeremy Fitzhardinge 			break;
9840d160211SJeremy Fitzhardinge 
9857158ff6dSWei Liu 		if (cons + slots == rp) {
9860d160211SJeremy Fitzhardinge 			if (net_ratelimit())
9877158ff6dSWei Liu 				dev_warn(dev, "Need more slots\n");
9880d160211SJeremy Fitzhardinge 			err = -ENOENT;
9890d160211SJeremy Fitzhardinge 			break;
9900d160211SJeremy Fitzhardinge 		}
9910d160211SJeremy Fitzhardinge 
9922688fcb7SAndrew J. Bennieston 		rx = RING_GET_RESPONSE(&queue->rx, cons + slots);
9932688fcb7SAndrew J. Bennieston 		skb = xennet_get_rx_skb(queue, cons + slots);
9942688fcb7SAndrew J. Bennieston 		ref = xennet_get_rx_ref(queue, cons + slots);
9957158ff6dSWei Liu 		slots++;
9960d160211SJeremy Fitzhardinge 	}
9970d160211SJeremy Fitzhardinge 
9987158ff6dSWei Liu 	if (unlikely(slots > max)) {
9990d160211SJeremy Fitzhardinge 		if (net_ratelimit())
1000697089dcSWei Liu 			dev_warn(dev, "Too many slots\n");
10010d160211SJeremy Fitzhardinge 		err = -E2BIG;
10020d160211SJeremy Fitzhardinge 	}
10030d160211SJeremy Fitzhardinge 
10040d160211SJeremy Fitzhardinge 	if (unlikely(err))
10052688fcb7SAndrew J. Bennieston 		queue->rx.rsp_cons = cons + slots;
10060d160211SJeremy Fitzhardinge 
10070d160211SJeremy Fitzhardinge 	return err;
10080d160211SJeremy Fitzhardinge }
10090d160211SJeremy Fitzhardinge 
10100d160211SJeremy Fitzhardinge static int xennet_set_skb_gso(struct sk_buff *skb,
10110d160211SJeremy Fitzhardinge 			      struct xen_netif_extra_info *gso)
10120d160211SJeremy Fitzhardinge {
10130d160211SJeremy Fitzhardinge 	if (!gso->u.gso.size) {
10140d160211SJeremy Fitzhardinge 		if (net_ratelimit())
1015383eda32SJoe Perches 			pr_warn("GSO size must not be zero\n");
10160d160211SJeremy Fitzhardinge 		return -EINVAL;
10170d160211SJeremy Fitzhardinge 	}
10180d160211SJeremy Fitzhardinge 
10192c0057deSPaul Durrant 	if (gso->u.gso.type != XEN_NETIF_GSO_TYPE_TCPV4 &&
10202c0057deSPaul Durrant 	    gso->u.gso.type != XEN_NETIF_GSO_TYPE_TCPV6) {
10210d160211SJeremy Fitzhardinge 		if (net_ratelimit())
1022383eda32SJoe Perches 			pr_warn("Bad GSO type %d\n", gso->u.gso.type);
10230d160211SJeremy Fitzhardinge 		return -EINVAL;
10240d160211SJeremy Fitzhardinge 	}
10250d160211SJeremy Fitzhardinge 
10260d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_size = gso->u.gso.size;
10272c0057deSPaul Durrant 	skb_shinfo(skb)->gso_type =
10282c0057deSPaul Durrant 		(gso->u.gso.type == XEN_NETIF_GSO_TYPE_TCPV4) ?
10292c0057deSPaul Durrant 		SKB_GSO_TCPV4 :
10302c0057deSPaul Durrant 		SKB_GSO_TCPV6;
10310d160211SJeremy Fitzhardinge 
10320d160211SJeremy Fitzhardinge 	/* Header must be checked, and gso_segs computed. */
10330d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
10340d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_segs = 0;
10350d160211SJeremy Fitzhardinge 
10360d160211SJeremy Fitzhardinge 	return 0;
10370d160211SJeremy Fitzhardinge }
10380d160211SJeremy Fitzhardinge 
1039a761129eSDongli Zhang static int xennet_fill_frags(struct netfront_queue *queue,
10400d160211SJeremy Fitzhardinge 			     struct sk_buff *skb,
10410d160211SJeremy Fitzhardinge 			     struct sk_buff_head *list)
10420d160211SJeremy Fitzhardinge {
10432688fcb7SAndrew J. Bennieston 	RING_IDX cons = queue->rx.rsp_cons;
10440d160211SJeremy Fitzhardinge 	struct sk_buff *nskb;
10450d160211SJeremy Fitzhardinge 
10460d160211SJeremy Fitzhardinge 	while ((nskb = __skb_dequeue(list))) {
10470d160211SJeremy Fitzhardinge 		struct xen_netif_rx_response *rx =
10482688fcb7SAndrew J. Bennieston 			RING_GET_RESPONSE(&queue->rx, ++cons);
104901c68026SIan Campbell 		skb_frag_t *nfrag = &skb_shinfo(nskb)->frags[0];
10500d160211SJeremy Fitzhardinge 
1051d472b3a6SJuergen Gross 		if (skb_shinfo(skb)->nr_frags == MAX_SKB_FRAGS) {
1052093b9c71SJan Beulich 			unsigned int pull_to = NETFRONT_SKB_CB(skb)->pull_to;
10530d160211SJeremy Fitzhardinge 
1054d81c5054SJuergen Gross 			BUG_ON(pull_to < skb_headlen(skb));
1055093b9c71SJan Beulich 			__pskb_pull_tail(skb, pull_to - skb_headlen(skb));
1056093b9c71SJan Beulich 		}
1057ad4f15dcSJuergen Gross 		if (unlikely(skb_shinfo(skb)->nr_frags >= MAX_SKB_FRAGS)) {
105800b36850SDongli Zhang 			queue->rx.rsp_cons = ++cons + skb_queue_len(list);
1059ad4f15dcSJuergen Gross 			kfree_skb(nskb);
1060a761129eSDongli Zhang 			return -ENOENT;
1061ad4f15dcSJuergen Gross 		}
1062093b9c71SJan Beulich 
1063d472b3a6SJuergen Gross 		skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags,
1064d472b3a6SJuergen Gross 				skb_frag_page(nfrag),
1065093b9c71SJan Beulich 				rx->offset, rx->status, PAGE_SIZE);
10660d160211SJeremy Fitzhardinge 
10670d160211SJeremy Fitzhardinge 		skb_shinfo(nskb)->nr_frags = 0;
10680d160211SJeremy Fitzhardinge 		kfree_skb(nskb);
10690d160211SJeremy Fitzhardinge 	}
10700d160211SJeremy Fitzhardinge 
1071a761129eSDongli Zhang 	queue->rx.rsp_cons = cons;
1072a761129eSDongli Zhang 
1073a761129eSDongli Zhang 	return 0;
10740d160211SJeremy Fitzhardinge }
10750d160211SJeremy Fitzhardinge 
1076e0ce4af9SIan Campbell static int checksum_setup(struct net_device *dev, struct sk_buff *skb)
10770d160211SJeremy Fitzhardinge {
1078b5cf66cdSPaul Durrant 	bool recalculate_partial_csum = false;
1079e0ce4af9SIan Campbell 
1080e0ce4af9SIan Campbell 	/*
1081e0ce4af9SIan Campbell 	 * A GSO SKB must be CHECKSUM_PARTIAL. However some buggy
1082e0ce4af9SIan Campbell 	 * peers can fail to set NETRXF_csum_blank when sending a GSO
1083e0ce4af9SIan Campbell 	 * frame. In this case force the SKB to CHECKSUM_PARTIAL and
1084e0ce4af9SIan Campbell 	 * recalculate the partial checksum.
1085e0ce4af9SIan Campbell 	 */
1086e0ce4af9SIan Campbell 	if (skb->ip_summed != CHECKSUM_PARTIAL && skb_is_gso(skb)) {
1087e0ce4af9SIan Campbell 		struct netfront_info *np = netdev_priv(dev);
10882688fcb7SAndrew J. Bennieston 		atomic_inc(&np->rx_gso_checksum_fixup);
1089e0ce4af9SIan Campbell 		skb->ip_summed = CHECKSUM_PARTIAL;
1090b5cf66cdSPaul Durrant 		recalculate_partial_csum = true;
1091e0ce4af9SIan Campbell 	}
1092e0ce4af9SIan Campbell 
1093e0ce4af9SIan Campbell 	/* A non-CHECKSUM_PARTIAL SKB does not require setup. */
1094e0ce4af9SIan Campbell 	if (skb->ip_summed != CHECKSUM_PARTIAL)
1095e0ce4af9SIan Campbell 		return 0;
10960d160211SJeremy Fitzhardinge 
1097b5cf66cdSPaul Durrant 	return skb_checksum_setup(skb, recalculate_partial_csum);
10980d160211SJeremy Fitzhardinge }
10990d160211SJeremy Fitzhardinge 
11002688fcb7SAndrew J. Bennieston static int handle_incoming_queue(struct netfront_queue *queue,
11010d160211SJeremy Fitzhardinge 				 struct sk_buff_head *rxq)
11020d160211SJeremy Fitzhardinge {
1103900e1833SDavid Vrabel 	struct netfront_stats *rx_stats = this_cpu_ptr(queue->info->rx_stats);
11040d160211SJeremy Fitzhardinge 	int packets_dropped = 0;
11050d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
11060d160211SJeremy Fitzhardinge 
11070d160211SJeremy Fitzhardinge 	while ((skb = __skb_dequeue(rxq)) != NULL) {
11083683243bSIan Campbell 		int pull_to = NETFRONT_SKB_CB(skb)->pull_to;
11090d160211SJeremy Fitzhardinge 
1110093b9c71SJan Beulich 		if (pull_to > skb_headlen(skb))
11113683243bSIan Campbell 			__pskb_pull_tail(skb, pull_to - skb_headlen(skb));
11120d160211SJeremy Fitzhardinge 
11130d160211SJeremy Fitzhardinge 		/* Ethernet work: Delayed to here as it peeks the header. */
11142688fcb7SAndrew J. Bennieston 		skb->protocol = eth_type_trans(skb, queue->info->netdev);
1115d554f73dSWei Liu 		skb_reset_network_header(skb);
11160d160211SJeremy Fitzhardinge 
11172688fcb7SAndrew J. Bennieston 		if (checksum_setup(queue->info->netdev, skb)) {
11180d160211SJeremy Fitzhardinge 			kfree_skb(skb);
11190d160211SJeremy Fitzhardinge 			packets_dropped++;
11202688fcb7SAndrew J. Bennieston 			queue->info->netdev->stats.rx_errors++;
11210d160211SJeremy Fitzhardinge 			continue;
11220d160211SJeremy Fitzhardinge 		}
11230d160211SJeremy Fitzhardinge 
1124900e1833SDavid Vrabel 		u64_stats_update_begin(&rx_stats->syncp);
1125900e1833SDavid Vrabel 		rx_stats->packets++;
1126900e1833SDavid Vrabel 		rx_stats->bytes += skb->len;
1127900e1833SDavid Vrabel 		u64_stats_update_end(&rx_stats->syncp);
11280d160211SJeremy Fitzhardinge 
11290d160211SJeremy Fitzhardinge 		/* Pass it up. */
11302688fcb7SAndrew J. Bennieston 		napi_gro_receive(&queue->napi, skb);
11310d160211SJeremy Fitzhardinge 	}
11320d160211SJeremy Fitzhardinge 
11330d160211SJeremy Fitzhardinge 	return packets_dropped;
11340d160211SJeremy Fitzhardinge }
11350d160211SJeremy Fitzhardinge 
/*
 * NAPI poll callback for one netfront queue.
 *
 * Under queue->rx_lock, walks the RX ring from rx.rsp_cons towards the
 * rsp_prod value sampled on entry, handling at most @budget packets.  The
 * skbs of each packet are gathered by xennet_get_responses(); packets that
 * assemble cleanly are queued on rxq and later handed to
 * handle_incoming_queue(), the skbs of failed packets are moved to errq and
 * purged.  RX buffers are replenished before returning.
 *
 * Returns the number of packets processed minus the count returned by
 * handle_incoming_queue() (its dropped packets).  When that is below
 * @budget, NAPI is completed and only re-scheduled if the final ring check
 * reports more responses.
 */
1136bea3348eSStephen Hemminger static int xennet_poll(struct napi_struct *napi, int budget)
11370d160211SJeremy Fitzhardinge {
11382688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = container_of(napi, struct netfront_queue, napi);
11392688fcb7SAndrew J. Bennieston 	struct net_device *dev = queue->info->netdev;
11400d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
11410d160211SJeremy Fitzhardinge 	struct netfront_rx_info rinfo;
11420d160211SJeremy Fitzhardinge 	struct xen_netif_rx_response *rx = &rinfo.rx;
11430d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info *extras = rinfo.extras;
11440d160211SJeremy Fitzhardinge 	RING_IDX i, rp;
1145bea3348eSStephen Hemminger 	int work_done;
	/* rxq: packets ready to pass up; errq: skbs of failed packets;
	 * tmpq: skbs of the packet currently being assembled.
	 */
11460d160211SJeremy Fitzhardinge 	struct sk_buff_head rxq;
11470d160211SJeremy Fitzhardinge 	struct sk_buff_head errq;
11480d160211SJeremy Fitzhardinge 	struct sk_buff_head tmpq;
11490d160211SJeremy Fitzhardinge 	int err;
11506c5aa6fcSDenis Kirjanov 	bool need_xdp_flush = false;
11510d160211SJeremy Fitzhardinge 
11522688fcb7SAndrew J. Bennieston 	spin_lock(&queue->rx_lock);
11530d160211SJeremy Fitzhardinge 
11540d160211SJeremy Fitzhardinge 	skb_queue_head_init(&rxq);
11550d160211SJeremy Fitzhardinge 	skb_queue_head_init(&errq);
11560d160211SJeremy Fitzhardinge 	skb_queue_head_init(&tmpq);
11570d160211SJeremy Fitzhardinge 
	/* Sample the producer index once; the loop below never goes past it. */
11582688fcb7SAndrew J. Bennieston 	rp = queue->rx.sring->rsp_prod;
11590d160211SJeremy Fitzhardinge 	rmb(); /* Ensure we see queued responses up to 'rp'. */
11600d160211SJeremy Fitzhardinge 
11612688fcb7SAndrew J. Bennieston 	i = queue->rx.rsp_cons;
11620d160211SJeremy Fitzhardinge 	work_done = 0;
11630d160211SJeremy Fitzhardinge 	while ((i != rp) && (work_done < budget)) {
		/* Work on a private copy of the response and a zeroed extras array. */
11642688fcb7SAndrew J. Bennieston 		memcpy(rx, RING_GET_RESPONSE(&queue->rx, i), sizeof(*rx));
11650d160211SJeremy Fitzhardinge 		memset(extras, 0, sizeof(rinfo.extras));
11660d160211SJeremy Fitzhardinge 
11676c5aa6fcSDenis Kirjanov 		err = xennet_get_responses(queue, &rinfo, rp, &tmpq,
11686c5aa6fcSDenis Kirjanov 					   &need_xdp_flush);
11690d160211SJeremy Fitzhardinge 
11700d160211SJeremy Fitzhardinge 		if (unlikely(err)) {
			/*
			 * Shared failure path: also entered by "goto err" from
			 * the GSO and frag failures further down.  Everything
			 * still on tmpq is moved to errq, the error is counted,
			 * and the loop index is re-read from rsp_cons.
			 * NOTE(review): this relies on rsp_cons already having
			 * been advanced past the bad packet (done explicitly
			 * at the GSO site; presumably done inside the helpers
			 * for the other two cases - confirm).
			 */
11710d160211SJeremy Fitzhardinge err:
11720d160211SJeremy Fitzhardinge 			while ((skb = __skb_dequeue(&tmpq)))
11730d160211SJeremy Fitzhardinge 				__skb_queue_tail(&errq, skb);
117409f75cd7SJeff Garzik 			dev->stats.rx_errors++;
11752688fcb7SAndrew J. Bennieston 			i = queue->rx.rsp_cons;
11760d160211SJeremy Fitzhardinge 			continue;
11770d160211SJeremy Fitzhardinge 		}
11780d160211SJeremy Fitzhardinge 
		/* The first skb on tmpq becomes the head skb of the packet. */
11790d160211SJeremy Fitzhardinge 		skb = __skb_dequeue(&tmpq);
11800d160211SJeremy Fitzhardinge 
11810d160211SJeremy Fitzhardinge 		if (extras[XEN_NETIF_EXTRA_TYPE_GSO - 1].type) {
11820d160211SJeremy Fitzhardinge 			struct xen_netif_extra_info *gso;
11830d160211SJeremy Fitzhardinge 			gso = &extras[XEN_NETIF_EXTRA_TYPE_GSO - 1];
11840d160211SJeremy Fitzhardinge 
11850d160211SJeremy Fitzhardinge 			if (unlikely(xennet_set_skb_gso(skb, gso))) {
				/* Put the head back, then advance rsp_cons by
				 * the number of skbs now on tmpq (head included)
				 * before taking the shared failure path.
				 */
11860d160211SJeremy Fitzhardinge 				__skb_queue_head(&tmpq, skb);
11872688fcb7SAndrew J. Bennieston 				queue->rx.rsp_cons += skb_queue_len(&tmpq);
11880d160211SJeremy Fitzhardinge 				goto err;
11890d160211SJeremy Fitzhardinge 			}
11900d160211SJeremy Fitzhardinge 		}
11910d160211SJeremy Fitzhardinge 
		/* pull_to is rx->status capped at RX_COPY_THRESHOLD (presumably
		 * the byte count later pulled into the linear area - confirm in
		 * handle_incoming_queue()).
		 */
11923683243bSIan Campbell 		NETFRONT_SKB_CB(skb)->pull_to = rx->status;
11933683243bSIan Campbell 		if (NETFRONT_SKB_CB(skb)->pull_to > RX_COPY_THRESHOLD)
11943683243bSIan Campbell 			NETFRONT_SKB_CB(skb)->pull_to = RX_COPY_THRESHOLD;
11950d160211SJeremy Fitzhardinge 
		/* Describe the first fragment using the response's offset and status. */
1196b54c9d5bSJonathan Lemon 		skb_frag_off_set(&skb_shinfo(skb)->frags[0], rx->offset);
11973683243bSIan Campbell 		skb_frag_size_set(&skb_shinfo(skb)->frags[0], rx->status);
11983683243bSIan Campbell 		skb->data_len = rx->status;
1199093b9c71SJan Beulich 		skb->len += rx->status;
12000d160211SJeremy Fitzhardinge 
1201a761129eSDongli Zhang 		if (unlikely(xennet_fill_frags(queue, skb, &tmpq)))
1202ad4f15dcSJuergen Gross 			goto err;
12030d160211SJeremy Fitzhardinge 
		/* csum_blank takes precedence over data_validated. */
1204f942dc25SIan Campbell 		if (rx->flags & XEN_NETRXF_csum_blank)
12050d160211SJeremy Fitzhardinge 			skb->ip_summed = CHECKSUM_PARTIAL;
1206f942dc25SIan Campbell 		else if (rx->flags & XEN_NETRXF_data_validated)
12070d160211SJeremy Fitzhardinge 			skb->ip_summed = CHECKSUM_UNNECESSARY;
12080d160211SJeremy Fitzhardinge 
12090d160211SJeremy Fitzhardinge 		__skb_queue_tail(&rxq, skb);
12100d160211SJeremy Fitzhardinge 
		/* Consume this response and count one packet of work. */
1211a761129eSDongli Zhang 		i = ++queue->rx.rsp_cons;
12120d160211SJeremy Fitzhardinge 		work_done++;
12130d160211SJeremy Fitzhardinge 	}
12146c5aa6fcSDenis Kirjanov 	if (need_xdp_flush)
12156c5aa6fcSDenis Kirjanov 		xdp_do_flush();
12160d160211SJeremy Fitzhardinge 
121756cfe5d0SWang Chen 	__skb_queue_purge(&errq);
12180d160211SJeremy Fitzhardinge 
	/* Packets dropped by handle_incoming_queue() do not count as work done. */
12192688fcb7SAndrew J. Bennieston 	work_done -= handle_incoming_queue(queue, &rxq);
12200d160211SJeremy Fitzhardinge 
12212688fcb7SAndrew J. Bennieston 	xennet_alloc_rx_buffers(queue);
12220d160211SJeremy Fitzhardinge 
12230d160211SJeremy Fitzhardinge 	if (work_done < budget) {
1224bea3348eSStephen Hemminger 		int more_to_do = 0;
1225bea3348eSStephen Hemminger 
12266ad20165SEric Dumazet 		napi_complete_done(napi, work_done);
12270d160211SJeremy Fitzhardinge 
		/* Re-check the ring after completing NAPI and re-schedule if
		 * the check reports outstanding responses.
		 */
12282688fcb7SAndrew J. Bennieston 		RING_FINAL_CHECK_FOR_RESPONSES(&queue->rx, more_to_do);
12296a6dc08fSDavid Vrabel 		if (more_to_do)
12306a6dc08fSDavid Vrabel 			napi_schedule(napi);
12310d160211SJeremy Fitzhardinge 	}
12320d160211SJeremy Fitzhardinge 
12332688fcb7SAndrew J. Bennieston 	spin_unlock(&queue->rx_lock);
12340d160211SJeremy Fitzhardinge 
1235bea3348eSStephen Hemminger 	return work_done;
12360d160211SJeremy Fitzhardinge }
12370d160211SJeremy Fitzhardinge 
12380d160211SJeremy Fitzhardinge static int xennet_change_mtu(struct net_device *dev, int mtu)
12390d160211SJeremy Fitzhardinge {
12400c36820eSJonathan Davies 	int max = xennet_can_sg(dev) ? XEN_NETIF_MAX_TX_SIZE : ETH_DATA_LEN;
12410d160211SJeremy Fitzhardinge 
12420d160211SJeremy Fitzhardinge 	if (mtu > max)
12430d160211SJeremy Fitzhardinge 		return -EINVAL;
12440d160211SJeremy Fitzhardinge 	dev->mtu = mtu;
12450d160211SJeremy Fitzhardinge 	return 0;
12460d160211SJeremy Fitzhardinge }
12470d160211SJeremy Fitzhardinge 
1248bc1f4470Sstephen hemminger static void xennet_get_stats64(struct net_device *dev,
1249e00f85beSstephen hemminger 			       struct rtnl_link_stats64 *tot)
1250e00f85beSstephen hemminger {
1251e00f85beSstephen hemminger 	struct netfront_info *np = netdev_priv(dev);
1252e00f85beSstephen hemminger 	int cpu;
1253e00f85beSstephen hemminger 
1254e00f85beSstephen hemminger 	for_each_possible_cpu(cpu) {
1255900e1833SDavid Vrabel 		struct netfront_stats *rx_stats = per_cpu_ptr(np->rx_stats, cpu);
1256900e1833SDavid Vrabel 		struct netfront_stats *tx_stats = per_cpu_ptr(np->tx_stats, cpu);
1257e00f85beSstephen hemminger 		u64 rx_packets, rx_bytes, tx_packets, tx_bytes;
1258e00f85beSstephen hemminger 		unsigned int start;
1259e00f85beSstephen hemminger 
1260e00f85beSstephen hemminger 		do {
1261900e1833SDavid Vrabel 			start = u64_stats_fetch_begin_irq(&tx_stats->syncp);
1262900e1833SDavid Vrabel 			tx_packets = tx_stats->packets;
1263900e1833SDavid Vrabel 			tx_bytes = tx_stats->bytes;
1264900e1833SDavid Vrabel 		} while (u64_stats_fetch_retry_irq(&tx_stats->syncp, start));
1265e00f85beSstephen hemminger 
1266900e1833SDavid Vrabel 		do {
1267900e1833SDavid Vrabel 			start = u64_stats_fetch_begin_irq(&rx_stats->syncp);
1268900e1833SDavid Vrabel 			rx_packets = rx_stats->packets;
1269900e1833SDavid Vrabel 			rx_bytes = rx_stats->bytes;
1270900e1833SDavid Vrabel 		} while (u64_stats_fetch_retry_irq(&rx_stats->syncp, start));
1271e00f85beSstephen hemminger 
1272e00f85beSstephen hemminger 		tot->rx_packets += rx_packets;
1273e00f85beSstephen hemminger 		tot->tx_packets += tx_packets;
1274e00f85beSstephen hemminger 		tot->rx_bytes   += rx_bytes;
1275e00f85beSstephen hemminger 		tot->tx_bytes   += tx_bytes;
1276e00f85beSstephen hemminger 	}
1277e00f85beSstephen hemminger 
1278e00f85beSstephen hemminger 	tot->rx_errors  = dev->stats.rx_errors;
1279e00f85beSstephen hemminger 	tot->tx_dropped = dev->stats.tx_dropped;
1280e00f85beSstephen hemminger }
1281e00f85beSstephen hemminger 
12822688fcb7SAndrew J. Bennieston static void xennet_release_tx_bufs(struct netfront_queue *queue)
12830d160211SJeremy Fitzhardinge {
12840d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
12850d160211SJeremy Fitzhardinge 	int i;
12860d160211SJeremy Fitzhardinge 
12870d160211SJeremy Fitzhardinge 	for (i = 0; i < NET_TX_RING_SIZE; i++) {
12880d160211SJeremy Fitzhardinge 		/* Skip over entries which are actually freelist references */
12892688fcb7SAndrew J. Bennieston 		if (skb_entry_is_link(&queue->tx_skbs[i]))
12900d160211SJeremy Fitzhardinge 			continue;
12910d160211SJeremy Fitzhardinge 
12922688fcb7SAndrew J. Bennieston 		skb = queue->tx_skbs[i].skb;
12932688fcb7SAndrew J. Bennieston 		get_page(queue->grant_tx_page[i]);
12942688fcb7SAndrew J. Bennieston 		gnttab_end_foreign_access(queue->grant_tx_ref[i],
1295cefe0078SAnnie Li 					  GNTMAP_readonly,
12962688fcb7SAndrew J. Bennieston 					  (unsigned long)page_address(queue->grant_tx_page[i]));
12972688fcb7SAndrew J. Bennieston 		queue->grant_tx_page[i] = NULL;
12982688fcb7SAndrew J. Bennieston 		queue->grant_tx_ref[i] = GRANT_INVALID_REF;
12992688fcb7SAndrew J. Bennieston 		add_id_to_freelist(&queue->tx_skb_freelist, queue->tx_skbs, i);
13000d160211SJeremy Fitzhardinge 		dev_kfree_skb_irq(skb);
13010d160211SJeremy Fitzhardinge 	}
13020d160211SJeremy Fitzhardinge }
13030d160211SJeremy Fitzhardinge 
13042688fcb7SAndrew J. Bennieston static void xennet_release_rx_bufs(struct netfront_queue *queue)
13050d160211SJeremy Fitzhardinge {
13060d160211SJeremy Fitzhardinge 	int id, ref;
13070d160211SJeremy Fitzhardinge 
13082688fcb7SAndrew J. Bennieston 	spin_lock_bh(&queue->rx_lock);
13090d160211SJeremy Fitzhardinge 
13100d160211SJeremy Fitzhardinge 	for (id = 0; id < NET_RX_RING_SIZE; id++) {
1311cefe0078SAnnie Li 		struct sk_buff *skb;
1312cefe0078SAnnie Li 		struct page *page;
13130d160211SJeremy Fitzhardinge 
13142688fcb7SAndrew J. Bennieston 		skb = queue->rx_skbs[id];
1315cefe0078SAnnie Li 		if (!skb)
1316cefe0078SAnnie Li 			continue;
1317cefe0078SAnnie Li 
13182688fcb7SAndrew J. Bennieston 		ref = queue->grant_rx_ref[id];
1319cefe0078SAnnie Li 		if (ref == GRANT_INVALID_REF)
1320cefe0078SAnnie Li 			continue;
1321cefe0078SAnnie Li 
1322cefe0078SAnnie Li 		page = skb_frag_page(&skb_shinfo(skb)->frags[0]);
1323cefe0078SAnnie Li 
1324cefe0078SAnnie Li 		/* gnttab_end_foreign_access() needs a page ref until
1325cefe0078SAnnie Li 		 * foreign access is ended (which may be deferred).
1326cefe0078SAnnie Li 		 */
1327cefe0078SAnnie Li 		get_page(page);
1328cefe0078SAnnie Li 		gnttab_end_foreign_access(ref, 0,
1329cefe0078SAnnie Li 					  (unsigned long)page_address(page));
13302688fcb7SAndrew J. Bennieston 		queue->grant_rx_ref[id] = GRANT_INVALID_REF;
13310d160211SJeremy Fitzhardinge 
1332cefe0078SAnnie Li 		kfree_skb(skb);
13330d160211SJeremy Fitzhardinge 	}
13340d160211SJeremy Fitzhardinge 
13352688fcb7SAndrew J. Bennieston 	spin_unlock_bh(&queue->rx_lock);
13360d160211SJeremy Fitzhardinge }
13370d160211SJeremy Fitzhardinge 
1338c8f44affSMichał Mirosław static netdev_features_t xennet_fix_features(struct net_device *dev,
1339c8f44affSMichał Mirosław 	netdev_features_t features)
13408f7b01a1SEric Dumazet {
13418f7b01a1SEric Dumazet 	struct netfront_info *np = netdev_priv(dev);
13428f7b01a1SEric Dumazet 
13432890ea5cSJuergen Gross 	if (features & NETIF_F_SG &&
13442890ea5cSJuergen Gross 	    !xenbus_read_unsigned(np->xbdev->otherend, "feature-sg", 0))
13458f7b01a1SEric Dumazet 		features &= ~NETIF_F_SG;
13468f7b01a1SEric Dumazet 
13472890ea5cSJuergen Gross 	if (features & NETIF_F_IPV6_CSUM &&
13482890ea5cSJuergen Gross 	    !xenbus_read_unsigned(np->xbdev->otherend,
13492890ea5cSJuergen Gross 				  "feature-ipv6-csum-offload", 0))
13502c0057deSPaul Durrant 		features &= ~NETIF_F_IPV6_CSUM;
13512c0057deSPaul Durrant 
13522890ea5cSJuergen Gross 	if (features & NETIF_F_TSO &&
13532890ea5cSJuergen Gross 	    !xenbus_read_unsigned(np->xbdev->otherend, "feature-gso-tcpv4", 0))
13548f7b01a1SEric Dumazet 		features &= ~NETIF_F_TSO;
13558f7b01a1SEric Dumazet 
13562890ea5cSJuergen Gross 	if (features & NETIF_F_TSO6 &&
13572890ea5cSJuergen Gross 	    !xenbus_read_unsigned(np->xbdev->otherend, "feature-gso-tcpv6", 0))
13582c0057deSPaul Durrant 		features &= ~NETIF_F_TSO6;
13592c0057deSPaul Durrant 
13608f7b01a1SEric Dumazet 	return features;
13618f7b01a1SEric Dumazet }
13628f7b01a1SEric Dumazet 
1363c8f44affSMichał Mirosław static int xennet_set_features(struct net_device *dev,
1364c8f44affSMichał Mirosław 	netdev_features_t features)
13658f7b01a1SEric Dumazet {
13668f7b01a1SEric Dumazet 	if (!(features & NETIF_F_SG) && dev->mtu > ETH_DATA_LEN) {
13678f7b01a1SEric Dumazet 		netdev_info(dev, "Reducing MTU because no SG offload");
13688f7b01a1SEric Dumazet 		dev->mtu = ETH_DATA_LEN;
13698f7b01a1SEric Dumazet 	}
13708f7b01a1SEric Dumazet 
13718f7b01a1SEric Dumazet 	return 0;
13728f7b01a1SEric Dumazet }
13738f7b01a1SEric Dumazet 
1374d634bf2cSWei Liu static irqreturn_t xennet_tx_interrupt(int irq, void *dev_id)
1375cf66f9d4SKonrad Rzeszutek Wilk {
13762688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = dev_id;
1377cf66f9d4SKonrad Rzeszutek Wilk 	unsigned long flags;
1378cf66f9d4SKonrad Rzeszutek Wilk 
13792688fcb7SAndrew J. Bennieston 	spin_lock_irqsave(&queue->tx_lock, flags);
13802688fcb7SAndrew J. Bennieston 	xennet_tx_buf_gc(queue);
13812688fcb7SAndrew J. Bennieston 	spin_unlock_irqrestore(&queue->tx_lock, flags);
1382cf66f9d4SKonrad Rzeszutek Wilk 
1383cf66f9d4SKonrad Rzeszutek Wilk 	return IRQ_HANDLED;
1384cf66f9d4SKonrad Rzeszutek Wilk }
1385cf66f9d4SKonrad Rzeszutek Wilk 
1386d634bf2cSWei Liu static irqreturn_t xennet_rx_interrupt(int irq, void *dev_id)
1387d634bf2cSWei Liu {
13882688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = dev_id;
13892688fcb7SAndrew J. Bennieston 	struct net_device *dev = queue->info->netdev;
1390d634bf2cSWei Liu 
1391d634bf2cSWei Liu 	if (likely(netif_carrier_ok(dev) &&
13922688fcb7SAndrew J. Bennieston 		   RING_HAS_UNCONSUMED_RESPONSES(&queue->rx)))
13932688fcb7SAndrew J. Bennieston 		napi_schedule(&queue->napi);
1394d634bf2cSWei Liu 
1395d634bf2cSWei Liu 	return IRQ_HANDLED;
1396d634bf2cSWei Liu }
1397d634bf2cSWei Liu 
1398d634bf2cSWei Liu static irqreturn_t xennet_interrupt(int irq, void *dev_id)
1399d634bf2cSWei Liu {
1400d634bf2cSWei Liu 	xennet_tx_interrupt(irq, dev_id);
1401d634bf2cSWei Liu 	xennet_rx_interrupt(irq, dev_id);
1402d634bf2cSWei Liu 	return IRQ_HANDLED;
1403d634bf2cSWei Liu }
1404d634bf2cSWei Liu 
#ifdef CONFIG_NET_POLL_CONTROLLER
/*
 * ndo_poll_controller handler: invoke the combined interrupt handler once
 * for each of the device's real_num_tx_queues queues, with irq number 0.
 */
static void xennet_poll_controller(struct net_device *dev)
{
	struct netfront_info *info = netdev_priv(dev);
	unsigned int nr_queues = dev->real_num_tx_queues;
	unsigned int q;

	for (q = 0; q < nr_queues; q++)
		xennet_interrupt(0, info->queues + q);
}
#endif
1416cf66f9d4SKonrad Rzeszutek Wilk 
14176c5aa6fcSDenis Kirjanov #define NETBACK_XDP_HEADROOM_DISABLE	0
14186c5aa6fcSDenis Kirjanov #define NETBACK_XDP_HEADROOM_ENABLE	1
14196c5aa6fcSDenis Kirjanov 
14206c5aa6fcSDenis Kirjanov static int talk_to_netback_xdp(struct netfront_info *np, int xdp)
14216c5aa6fcSDenis Kirjanov {
14226c5aa6fcSDenis Kirjanov 	int err;
14236c5aa6fcSDenis Kirjanov 	unsigned short headroom;
14246c5aa6fcSDenis Kirjanov 
14256c5aa6fcSDenis Kirjanov 	headroom = xdp ? XDP_PACKET_HEADROOM : 0;
14266c5aa6fcSDenis Kirjanov 	err = xenbus_printf(XBT_NIL, np->xbdev->nodename,
14276c5aa6fcSDenis Kirjanov 			    "xdp-headroom", "%hu",
14286c5aa6fcSDenis Kirjanov 			    headroom);
14296c5aa6fcSDenis Kirjanov 	if (err)
14306c5aa6fcSDenis Kirjanov 		pr_warn("Error writing xdp-headroom\n");
14316c5aa6fcSDenis Kirjanov 
14326c5aa6fcSDenis Kirjanov 	return err;
14336c5aa6fcSDenis Kirjanov }
14346c5aa6fcSDenis Kirjanov 
14356c5aa6fcSDenis Kirjanov static int xennet_xdp_set(struct net_device *dev, struct bpf_prog *prog,
14366c5aa6fcSDenis Kirjanov 			  struct netlink_ext_ack *extack)
14376c5aa6fcSDenis Kirjanov {
14386c5aa6fcSDenis Kirjanov 	unsigned long max_mtu = XEN_PAGE_SIZE - XDP_PACKET_HEADROOM;
14396c5aa6fcSDenis Kirjanov 	struct netfront_info *np = netdev_priv(dev);
14406c5aa6fcSDenis Kirjanov 	struct bpf_prog *old_prog;
14416c5aa6fcSDenis Kirjanov 	unsigned int i, err;
14426c5aa6fcSDenis Kirjanov 
14436c5aa6fcSDenis Kirjanov 	if (dev->mtu > max_mtu) {
14446c5aa6fcSDenis Kirjanov 		netdev_warn(dev, "XDP requires MTU less than %lu\n", max_mtu);
14456c5aa6fcSDenis Kirjanov 		return -EINVAL;
14466c5aa6fcSDenis Kirjanov 	}
14476c5aa6fcSDenis Kirjanov 
14486c5aa6fcSDenis Kirjanov 	if (!np->netback_has_xdp_headroom)
14496c5aa6fcSDenis Kirjanov 		return 0;
14506c5aa6fcSDenis Kirjanov 
14516c5aa6fcSDenis Kirjanov 	xenbus_switch_state(np->xbdev, XenbusStateReconfiguring);
14526c5aa6fcSDenis Kirjanov 
14536c5aa6fcSDenis Kirjanov 	err = talk_to_netback_xdp(np, prog ? NETBACK_XDP_HEADROOM_ENABLE :
14546c5aa6fcSDenis Kirjanov 				  NETBACK_XDP_HEADROOM_DISABLE);
14556c5aa6fcSDenis Kirjanov 	if (err)
14566c5aa6fcSDenis Kirjanov 		return err;
14576c5aa6fcSDenis Kirjanov 
14586c5aa6fcSDenis Kirjanov 	/* avoid the race with XDP headroom adjustment */
14596c5aa6fcSDenis Kirjanov 	wait_event(module_wq,
14606c5aa6fcSDenis Kirjanov 		   xenbus_read_driver_state(np->xbdev->otherend) ==
14616c5aa6fcSDenis Kirjanov 		   XenbusStateReconfigured);
14626c5aa6fcSDenis Kirjanov 	np->netfront_xdp_enabled = true;
14636c5aa6fcSDenis Kirjanov 
14646c5aa6fcSDenis Kirjanov 	old_prog = rtnl_dereference(np->queues[0].xdp_prog);
14656c5aa6fcSDenis Kirjanov 
14666c5aa6fcSDenis Kirjanov 	if (prog)
14676c5aa6fcSDenis Kirjanov 		bpf_prog_add(prog, dev->real_num_tx_queues);
14686c5aa6fcSDenis Kirjanov 
14696c5aa6fcSDenis Kirjanov 	for (i = 0; i < dev->real_num_tx_queues; ++i)
14706c5aa6fcSDenis Kirjanov 		rcu_assign_pointer(np->queues[i].xdp_prog, prog);
14716c5aa6fcSDenis Kirjanov 
14726c5aa6fcSDenis Kirjanov 	if (old_prog)
14736c5aa6fcSDenis Kirjanov 		for (i = 0; i < dev->real_num_tx_queues; ++i)
14746c5aa6fcSDenis Kirjanov 			bpf_prog_put(old_prog);
14756c5aa6fcSDenis Kirjanov 
14766c5aa6fcSDenis Kirjanov 	xenbus_switch_state(np->xbdev, XenbusStateConnected);
14776c5aa6fcSDenis Kirjanov 
14786c5aa6fcSDenis Kirjanov 	return 0;
14796c5aa6fcSDenis Kirjanov }
14806c5aa6fcSDenis Kirjanov 
14816c5aa6fcSDenis Kirjanov static int xennet_xdp(struct net_device *dev, struct netdev_bpf *xdp)
14826c5aa6fcSDenis Kirjanov {
14836c5aa6fcSDenis Kirjanov 	switch (xdp->command) {
14846c5aa6fcSDenis Kirjanov 	case XDP_SETUP_PROG:
14856c5aa6fcSDenis Kirjanov 		return xennet_xdp_set(dev, xdp->prog, xdp->extack);
14866c5aa6fcSDenis Kirjanov 	default:
14876c5aa6fcSDenis Kirjanov 		return -EINVAL;
14886c5aa6fcSDenis Kirjanov 	}
14896c5aa6fcSDenis Kirjanov }
14906c5aa6fcSDenis Kirjanov 
14910a0b9d2eSStephen Hemminger static const struct net_device_ops xennet_netdev_ops = {
14920a0b9d2eSStephen Hemminger 	.ndo_open            = xennet_open,
14930a0b9d2eSStephen Hemminger 	.ndo_stop            = xennet_close,
14940a0b9d2eSStephen Hemminger 	.ndo_start_xmit      = xennet_start_xmit,
14950a0b9d2eSStephen Hemminger 	.ndo_change_mtu	     = xennet_change_mtu,
1496e00f85beSstephen hemminger 	.ndo_get_stats64     = xennet_get_stats64,
14970a0b9d2eSStephen Hemminger 	.ndo_set_mac_address = eth_mac_addr,
14980a0b9d2eSStephen Hemminger 	.ndo_validate_addr   = eth_validate_addr,
1499fb507934SMichał Mirosław 	.ndo_fix_features    = xennet_fix_features,
1500fb507934SMichał Mirosław 	.ndo_set_features    = xennet_set_features,
15012688fcb7SAndrew J. Bennieston 	.ndo_select_queue    = xennet_select_queue,
15026c5aa6fcSDenis Kirjanov 	.ndo_bpf            = xennet_xdp,
15036c5aa6fcSDenis Kirjanov 	.ndo_xdp_xmit	    = xennet_xdp_xmit,
1504cf66f9d4SKonrad Rzeszutek Wilk #ifdef CONFIG_NET_POLL_CONTROLLER
1505cf66f9d4SKonrad Rzeszutek Wilk 	.ndo_poll_controller = xennet_poll_controller,
1506cf66f9d4SKonrad Rzeszutek Wilk #endif
15070a0b9d2eSStephen Hemminger };
15080a0b9d2eSStephen Hemminger 
1509900e1833SDavid Vrabel static void xennet_free_netdev(struct net_device *netdev)
1510900e1833SDavid Vrabel {
1511900e1833SDavid Vrabel 	struct netfront_info *np = netdev_priv(netdev);
1512900e1833SDavid Vrabel 
1513900e1833SDavid Vrabel 	free_percpu(np->rx_stats);
1514900e1833SDavid Vrabel 	free_percpu(np->tx_stats);
1515900e1833SDavid Vrabel 	free_netdev(netdev);
1516900e1833SDavid Vrabel }
1517900e1833SDavid Vrabel 
15188e0e46bbSBill Pemberton static struct net_device *xennet_create_dev(struct xenbus_device *dev)
15190d160211SJeremy Fitzhardinge {
15202688fcb7SAndrew J. Bennieston 	int err;
15210d160211SJeremy Fitzhardinge 	struct net_device *netdev;
15220d160211SJeremy Fitzhardinge 	struct netfront_info *np;
15230d160211SJeremy Fitzhardinge 
152450ee6061SAndrew J. Bennieston 	netdev = alloc_etherdev_mq(sizeof(struct netfront_info), xennet_max_queues);
152541de8d4cSJoe Perches 	if (!netdev)
15260d160211SJeremy Fitzhardinge 		return ERR_PTR(-ENOMEM);
15270d160211SJeremy Fitzhardinge 
15280d160211SJeremy Fitzhardinge 	np                   = netdev_priv(netdev);
15290d160211SJeremy Fitzhardinge 	np->xbdev            = dev;
15300d160211SJeremy Fitzhardinge 
15312688fcb7SAndrew J. Bennieston 	np->queues = NULL;
15320d160211SJeremy Fitzhardinge 
1533e00f85beSstephen hemminger 	err = -ENOMEM;
1534900e1833SDavid Vrabel 	np->rx_stats = netdev_alloc_pcpu_stats(struct netfront_stats);
1535900e1833SDavid Vrabel 	if (np->rx_stats == NULL)
1536900e1833SDavid Vrabel 		goto exit;
1537900e1833SDavid Vrabel 	np->tx_stats = netdev_alloc_pcpu_stats(struct netfront_stats);
1538900e1833SDavid Vrabel 	if (np->tx_stats == NULL)
1539e00f85beSstephen hemminger 		goto exit;
1540e00f85beSstephen hemminger 
15410a0b9d2eSStephen Hemminger 	netdev->netdev_ops	= &xennet_netdev_ops;
15420a0b9d2eSStephen Hemminger 
1543fb507934SMichał Mirosław 	netdev->features        = NETIF_F_IP_CSUM | NETIF_F_RXCSUM |
1544fb507934SMichał Mirosław 				  NETIF_F_GSO_ROBUST;
15452c0057deSPaul Durrant 	netdev->hw_features	= NETIF_F_SG |
15462c0057deSPaul Durrant 				  NETIF_F_IPV6_CSUM |
15472c0057deSPaul Durrant 				  NETIF_F_TSO | NETIF_F_TSO6;
15480d160211SJeremy Fitzhardinge 
1549fc3e5941SIan Campbell 	/*
1550fc3e5941SIan Campbell          * Assume that all hw features are available for now. This set
1551fc3e5941SIan Campbell          * will be adjusted by the call to netdev_update_features() in
1552fc3e5941SIan Campbell          * xennet_connect() which is the earliest point where we can
1553fc3e5941SIan Campbell          * negotiate with the backend regarding supported features.
1554fc3e5941SIan Campbell          */
1555fc3e5941SIan Campbell 	netdev->features |= netdev->hw_features;
1556fc3e5941SIan Campbell 
15577ad24ea4SWilfried Klaebe 	netdev->ethtool_ops = &xennet_ethtool_ops;
1558e1043a4bSMohammed Gamal 	netdev->min_mtu = ETH_MIN_MTU;
1559d0c2c997SJarod Wilson 	netdev->max_mtu = XEN_NETIF_MAX_TX_SIZE;
15600d160211SJeremy Fitzhardinge 	SET_NETDEV_DEV(netdev, &dev->dev);
15610d160211SJeremy Fitzhardinge 
15620d160211SJeremy Fitzhardinge 	np->netdev = netdev;
15636c5aa6fcSDenis Kirjanov 	np->netfront_xdp_enabled = false;
15640d160211SJeremy Fitzhardinge 
15650d160211SJeremy Fitzhardinge 	netif_carrier_off(netdev);
15660d160211SJeremy Fitzhardinge 
1567c2c63310SAndrea Righi 	do {
1568b707fda2SEduardo Otubo 		xenbus_switch_state(dev, XenbusStateInitialising);
1569c2c63310SAndrea Righi 		err = wait_event_timeout(module_wq,
1570822fb18aSXiao Liang 				 xenbus_read_driver_state(dev->otherend) !=
1571822fb18aSXiao Liang 				 XenbusStateClosed &&
1572822fb18aSXiao Liang 				 xenbus_read_driver_state(dev->otherend) !=
1573c2c63310SAndrea Righi 				 XenbusStateUnknown, XENNET_TIMEOUT);
1574c2c63310SAndrea Righi 	} while (!err);
1575c2c63310SAndrea Righi 
15760d160211SJeremy Fitzhardinge 	return netdev;
15770d160211SJeremy Fitzhardinge 
15780d160211SJeremy Fitzhardinge  exit:
1579900e1833SDavid Vrabel 	xennet_free_netdev(netdev);
15800d160211SJeremy Fitzhardinge 	return ERR_PTR(err);
15810d160211SJeremy Fitzhardinge }
15820d160211SJeremy Fitzhardinge 
158380708602SLee Jones /*
15840d160211SJeremy Fitzhardinge  * Entry point to this code when a new device is created.  Allocate the basic
15850d160211SJeremy Fitzhardinge  * structures and the ring buffers for communication with the backend, and
15860d160211SJeremy Fitzhardinge  * inform the backend of the appropriate details for those.
15870d160211SJeremy Fitzhardinge  */
15888e0e46bbSBill Pemberton static int netfront_probe(struct xenbus_device *dev,
15890d160211SJeremy Fitzhardinge 			  const struct xenbus_device_id *id)
15900d160211SJeremy Fitzhardinge {
15910d160211SJeremy Fitzhardinge 	int err;
15920d160211SJeremy Fitzhardinge 	struct net_device *netdev;
15930d160211SJeremy Fitzhardinge 	struct netfront_info *info;
15940d160211SJeremy Fitzhardinge 
15950d160211SJeremy Fitzhardinge 	netdev = xennet_create_dev(dev);
15960d160211SJeremy Fitzhardinge 	if (IS_ERR(netdev)) {
15970d160211SJeremy Fitzhardinge 		err = PTR_ERR(netdev);
15980d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "creating netdev");
15990d160211SJeremy Fitzhardinge 		return err;
16000d160211SJeremy Fitzhardinge 	}
16010d160211SJeremy Fitzhardinge 
16020d160211SJeremy Fitzhardinge 	info = netdev_priv(netdev);
16031b713e00SGreg Kroah-Hartman 	dev_set_drvdata(&dev->dev, info);
160427b917e5STakashi Iwai #ifdef CONFIG_SYSFS
160527b917e5STakashi Iwai 	info->netdev->sysfs_groups[0] = &xennet_dev_group;
160627b917e5STakashi Iwai #endif
16070d160211SJeremy Fitzhardinge 
16080d160211SJeremy Fitzhardinge 	return 0;
16090d160211SJeremy Fitzhardinge }
16100d160211SJeremy Fitzhardinge 
16110d160211SJeremy Fitzhardinge static void xennet_end_access(int ref, void *page)
16120d160211SJeremy Fitzhardinge {
16130d160211SJeremy Fitzhardinge 	/* This frees the page as a side-effect */
16140d160211SJeremy Fitzhardinge 	if (ref != GRANT_INVALID_REF)
16150d160211SJeremy Fitzhardinge 		gnttab_end_foreign_access(ref, 0, (unsigned long)page);
16160d160211SJeremy Fitzhardinge }
16170d160211SJeremy Fitzhardinge 
16180d160211SJeremy Fitzhardinge static void xennet_disconnect_backend(struct netfront_info *info)
16190d160211SJeremy Fitzhardinge {
16202688fcb7SAndrew J. Bennieston 	unsigned int i = 0;
16212688fcb7SAndrew J. Bennieston 	unsigned int num_queues = info->netdev->real_num_tx_queues;
16220d160211SJeremy Fitzhardinge 
1623f9feb1e6SDavid Vrabel 	netif_carrier_off(info->netdev);
1624f9feb1e6SDavid Vrabel 
16259a873c71SChas Williams 	for (i = 0; i < num_queues && info->queues; ++i) {
162676541869SDavid Vrabel 		struct netfront_queue *queue = &info->queues[i];
162776541869SDavid Vrabel 
162874470954SBoris Ostrovsky 		del_timer_sync(&queue->rx_refill_timer);
162974470954SBoris Ostrovsky 
16302688fcb7SAndrew J. Bennieston 		if (queue->tx_irq && (queue->tx_irq == queue->rx_irq))
16312688fcb7SAndrew J. Bennieston 			unbind_from_irqhandler(queue->tx_irq, queue);
16322688fcb7SAndrew J. Bennieston 		if (queue->tx_irq && (queue->tx_irq != queue->rx_irq)) {
16332688fcb7SAndrew J. Bennieston 			unbind_from_irqhandler(queue->tx_irq, queue);
16342688fcb7SAndrew J. Bennieston 			unbind_from_irqhandler(queue->rx_irq, queue);
1635d634bf2cSWei Liu 		}
16362688fcb7SAndrew J. Bennieston 		queue->tx_evtchn = queue->rx_evtchn = 0;
16372688fcb7SAndrew J. Bennieston 		queue->tx_irq = queue->rx_irq = 0;
16380d160211SJeremy Fitzhardinge 
1639274b0455SChas Williams 		if (netif_running(info->netdev))
1640f9feb1e6SDavid Vrabel 			napi_synchronize(&queue->napi);
1641f9feb1e6SDavid Vrabel 
1642a5b5dc3cSDavid Vrabel 		xennet_release_tx_bufs(queue);
1643a5b5dc3cSDavid Vrabel 		xennet_release_rx_bufs(queue);
1644a5b5dc3cSDavid Vrabel 		gnttab_free_grant_references(queue->gref_tx_head);
1645a5b5dc3cSDavid Vrabel 		gnttab_free_grant_references(queue->gref_rx_head);
1646a5b5dc3cSDavid Vrabel 
16470d160211SJeremy Fitzhardinge 		/* End access and free the pages */
16482688fcb7SAndrew J. Bennieston 		xennet_end_access(queue->tx_ring_ref, queue->tx.sring);
16492688fcb7SAndrew J. Bennieston 		xennet_end_access(queue->rx_ring_ref, queue->rx.sring);
16500d160211SJeremy Fitzhardinge 
16512688fcb7SAndrew J. Bennieston 		queue->tx_ring_ref = GRANT_INVALID_REF;
16522688fcb7SAndrew J. Bennieston 		queue->rx_ring_ref = GRANT_INVALID_REF;
16532688fcb7SAndrew J. Bennieston 		queue->tx.sring = NULL;
16542688fcb7SAndrew J. Bennieston 		queue->rx.sring = NULL;
16556c5aa6fcSDenis Kirjanov 
16566c5aa6fcSDenis Kirjanov 		page_pool_destroy(queue->page_pool);
16572688fcb7SAndrew J. Bennieston 	}
16580d160211SJeremy Fitzhardinge }
16590d160211SJeremy Fitzhardinge 
166080708602SLee Jones /*
16610d160211SJeremy Fitzhardinge  * We are reconnecting to the backend, due to a suspend/resume, or a backend
16620d160211SJeremy Fitzhardinge  * driver restart.  We tear down our netif structure and recreate it, but
16630d160211SJeremy Fitzhardinge  * leave the device-layer structures intact so that this is transparent to the
16640d160211SJeremy Fitzhardinge  * rest of the kernel.
16650d160211SJeremy Fitzhardinge  */
16660d160211SJeremy Fitzhardinge static int netfront_resume(struct xenbus_device *dev)
16670d160211SJeremy Fitzhardinge {
16681b713e00SGreg Kroah-Hartman 	struct netfront_info *info = dev_get_drvdata(&dev->dev);
16690d160211SJeremy Fitzhardinge 
16700d160211SJeremy Fitzhardinge 	dev_dbg(&dev->dev, "%s\n", dev->nodename);
16710d160211SJeremy Fitzhardinge 
16720d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
16730d160211SJeremy Fitzhardinge 	return 0;
16740d160211SJeremy Fitzhardinge }
16750d160211SJeremy Fitzhardinge 
16760d160211SJeremy Fitzhardinge static int xen_net_read_mac(struct xenbus_device *dev, u8 mac[])
16770d160211SJeremy Fitzhardinge {
16780d160211SJeremy Fitzhardinge 	char *s, *e, *macstr;
16790d160211SJeremy Fitzhardinge 	int i;
16800d160211SJeremy Fitzhardinge 
16810d160211SJeremy Fitzhardinge 	macstr = s = xenbus_read(XBT_NIL, dev->nodename, "mac", NULL);
16820d160211SJeremy Fitzhardinge 	if (IS_ERR(macstr))
16830d160211SJeremy Fitzhardinge 		return PTR_ERR(macstr);
16840d160211SJeremy Fitzhardinge 
16850d160211SJeremy Fitzhardinge 	for (i = 0; i < ETH_ALEN; i++) {
16860d160211SJeremy Fitzhardinge 		mac[i] = simple_strtoul(s, &e, 16);
16870d160211SJeremy Fitzhardinge 		if ((s == e) || (*e != ((i == ETH_ALEN-1) ? '\0' : ':'))) {
16880d160211SJeremy Fitzhardinge 			kfree(macstr);
16890d160211SJeremy Fitzhardinge 			return -ENOENT;
16900d160211SJeremy Fitzhardinge 		}
16910d160211SJeremy Fitzhardinge 		s = e+1;
16920d160211SJeremy Fitzhardinge 	}
16930d160211SJeremy Fitzhardinge 
16940d160211SJeremy Fitzhardinge 	kfree(macstr);
16950d160211SJeremy Fitzhardinge 	return 0;
16960d160211SJeremy Fitzhardinge }
16970d160211SJeremy Fitzhardinge 
16982688fcb7SAndrew J. Bennieston static int setup_netfront_single(struct netfront_queue *queue)
1699d634bf2cSWei Liu {
1700d634bf2cSWei Liu 	int err;
1701d634bf2cSWei Liu 
17022688fcb7SAndrew J. Bennieston 	err = xenbus_alloc_evtchn(queue->info->xbdev, &queue->tx_evtchn);
1703d634bf2cSWei Liu 	if (err < 0)
1704d634bf2cSWei Liu 		goto fail;
1705d634bf2cSWei Liu 
17062688fcb7SAndrew J. Bennieston 	err = bind_evtchn_to_irqhandler(queue->tx_evtchn,
1707d634bf2cSWei Liu 					xennet_interrupt,
17082688fcb7SAndrew J. Bennieston 					0, queue->info->netdev->name, queue);
1709d634bf2cSWei Liu 	if (err < 0)
1710d634bf2cSWei Liu 		goto bind_fail;
17112688fcb7SAndrew J. Bennieston 	queue->rx_evtchn = queue->tx_evtchn;
17122688fcb7SAndrew J. Bennieston 	queue->rx_irq = queue->tx_irq = err;
1713d634bf2cSWei Liu 
1714d634bf2cSWei Liu 	return 0;
1715d634bf2cSWei Liu 
1716d634bf2cSWei Liu bind_fail:
17172688fcb7SAndrew J. Bennieston 	xenbus_free_evtchn(queue->info->xbdev, queue->tx_evtchn);
17182688fcb7SAndrew J. Bennieston 	queue->tx_evtchn = 0;
1719d634bf2cSWei Liu fail:
1720d634bf2cSWei Liu 	return err;
1721d634bf2cSWei Liu }
1722d634bf2cSWei Liu 
17232688fcb7SAndrew J. Bennieston static int setup_netfront_split(struct netfront_queue *queue)
1724d634bf2cSWei Liu {
1725d634bf2cSWei Liu 	int err;
1726d634bf2cSWei Liu 
17272688fcb7SAndrew J. Bennieston 	err = xenbus_alloc_evtchn(queue->info->xbdev, &queue->tx_evtchn);
1728d634bf2cSWei Liu 	if (err < 0)
1729d634bf2cSWei Liu 		goto fail;
17302688fcb7SAndrew J. Bennieston 	err = xenbus_alloc_evtchn(queue->info->xbdev, &queue->rx_evtchn);
1731d634bf2cSWei Liu 	if (err < 0)
1732d634bf2cSWei Liu 		goto alloc_rx_evtchn_fail;
1733d634bf2cSWei Liu 
17342688fcb7SAndrew J. Bennieston 	snprintf(queue->tx_irq_name, sizeof(queue->tx_irq_name),
17352688fcb7SAndrew J. Bennieston 		 "%s-tx", queue->name);
17362688fcb7SAndrew J. Bennieston 	err = bind_evtchn_to_irqhandler(queue->tx_evtchn,
1737d634bf2cSWei Liu 					xennet_tx_interrupt,
17382688fcb7SAndrew J. Bennieston 					0, queue->tx_irq_name, queue);
1739d634bf2cSWei Liu 	if (err < 0)
1740d634bf2cSWei Liu 		goto bind_tx_fail;
17412688fcb7SAndrew J. Bennieston 	queue->tx_irq = err;
1742d634bf2cSWei Liu 
17432688fcb7SAndrew J. Bennieston 	snprintf(queue->rx_irq_name, sizeof(queue->rx_irq_name),
17442688fcb7SAndrew J. Bennieston 		 "%s-rx", queue->name);
17452688fcb7SAndrew J. Bennieston 	err = bind_evtchn_to_irqhandler(queue->rx_evtchn,
1746d634bf2cSWei Liu 					xennet_rx_interrupt,
17472688fcb7SAndrew J. Bennieston 					0, queue->rx_irq_name, queue);
1748d634bf2cSWei Liu 	if (err < 0)
1749d634bf2cSWei Liu 		goto bind_rx_fail;
17502688fcb7SAndrew J. Bennieston 	queue->rx_irq = err;
1751d634bf2cSWei Liu 
1752d634bf2cSWei Liu 	return 0;
1753d634bf2cSWei Liu 
1754d634bf2cSWei Liu bind_rx_fail:
17552688fcb7SAndrew J. Bennieston 	unbind_from_irqhandler(queue->tx_irq, queue);
17562688fcb7SAndrew J. Bennieston 	queue->tx_irq = 0;
1757d634bf2cSWei Liu bind_tx_fail:
17582688fcb7SAndrew J. Bennieston 	xenbus_free_evtchn(queue->info->xbdev, queue->rx_evtchn);
17592688fcb7SAndrew J. Bennieston 	queue->rx_evtchn = 0;
1760d634bf2cSWei Liu alloc_rx_evtchn_fail:
17612688fcb7SAndrew J. Bennieston 	xenbus_free_evtchn(queue->info->xbdev, queue->tx_evtchn);
17622688fcb7SAndrew J. Bennieston 	queue->tx_evtchn = 0;
1763d634bf2cSWei Liu fail:
1764d634bf2cSWei Liu 	return err;
1765d634bf2cSWei Liu }
1766d634bf2cSWei Liu 
17672688fcb7SAndrew J. Bennieston static int setup_netfront(struct xenbus_device *dev,
17682688fcb7SAndrew J. Bennieston 			struct netfront_queue *queue, unsigned int feature_split_evtchn)
17690d160211SJeremy Fitzhardinge {
17700d160211SJeremy Fitzhardinge 	struct xen_netif_tx_sring *txs;
17710d160211SJeremy Fitzhardinge 	struct xen_netif_rx_sring *rxs;
1772ccc9d90aSWei Liu 	grant_ref_t gref;
17730d160211SJeremy Fitzhardinge 	int err;
17740d160211SJeremy Fitzhardinge 
17752688fcb7SAndrew J. Bennieston 	queue->tx_ring_ref = GRANT_INVALID_REF;
17762688fcb7SAndrew J. Bennieston 	queue->rx_ring_ref = GRANT_INVALID_REF;
17772688fcb7SAndrew J. Bennieston 	queue->rx.sring = NULL;
17782688fcb7SAndrew J. Bennieston 	queue->tx.sring = NULL;
17790d160211SJeremy Fitzhardinge 
1780a144ff09SIan Campbell 	txs = (struct xen_netif_tx_sring *)get_zeroed_page(GFP_NOIO | __GFP_HIGH);
17810d160211SJeremy Fitzhardinge 	if (!txs) {
17820d160211SJeremy Fitzhardinge 		err = -ENOMEM;
17830d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "allocating tx ring page");
17840d160211SJeremy Fitzhardinge 		goto fail;
17850d160211SJeremy Fitzhardinge 	}
17860d160211SJeremy Fitzhardinge 	SHARED_RING_INIT(txs);
178730c5d7f0SJulien Grall 	FRONT_RING_INIT(&queue->tx, txs, XEN_PAGE_SIZE);
17880d160211SJeremy Fitzhardinge 
1789ccc9d90aSWei Liu 	err = xenbus_grant_ring(dev, txs, 1, &gref);
17901ca2983aSWei Liu 	if (err < 0)
17911ca2983aSWei Liu 		goto grant_tx_ring_fail;
1792ccc9d90aSWei Liu 	queue->tx_ring_ref = gref;
17930d160211SJeremy Fitzhardinge 
1794a144ff09SIan Campbell 	rxs = (struct xen_netif_rx_sring *)get_zeroed_page(GFP_NOIO | __GFP_HIGH);
17950d160211SJeremy Fitzhardinge 	if (!rxs) {
17960d160211SJeremy Fitzhardinge 		err = -ENOMEM;
17970d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "allocating rx ring page");
17981ca2983aSWei Liu 		goto alloc_rx_ring_fail;
17990d160211SJeremy Fitzhardinge 	}
18000d160211SJeremy Fitzhardinge 	SHARED_RING_INIT(rxs);
180130c5d7f0SJulien Grall 	FRONT_RING_INIT(&queue->rx, rxs, XEN_PAGE_SIZE);
18020d160211SJeremy Fitzhardinge 
1803ccc9d90aSWei Liu 	err = xenbus_grant_ring(dev, rxs, 1, &gref);
18041ca2983aSWei Liu 	if (err < 0)
18051ca2983aSWei Liu 		goto grant_rx_ring_fail;
1806ccc9d90aSWei Liu 	queue->rx_ring_ref = gref;
18070d160211SJeremy Fitzhardinge 
1808d634bf2cSWei Liu 	if (feature_split_evtchn)
18092688fcb7SAndrew J. Bennieston 		err = setup_netfront_split(queue);
1810d634bf2cSWei Liu 	/* setup single event channel if
1811d634bf2cSWei Liu 	 *  a) feature-split-event-channels == 0
1812d634bf2cSWei Liu 	 *  b) feature-split-event-channels == 1 but failed to setup
1813d634bf2cSWei Liu 	 */
1814e93fac3bSJiapeng Chong 	if (!feature_split_evtchn || err)
18152688fcb7SAndrew J. Bennieston 		err = setup_netfront_single(queue);
1816d634bf2cSWei Liu 
18170d160211SJeremy Fitzhardinge 	if (err)
18181ca2983aSWei Liu 		goto alloc_evtchn_fail;
18190d160211SJeremy Fitzhardinge 
18200d160211SJeremy Fitzhardinge 	return 0;
18210d160211SJeremy Fitzhardinge 
18221ca2983aSWei Liu 	/* If we fail to setup netfront, it is safe to just revoke access to
18231ca2983aSWei Liu 	 * granted pages because backend is not accessing it at this point.
18241ca2983aSWei Liu 	 */
18251ca2983aSWei Liu alloc_evtchn_fail:
18262688fcb7SAndrew J. Bennieston 	gnttab_end_foreign_access_ref(queue->rx_ring_ref, 0);
18271ca2983aSWei Liu grant_rx_ring_fail:
18281ca2983aSWei Liu 	free_page((unsigned long)rxs);
18291ca2983aSWei Liu alloc_rx_ring_fail:
18302688fcb7SAndrew J. Bennieston 	gnttab_end_foreign_access_ref(queue->tx_ring_ref, 0);
18311ca2983aSWei Liu grant_tx_ring_fail:
18321ca2983aSWei Liu 	free_page((unsigned long)txs);
18330d160211SJeremy Fitzhardinge fail:
18340d160211SJeremy Fitzhardinge 	return err;
18350d160211SJeremy Fitzhardinge }
18360d160211SJeremy Fitzhardinge 
18372688fcb7SAndrew J. Bennieston /* Queue-specific initialisation
18382688fcb7SAndrew J. Bennieston  * This used to be done in xennet_create_dev() but must now
18392688fcb7SAndrew J. Bennieston  * be run per-queue.
18402688fcb7SAndrew J. Bennieston  */
18412688fcb7SAndrew J. Bennieston static int xennet_init_queue(struct netfront_queue *queue)
18422688fcb7SAndrew J. Bennieston {
18432688fcb7SAndrew J. Bennieston 	unsigned short i;
18442688fcb7SAndrew J. Bennieston 	int err = 0;
184521f2706bSXiao Liang 	char *devid;
18462688fcb7SAndrew J. Bennieston 
18472688fcb7SAndrew J. Bennieston 	spin_lock_init(&queue->tx_lock);
18482688fcb7SAndrew J. Bennieston 	spin_lock_init(&queue->rx_lock);
18492688fcb7SAndrew J. Bennieston 
1850e99e88a9SKees Cook 	timer_setup(&queue->rx_refill_timer, rx_refill_timeout, 0);
18512688fcb7SAndrew J. Bennieston 
185221f2706bSXiao Liang 	devid = strrchr(queue->info->xbdev->nodename, '/') + 1;
185321f2706bSXiao Liang 	snprintf(queue->name, sizeof(queue->name), "vif%s-q%u",
185421f2706bSXiao Liang 		 devid, queue->id);
18558b715010SWei Liu 
18562688fcb7SAndrew J. Bennieston 	/* Initialise tx_skbs as a free chain containing every entry. */
18572688fcb7SAndrew J. Bennieston 	queue->tx_skb_freelist = 0;
18582688fcb7SAndrew J. Bennieston 	for (i = 0; i < NET_TX_RING_SIZE; i++) {
18592688fcb7SAndrew J. Bennieston 		skb_entry_set_link(&queue->tx_skbs[i], i+1);
18602688fcb7SAndrew J. Bennieston 		queue->grant_tx_ref[i] = GRANT_INVALID_REF;
18612688fcb7SAndrew J. Bennieston 		queue->grant_tx_page[i] = NULL;
18622688fcb7SAndrew J. Bennieston 	}
18632688fcb7SAndrew J. Bennieston 
18642688fcb7SAndrew J. Bennieston 	/* Clear out rx_skbs */
18652688fcb7SAndrew J. Bennieston 	for (i = 0; i < NET_RX_RING_SIZE; i++) {
18662688fcb7SAndrew J. Bennieston 		queue->rx_skbs[i] = NULL;
18672688fcb7SAndrew J. Bennieston 		queue->grant_rx_ref[i] = GRANT_INVALID_REF;
18682688fcb7SAndrew J. Bennieston 	}
18692688fcb7SAndrew J. Bennieston 
18702688fcb7SAndrew J. Bennieston 	/* A grant for every tx ring slot */
18711f3c2ebaSDavid Vrabel 	if (gnttab_alloc_grant_references(NET_TX_RING_SIZE,
18722688fcb7SAndrew J. Bennieston 					  &queue->gref_tx_head) < 0) {
18732688fcb7SAndrew J. Bennieston 		pr_alert("can't alloc tx grant refs\n");
18742688fcb7SAndrew J. Bennieston 		err = -ENOMEM;
18752688fcb7SAndrew J. Bennieston 		goto exit;
18762688fcb7SAndrew J. Bennieston 	}
18772688fcb7SAndrew J. Bennieston 
18782688fcb7SAndrew J. Bennieston 	/* A grant for every rx ring slot */
18791f3c2ebaSDavid Vrabel 	if (gnttab_alloc_grant_references(NET_RX_RING_SIZE,
18802688fcb7SAndrew J. Bennieston 					  &queue->gref_rx_head) < 0) {
18812688fcb7SAndrew J. Bennieston 		pr_alert("can't alloc rx grant refs\n");
18822688fcb7SAndrew J. Bennieston 		err = -ENOMEM;
18832688fcb7SAndrew J. Bennieston 		goto exit_free_tx;
18842688fcb7SAndrew J. Bennieston 	}
18852688fcb7SAndrew J. Bennieston 
18862688fcb7SAndrew J. Bennieston 	return 0;
18872688fcb7SAndrew J. Bennieston 
18882688fcb7SAndrew J. Bennieston  exit_free_tx:
18892688fcb7SAndrew J. Bennieston 	gnttab_free_grant_references(queue->gref_tx_head);
18902688fcb7SAndrew J. Bennieston  exit:
18912688fcb7SAndrew J. Bennieston 	return err;
18922688fcb7SAndrew J. Bennieston }
18932688fcb7SAndrew J. Bennieston 
189450ee6061SAndrew J. Bennieston static int write_queue_xenstore_keys(struct netfront_queue *queue,
189550ee6061SAndrew J. Bennieston 			   struct xenbus_transaction *xbt, int write_hierarchical)
189650ee6061SAndrew J. Bennieston {
189750ee6061SAndrew J. Bennieston 	/* Write the queue-specific keys into XenStore in the traditional
189850ee6061SAndrew J. Bennieston 	 * way for a single queue, or in a queue subkeys for multiple
189950ee6061SAndrew J. Bennieston 	 * queues.
190050ee6061SAndrew J. Bennieston 	 */
190150ee6061SAndrew J. Bennieston 	struct xenbus_device *dev = queue->info->xbdev;
190250ee6061SAndrew J. Bennieston 	int err;
190350ee6061SAndrew J. Bennieston 	const char *message;
190450ee6061SAndrew J. Bennieston 	char *path;
190550ee6061SAndrew J. Bennieston 	size_t pathsize;
190650ee6061SAndrew J. Bennieston 
190750ee6061SAndrew J. Bennieston 	/* Choose the correct place to write the keys */
190850ee6061SAndrew J. Bennieston 	if (write_hierarchical) {
190950ee6061SAndrew J. Bennieston 		pathsize = strlen(dev->nodename) + 10;
191050ee6061SAndrew J. Bennieston 		path = kzalloc(pathsize, GFP_KERNEL);
191150ee6061SAndrew J. Bennieston 		if (!path) {
191250ee6061SAndrew J. Bennieston 			err = -ENOMEM;
191350ee6061SAndrew J. Bennieston 			message = "out of memory while writing ring references";
191450ee6061SAndrew J. Bennieston 			goto error;
191550ee6061SAndrew J. Bennieston 		}
191650ee6061SAndrew J. Bennieston 		snprintf(path, pathsize, "%s/queue-%u",
191750ee6061SAndrew J. Bennieston 				dev->nodename, queue->id);
191850ee6061SAndrew J. Bennieston 	} else {
191950ee6061SAndrew J. Bennieston 		path = (char *)dev->nodename;
192050ee6061SAndrew J. Bennieston 	}
192150ee6061SAndrew J. Bennieston 
192250ee6061SAndrew J. Bennieston 	/* Write ring references */
192350ee6061SAndrew J. Bennieston 	err = xenbus_printf(*xbt, path, "tx-ring-ref", "%u",
192450ee6061SAndrew J. Bennieston 			queue->tx_ring_ref);
192550ee6061SAndrew J. Bennieston 	if (err) {
192650ee6061SAndrew J. Bennieston 		message = "writing tx-ring-ref";
192750ee6061SAndrew J. Bennieston 		goto error;
192850ee6061SAndrew J. Bennieston 	}
192950ee6061SAndrew J. Bennieston 
193050ee6061SAndrew J. Bennieston 	err = xenbus_printf(*xbt, path, "rx-ring-ref", "%u",
193150ee6061SAndrew J. Bennieston 			queue->rx_ring_ref);
193250ee6061SAndrew J. Bennieston 	if (err) {
193350ee6061SAndrew J. Bennieston 		message = "writing rx-ring-ref";
193450ee6061SAndrew J. Bennieston 		goto error;
193550ee6061SAndrew J. Bennieston 	}
193650ee6061SAndrew J. Bennieston 
193750ee6061SAndrew J. Bennieston 	/* Write event channels; taking into account both shared
193850ee6061SAndrew J. Bennieston 	 * and split event channel scenarios.
193950ee6061SAndrew J. Bennieston 	 */
194050ee6061SAndrew J. Bennieston 	if (queue->tx_evtchn == queue->rx_evtchn) {
194150ee6061SAndrew J. Bennieston 		/* Shared event channel */
194250ee6061SAndrew J. Bennieston 		err = xenbus_printf(*xbt, path,
194350ee6061SAndrew J. Bennieston 				"event-channel", "%u", queue->tx_evtchn);
194450ee6061SAndrew J. Bennieston 		if (err) {
194550ee6061SAndrew J. Bennieston 			message = "writing event-channel";
194650ee6061SAndrew J. Bennieston 			goto error;
194750ee6061SAndrew J. Bennieston 		}
194850ee6061SAndrew J. Bennieston 	} else {
194950ee6061SAndrew J. Bennieston 		/* Split event channels */
195050ee6061SAndrew J. Bennieston 		err = xenbus_printf(*xbt, path,
195150ee6061SAndrew J. Bennieston 				"event-channel-tx", "%u", queue->tx_evtchn);
195250ee6061SAndrew J. Bennieston 		if (err) {
195350ee6061SAndrew J. Bennieston 			message = "writing event-channel-tx";
195450ee6061SAndrew J. Bennieston 			goto error;
195550ee6061SAndrew J. Bennieston 		}
195650ee6061SAndrew J. Bennieston 
195750ee6061SAndrew J. Bennieston 		err = xenbus_printf(*xbt, path,
195850ee6061SAndrew J. Bennieston 				"event-channel-rx", "%u", queue->rx_evtchn);
195950ee6061SAndrew J. Bennieston 		if (err) {
196050ee6061SAndrew J. Bennieston 			message = "writing event-channel-rx";
196150ee6061SAndrew J. Bennieston 			goto error;
196250ee6061SAndrew J. Bennieston 		}
196350ee6061SAndrew J. Bennieston 	}
196450ee6061SAndrew J. Bennieston 
196550ee6061SAndrew J. Bennieston 	if (write_hierarchical)
196650ee6061SAndrew J. Bennieston 		kfree(path);
196750ee6061SAndrew J. Bennieston 	return 0;
196850ee6061SAndrew J. Bennieston 
196950ee6061SAndrew J. Bennieston error:
197050ee6061SAndrew J. Bennieston 	if (write_hierarchical)
197150ee6061SAndrew J. Bennieston 		kfree(path);
197250ee6061SAndrew J. Bennieston 	xenbus_dev_fatal(dev, err, "%s", message);
197350ee6061SAndrew J. Bennieston 	return err;
197450ee6061SAndrew J. Bennieston }
197550ee6061SAndrew J. Bennieston 
1976ce58725fSDavid Vrabel static void xennet_destroy_queues(struct netfront_info *info)
1977ce58725fSDavid Vrabel {
1978ce58725fSDavid Vrabel 	unsigned int i;
1979ce58725fSDavid Vrabel 
1980ce58725fSDavid Vrabel 	for (i = 0; i < info->netdev->real_num_tx_queues; i++) {
1981ce58725fSDavid Vrabel 		struct netfront_queue *queue = &info->queues[i];
1982ce58725fSDavid Vrabel 
1983ce58725fSDavid Vrabel 		if (netif_running(info->netdev))
1984ce58725fSDavid Vrabel 			napi_disable(&queue->napi);
1985ce58725fSDavid Vrabel 		netif_napi_del(&queue->napi);
1986ce58725fSDavid Vrabel 	}
1987ce58725fSDavid Vrabel 
1988ce58725fSDavid Vrabel 	kfree(info->queues);
1989ce58725fSDavid Vrabel 	info->queues = NULL;
1990ce58725fSDavid Vrabel }
1991ce58725fSDavid Vrabel 
19926c5aa6fcSDenis Kirjanov 
19936c5aa6fcSDenis Kirjanov 
19946c5aa6fcSDenis Kirjanov static int xennet_create_page_pool(struct netfront_queue *queue)
19956c5aa6fcSDenis Kirjanov {
19966c5aa6fcSDenis Kirjanov 	int err;
19976c5aa6fcSDenis Kirjanov 	struct page_pool_params pp_params = {
19986c5aa6fcSDenis Kirjanov 		.order = 0,
19996c5aa6fcSDenis Kirjanov 		.flags = 0,
20006c5aa6fcSDenis Kirjanov 		.pool_size = NET_RX_RING_SIZE,
20016c5aa6fcSDenis Kirjanov 		.nid = NUMA_NO_NODE,
20026c5aa6fcSDenis Kirjanov 		.dev = &queue->info->netdev->dev,
20036c5aa6fcSDenis Kirjanov 		.offset = XDP_PACKET_HEADROOM,
20046c5aa6fcSDenis Kirjanov 		.max_len = XEN_PAGE_SIZE - XDP_PACKET_HEADROOM,
20056c5aa6fcSDenis Kirjanov 	};
20066c5aa6fcSDenis Kirjanov 
20076c5aa6fcSDenis Kirjanov 	queue->page_pool = page_pool_create(&pp_params);
20086c5aa6fcSDenis Kirjanov 	if (IS_ERR(queue->page_pool)) {
20096c5aa6fcSDenis Kirjanov 		err = PTR_ERR(queue->page_pool);
20106c5aa6fcSDenis Kirjanov 		queue->page_pool = NULL;
20116c5aa6fcSDenis Kirjanov 		return err;
20126c5aa6fcSDenis Kirjanov 	}
20136c5aa6fcSDenis Kirjanov 
20146c5aa6fcSDenis Kirjanov 	err = xdp_rxq_info_reg(&queue->xdp_rxq, queue->info->netdev,
2015b02e5a0eSBjörn Töpel 			       queue->id, 0);
20166c5aa6fcSDenis Kirjanov 	if (err) {
20176c5aa6fcSDenis Kirjanov 		netdev_err(queue->info->netdev, "xdp_rxq_info_reg failed\n");
20186c5aa6fcSDenis Kirjanov 		goto err_free_pp;
20196c5aa6fcSDenis Kirjanov 	}
20206c5aa6fcSDenis Kirjanov 
20216c5aa6fcSDenis Kirjanov 	err = xdp_rxq_info_reg_mem_model(&queue->xdp_rxq,
20226c5aa6fcSDenis Kirjanov 					 MEM_TYPE_PAGE_POOL, queue->page_pool);
20236c5aa6fcSDenis Kirjanov 	if (err) {
20246c5aa6fcSDenis Kirjanov 		netdev_err(queue->info->netdev, "xdp_rxq_info_reg_mem_model failed\n");
20256c5aa6fcSDenis Kirjanov 		goto err_unregister_rxq;
20266c5aa6fcSDenis Kirjanov 	}
20276c5aa6fcSDenis Kirjanov 	return 0;
20286c5aa6fcSDenis Kirjanov 
20296c5aa6fcSDenis Kirjanov err_unregister_rxq:
20306c5aa6fcSDenis Kirjanov 	xdp_rxq_info_unreg(&queue->xdp_rxq);
20316c5aa6fcSDenis Kirjanov err_free_pp:
20326c5aa6fcSDenis Kirjanov 	page_pool_destroy(queue->page_pool);
20336c5aa6fcSDenis Kirjanov 	queue->page_pool = NULL;
20346c5aa6fcSDenis Kirjanov 	return err;
20356c5aa6fcSDenis Kirjanov }
20366c5aa6fcSDenis Kirjanov 
2037ce58725fSDavid Vrabel static int xennet_create_queues(struct netfront_info *info,
2038ca88ea12SJoe Jin 				unsigned int *num_queues)
2039ce58725fSDavid Vrabel {
2040ce58725fSDavid Vrabel 	unsigned int i;
2041ce58725fSDavid Vrabel 	int ret;
2042ce58725fSDavid Vrabel 
2043ca88ea12SJoe Jin 	info->queues = kcalloc(*num_queues, sizeof(struct netfront_queue),
2044ce58725fSDavid Vrabel 			       GFP_KERNEL);
2045ce58725fSDavid Vrabel 	if (!info->queues)
2046ce58725fSDavid Vrabel 		return -ENOMEM;
2047ce58725fSDavid Vrabel 
2048ca88ea12SJoe Jin 	for (i = 0; i < *num_queues; i++) {
2049ce58725fSDavid Vrabel 		struct netfront_queue *queue = &info->queues[i];
2050ce58725fSDavid Vrabel 
2051ce58725fSDavid Vrabel 		queue->id = i;
2052ce58725fSDavid Vrabel 		queue->info = info;
2053ce58725fSDavid Vrabel 
2054ce58725fSDavid Vrabel 		ret = xennet_init_queue(queue);
2055ce58725fSDavid Vrabel 		if (ret < 0) {
2056f599c64fSRoss Lagerwall 			dev_warn(&info->xbdev->dev,
205769cb8524SDavid Vrabel 				 "only created %d queues\n", i);
2058ca88ea12SJoe Jin 			*num_queues = i;
2059ce58725fSDavid Vrabel 			break;
2060ce58725fSDavid Vrabel 		}
2061ce58725fSDavid Vrabel 
20626c5aa6fcSDenis Kirjanov 		/* use page pool recycling instead of buddy allocator */
20636c5aa6fcSDenis Kirjanov 		ret = xennet_create_page_pool(queue);
20646c5aa6fcSDenis Kirjanov 		if (ret < 0) {
20656c5aa6fcSDenis Kirjanov 			dev_err(&info->xbdev->dev, "can't allocate page pool\n");
20666c5aa6fcSDenis Kirjanov 			*num_queues = i;
20676c5aa6fcSDenis Kirjanov 			return ret;
20686c5aa6fcSDenis Kirjanov 		}
20696c5aa6fcSDenis Kirjanov 
2070ce58725fSDavid Vrabel 		netif_napi_add(queue->info->netdev, &queue->napi,
2071ce58725fSDavid Vrabel 			       xennet_poll, 64);
2072ce58725fSDavid Vrabel 		if (netif_running(info->netdev))
2073ce58725fSDavid Vrabel 			napi_enable(&queue->napi);
2074ce58725fSDavid Vrabel 	}
2075ce58725fSDavid Vrabel 
2076ca88ea12SJoe Jin 	netif_set_real_num_tx_queues(info->netdev, *num_queues);
2077ce58725fSDavid Vrabel 
2078ca88ea12SJoe Jin 	if (*num_queues == 0) {
2079f599c64fSRoss Lagerwall 		dev_err(&info->xbdev->dev, "no queues\n");
2080ce58725fSDavid Vrabel 		return -EINVAL;
2081ce58725fSDavid Vrabel 	}
2082ce58725fSDavid Vrabel 	return 0;
2083ce58725fSDavid Vrabel }
2084ce58725fSDavid Vrabel 
20850d160211SJeremy Fitzhardinge /* Common code used when first setting up, and when resuming. */
2086f502bf2bSIan Campbell static int talk_to_netback(struct xenbus_device *dev,
20870d160211SJeremy Fitzhardinge 			   struct netfront_info *info)
20880d160211SJeremy Fitzhardinge {
20890d160211SJeremy Fitzhardinge 	const char *message;
20900d160211SJeremy Fitzhardinge 	struct xenbus_transaction xbt;
20910d160211SJeremy Fitzhardinge 	int err;
20922688fcb7SAndrew J. Bennieston 	unsigned int feature_split_evtchn;
20932688fcb7SAndrew J. Bennieston 	unsigned int i = 0;
209450ee6061SAndrew J. Bennieston 	unsigned int max_queues = 0;
20952688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = NULL;
20962688fcb7SAndrew J. Bennieston 	unsigned int num_queues = 1;
20970d160211SJeremy Fitzhardinge 
20982688fcb7SAndrew J. Bennieston 	info->netdev->irq = 0;
20992688fcb7SAndrew J. Bennieston 
210050ee6061SAndrew J. Bennieston 	/* Check if backend supports multiple queues */
21012890ea5cSJuergen Gross 	max_queues = xenbus_read_unsigned(info->xbdev->otherend,
21022890ea5cSJuergen Gross 					  "multi-queue-max-queues", 1);
210350ee6061SAndrew J. Bennieston 	num_queues = min(max_queues, xennet_max_queues);
210450ee6061SAndrew J. Bennieston 
21052688fcb7SAndrew J. Bennieston 	/* Check feature-split-event-channels */
21062890ea5cSJuergen Gross 	feature_split_evtchn = xenbus_read_unsigned(info->xbdev->otherend,
21072890ea5cSJuergen Gross 					"feature-split-event-channels", 0);
21082688fcb7SAndrew J. Bennieston 
21092688fcb7SAndrew J. Bennieston 	/* Read mac addr. */
21102688fcb7SAndrew J. Bennieston 	err = xen_net_read_mac(dev, info->netdev->dev_addr);
21112688fcb7SAndrew J. Bennieston 	if (err) {
21122688fcb7SAndrew J. Bennieston 		xenbus_dev_fatal(dev, err, "parsing %s/mac", dev->nodename);
2113cb257783SRoss Lagerwall 		goto out_unlocked;
21142688fcb7SAndrew J. Bennieston 	}
21152688fcb7SAndrew J. Bennieston 
21166c5aa6fcSDenis Kirjanov 	info->netback_has_xdp_headroom = xenbus_read_unsigned(info->xbdev->otherend,
21176c5aa6fcSDenis Kirjanov 							      "feature-xdp-headroom", 0);
21186c5aa6fcSDenis Kirjanov 	if (info->netback_has_xdp_headroom) {
21196c5aa6fcSDenis Kirjanov 		/* set the current xen-netfront xdp state */
21206c5aa6fcSDenis Kirjanov 		err = talk_to_netback_xdp(info, info->netfront_xdp_enabled ?
21216c5aa6fcSDenis Kirjanov 					  NETBACK_XDP_HEADROOM_ENABLE :
21226c5aa6fcSDenis Kirjanov 					  NETBACK_XDP_HEADROOM_DISABLE);
21236c5aa6fcSDenis Kirjanov 		if (err)
21246c5aa6fcSDenis Kirjanov 			goto out_unlocked;
21256c5aa6fcSDenis Kirjanov 	}
21266c5aa6fcSDenis Kirjanov 
2127f599c64fSRoss Lagerwall 	rtnl_lock();
2128ce58725fSDavid Vrabel 	if (info->queues)
2129ce58725fSDavid Vrabel 		xennet_destroy_queues(info);
2130ce58725fSDavid Vrabel 
2131ca88ea12SJoe Jin 	err = xennet_create_queues(info, &num_queues);
2132e2e004acSRoss Lagerwall 	if (err < 0) {
2133e2e004acSRoss Lagerwall 		xenbus_dev_fatal(dev, err, "creating queues");
2134e2e004acSRoss Lagerwall 		kfree(info->queues);
2135e2e004acSRoss Lagerwall 		info->queues = NULL;
2136e2e004acSRoss Lagerwall 		goto out;
2137e2e004acSRoss Lagerwall 	}
2138f599c64fSRoss Lagerwall 	rtnl_unlock();
21392688fcb7SAndrew J. Bennieston 
21402688fcb7SAndrew J. Bennieston 	/* Create shared ring, alloc event channel -- for each queue */
21412688fcb7SAndrew J. Bennieston 	for (i = 0; i < num_queues; ++i) {
21422688fcb7SAndrew J. Bennieston 		queue = &info->queues[i];
21432688fcb7SAndrew J. Bennieston 		err = setup_netfront(dev, queue, feature_split_evtchn);
2144e2e004acSRoss Lagerwall 		if (err)
21452688fcb7SAndrew J. Bennieston 			goto destroy_ring;
21462688fcb7SAndrew J. Bennieston 	}
21470d160211SJeremy Fitzhardinge 
21480d160211SJeremy Fitzhardinge again:
21490d160211SJeremy Fitzhardinge 	err = xenbus_transaction_start(&xbt);
21500d160211SJeremy Fitzhardinge 	if (err) {
21510d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "starting transaction");
21520d160211SJeremy Fitzhardinge 		goto destroy_ring;
21530d160211SJeremy Fitzhardinge 	}
21540d160211SJeremy Fitzhardinge 
2155812494d9Schas williams 	if (xenbus_exists(XBT_NIL,
2156812494d9Schas williams 			  info->xbdev->otherend, "multi-queue-max-queues")) {
2157812494d9Schas williams 		/* Write the number of queues */
2158812494d9Schas williams 		err = xenbus_printf(xbt, dev->nodename,
2159812494d9Schas williams 				    "multi-queue-num-queues", "%u", num_queues);
2160812494d9Schas williams 		if (err) {
2161812494d9Schas williams 			message = "writing multi-queue-num-queues";
2162812494d9Schas williams 			goto abort_transaction_no_dev_fatal;
2163812494d9Schas williams 		}
2164812494d9Schas williams 	}
2165812494d9Schas williams 
216650ee6061SAndrew J. Bennieston 	if (num_queues == 1) {
216750ee6061SAndrew J. Bennieston 		err = write_queue_xenstore_keys(&info->queues[0], &xbt, 0); /* flat */
216850ee6061SAndrew J. Bennieston 		if (err)
216950ee6061SAndrew J. Bennieston 			goto abort_transaction_no_dev_fatal;
2170d634bf2cSWei Liu 	} else {
217150ee6061SAndrew J. Bennieston 		/* Write the keys for each queue */
217250ee6061SAndrew J. Bennieston 		for (i = 0; i < num_queues; ++i) {
217350ee6061SAndrew J. Bennieston 			queue = &info->queues[i];
217450ee6061SAndrew J. Bennieston 			err = write_queue_xenstore_keys(queue, &xbt, 1); /* hierarchical */
217550ee6061SAndrew J. Bennieston 			if (err)
217650ee6061SAndrew J. Bennieston 				goto abort_transaction_no_dev_fatal;
2177d634bf2cSWei Liu 		}
2178d634bf2cSWei Liu 	}
21790d160211SJeremy Fitzhardinge 
218050ee6061SAndrew J. Bennieston 	/* The remaining keys are not queue-specific */
21810d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "request-rx-copy", "%u",
21820d160211SJeremy Fitzhardinge 			    1);
21830d160211SJeremy Fitzhardinge 	if (err) {
21840d160211SJeremy Fitzhardinge 		message = "writing request-rx-copy";
21850d160211SJeremy Fitzhardinge 		goto abort_transaction;
21860d160211SJeremy Fitzhardinge 	}
21870d160211SJeremy Fitzhardinge 
21880d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-rx-notify", "%d", 1);
21890d160211SJeremy Fitzhardinge 	if (err) {
21900d160211SJeremy Fitzhardinge 		message = "writing feature-rx-notify";
21910d160211SJeremy Fitzhardinge 		goto abort_transaction;
21920d160211SJeremy Fitzhardinge 	}
21930d160211SJeremy Fitzhardinge 
21940d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-sg", "%d", 1);
21950d160211SJeremy Fitzhardinge 	if (err) {
21960d160211SJeremy Fitzhardinge 		message = "writing feature-sg";
21970d160211SJeremy Fitzhardinge 		goto abort_transaction;
21980d160211SJeremy Fitzhardinge 	}
21990d160211SJeremy Fitzhardinge 
22000d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-gso-tcpv4", "%d", 1);
22010d160211SJeremy Fitzhardinge 	if (err) {
22020d160211SJeremy Fitzhardinge 		message = "writing feature-gso-tcpv4";
22030d160211SJeremy Fitzhardinge 		goto abort_transaction;
22040d160211SJeremy Fitzhardinge 	}
22050d160211SJeremy Fitzhardinge 
22062c0057deSPaul Durrant 	err = xenbus_write(xbt, dev->nodename, "feature-gso-tcpv6", "1");
22072c0057deSPaul Durrant 	if (err) {
22082c0057deSPaul Durrant 		message = "writing feature-gso-tcpv6";
22092c0057deSPaul Durrant 		goto abort_transaction;
22102c0057deSPaul Durrant 	}
22112c0057deSPaul Durrant 
22122c0057deSPaul Durrant 	err = xenbus_write(xbt, dev->nodename, "feature-ipv6-csum-offload",
22132c0057deSPaul Durrant 			   "1");
22142c0057deSPaul Durrant 	if (err) {
22152c0057deSPaul Durrant 		message = "writing feature-ipv6-csum-offload";
22162c0057deSPaul Durrant 		goto abort_transaction;
22172c0057deSPaul Durrant 	}
22182c0057deSPaul Durrant 
22190d160211SJeremy Fitzhardinge 	err = xenbus_transaction_end(xbt, 0);
22200d160211SJeremy Fitzhardinge 	if (err) {
22210d160211SJeremy Fitzhardinge 		if (err == -EAGAIN)
22220d160211SJeremy Fitzhardinge 			goto again;
22230d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "completing transaction");
22240d160211SJeremy Fitzhardinge 		goto destroy_ring;
22250d160211SJeremy Fitzhardinge 	}
22260d160211SJeremy Fitzhardinge 
22270d160211SJeremy Fitzhardinge 	return 0;
22280d160211SJeremy Fitzhardinge 
22290d160211SJeremy Fitzhardinge  abort_transaction:
22300d160211SJeremy Fitzhardinge 	xenbus_dev_fatal(dev, err, "%s", message);
223150ee6061SAndrew J. Bennieston abort_transaction_no_dev_fatal:
223250ee6061SAndrew J. Bennieston 	xenbus_transaction_end(xbt, 1);
22330d160211SJeremy Fitzhardinge  destroy_ring:
22340d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
2235f599c64fSRoss Lagerwall 	rtnl_lock();
2236e2e004acSRoss Lagerwall 	xennet_destroy_queues(info);
22370d160211SJeremy Fitzhardinge  out:
2238f599c64fSRoss Lagerwall 	rtnl_unlock();
2239cb257783SRoss Lagerwall out_unlocked:
2240d86b5672SVitaly Kuznetsov 	device_unregister(&dev->dev);
22410d160211SJeremy Fitzhardinge 	return err;
22420d160211SJeremy Fitzhardinge }
22430d160211SJeremy Fitzhardinge 
22440d160211SJeremy Fitzhardinge static int xennet_connect(struct net_device *dev)
22450d160211SJeremy Fitzhardinge {
22460d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
22472688fcb7SAndrew J. Bennieston 	unsigned int num_queues = 0;
2248a5b5dc3cSDavid Vrabel 	int err;
22492688fcb7SAndrew J. Bennieston 	unsigned int j = 0;
22502688fcb7SAndrew J. Bennieston 	struct netfront_queue *queue = NULL;
22510d160211SJeremy Fitzhardinge 
22522890ea5cSJuergen Gross 	if (!xenbus_read_unsigned(np->xbdev->otherend, "feature-rx-copy", 0)) {
22530d160211SJeremy Fitzhardinge 		dev_info(&dev->dev,
2254898eb71cSJoe Perches 			 "backend does not support copying receive path\n");
22550d160211SJeremy Fitzhardinge 		return -ENODEV;
22560d160211SJeremy Fitzhardinge 	}
22570d160211SJeremy Fitzhardinge 
2258f502bf2bSIan Campbell 	err = talk_to_netback(np->xbdev, np);
22590d160211SJeremy Fitzhardinge 	if (err)
22600d160211SJeremy Fitzhardinge 		return err;
22616c5aa6fcSDenis Kirjanov 	if (np->netback_has_xdp_headroom)
22626c5aa6fcSDenis Kirjanov 		pr_info("backend supports XDP headroom\n");
22630d160211SJeremy Fitzhardinge 
22642688fcb7SAndrew J. Bennieston 	/* talk_to_netback() sets the correct number of queues */
22652688fcb7SAndrew J. Bennieston 	num_queues = dev->real_num_tx_queues;
22662688fcb7SAndrew J. Bennieston 
2267f599c64fSRoss Lagerwall 	if (dev->reg_state == NETREG_UNINITIALIZED) {
2268f599c64fSRoss Lagerwall 		err = register_netdev(dev);
2269f599c64fSRoss Lagerwall 		if (err) {
2270f599c64fSRoss Lagerwall 			pr_warn("%s: register_netdev err=%d\n", __func__, err);
2271f599c64fSRoss Lagerwall 			device_unregister(&np->xbdev->dev);
2272f599c64fSRoss Lagerwall 			return err;
2273f599c64fSRoss Lagerwall 		}
2274f599c64fSRoss Lagerwall 	}
2275f599c64fSRoss Lagerwall 
227645c8184cSRoss Lagerwall 	rtnl_lock();
227745c8184cSRoss Lagerwall 	netdev_update_features(dev);
227845c8184cSRoss Lagerwall 	rtnl_unlock();
227945c8184cSRoss Lagerwall 
22800d160211SJeremy Fitzhardinge 	/*
2281a5b5dc3cSDavid Vrabel 	 * All public and private state should now be sane.  Get
22820d160211SJeremy Fitzhardinge 	 * ready to start sending and receiving packets and give the driver
22830d160211SJeremy Fitzhardinge 	 * domain a kick because we've probably just requeued some
22840d160211SJeremy Fitzhardinge 	 * packets.
22850d160211SJeremy Fitzhardinge 	 */
22860d160211SJeremy Fitzhardinge 	netif_carrier_on(np->netdev);
22872688fcb7SAndrew J. Bennieston 	for (j = 0; j < num_queues; ++j) {
22882688fcb7SAndrew J. Bennieston 		queue = &np->queues[j];
2289f50b4076SDavid Vrabel 
22902688fcb7SAndrew J. Bennieston 		notify_remote_via_irq(queue->tx_irq);
22912688fcb7SAndrew J. Bennieston 		if (queue->tx_irq != queue->rx_irq)
22922688fcb7SAndrew J. Bennieston 			notify_remote_via_irq(queue->rx_irq);
22930d160211SJeremy Fitzhardinge 
2294f50b4076SDavid Vrabel 		spin_lock_irq(&queue->tx_lock);
2295f50b4076SDavid Vrabel 		xennet_tx_buf_gc(queue);
22962688fcb7SAndrew J. Bennieston 		spin_unlock_irq(&queue->tx_lock);
2297f50b4076SDavid Vrabel 
2298f50b4076SDavid Vrabel 		spin_lock_bh(&queue->rx_lock);
2299f50b4076SDavid Vrabel 		xennet_alloc_rx_buffers(queue);
23002688fcb7SAndrew J. Bennieston 		spin_unlock_bh(&queue->rx_lock);
23012688fcb7SAndrew J. Bennieston 	}
23020d160211SJeremy Fitzhardinge 
23030d160211SJeremy Fitzhardinge 	return 0;
23040d160211SJeremy Fitzhardinge }
23050d160211SJeremy Fitzhardinge 
230680708602SLee Jones /*
23070d160211SJeremy Fitzhardinge  * Callback received when the backend's state changes.
23080d160211SJeremy Fitzhardinge  */
2309f502bf2bSIan Campbell static void netback_changed(struct xenbus_device *dev,
23100d160211SJeremy Fitzhardinge 			    enum xenbus_state backend_state)
23110d160211SJeremy Fitzhardinge {
23121b713e00SGreg Kroah-Hartman 	struct netfront_info *np = dev_get_drvdata(&dev->dev);
23130d160211SJeremy Fitzhardinge 	struct net_device *netdev = np->netdev;
23140d160211SJeremy Fitzhardinge 
23150d160211SJeremy Fitzhardinge 	dev_dbg(&dev->dev, "%s\n", xenbus_strstate(backend_state));
23160d160211SJeremy Fitzhardinge 
23178edfe2e9SJuergen Gross 	wake_up_all(&module_wq);
23188edfe2e9SJuergen Gross 
23190d160211SJeremy Fitzhardinge 	switch (backend_state) {
23200d160211SJeremy Fitzhardinge 	case XenbusStateInitialising:
23210d160211SJeremy Fitzhardinge 	case XenbusStateInitialised:
2322b78c9512SNoboru Iwamatsu 	case XenbusStateReconfiguring:
2323b78c9512SNoboru Iwamatsu 	case XenbusStateReconfigured:
23240d160211SJeremy Fitzhardinge 	case XenbusStateUnknown:
23250d160211SJeremy Fitzhardinge 		break;
23260d160211SJeremy Fitzhardinge 
23270d160211SJeremy Fitzhardinge 	case XenbusStateInitWait:
23280d160211SJeremy Fitzhardinge 		if (dev->state != XenbusStateInitialising)
23290d160211SJeremy Fitzhardinge 			break;
23300d160211SJeremy Fitzhardinge 		if (xennet_connect(netdev) != 0)
23310d160211SJeremy Fitzhardinge 			break;
23320d160211SJeremy Fitzhardinge 		xenbus_switch_state(dev, XenbusStateConnected);
233308e34eb1SLaszlo Ersek 		break;
233408e34eb1SLaszlo Ersek 
233508e34eb1SLaszlo Ersek 	case XenbusStateConnected:
2336ee89bab1SAmerigo Wang 		netdev_notify_peers(netdev);
23370d160211SJeremy Fitzhardinge 		break;
23380d160211SJeremy Fitzhardinge 
2339bce3ea81SDavid Vrabel 	case XenbusStateClosed:
2340bce3ea81SDavid Vrabel 		if (dev->state == XenbusStateClosed)
2341bce3ea81SDavid Vrabel 			break;
2342df561f66SGustavo A. R. Silva 		fallthrough;	/* Missed the backend's CLOSING state */
23430d160211SJeremy Fitzhardinge 	case XenbusStateClosing:
23440d160211SJeremy Fitzhardinge 		xenbus_frontend_closed(dev);
23450d160211SJeremy Fitzhardinge 		break;
23460d160211SJeremy Fitzhardinge 	}
23470d160211SJeremy Fitzhardinge }
23480d160211SJeremy Fitzhardinge 
2349e0ce4af9SIan Campbell static const struct xennet_stat {
2350e0ce4af9SIan Campbell 	char name[ETH_GSTRING_LEN];
2351e0ce4af9SIan Campbell 	u16 offset;
2352e0ce4af9SIan Campbell } xennet_stats[] = {
2353e0ce4af9SIan Campbell 	{
2354e0ce4af9SIan Campbell 		"rx_gso_checksum_fixup",
2355e0ce4af9SIan Campbell 		offsetof(struct netfront_info, rx_gso_checksum_fixup)
2356e0ce4af9SIan Campbell 	},
2357e0ce4af9SIan Campbell };
2358e0ce4af9SIan Campbell 
2359e0ce4af9SIan Campbell static int xennet_get_sset_count(struct net_device *dev, int string_set)
2360e0ce4af9SIan Campbell {
2361e0ce4af9SIan Campbell 	switch (string_set) {
2362e0ce4af9SIan Campbell 	case ETH_SS_STATS:
2363e0ce4af9SIan Campbell 		return ARRAY_SIZE(xennet_stats);
2364e0ce4af9SIan Campbell 	default:
2365e0ce4af9SIan Campbell 		return -EINVAL;
2366e0ce4af9SIan Campbell 	}
2367e0ce4af9SIan Campbell }
2368e0ce4af9SIan Campbell 
2369e0ce4af9SIan Campbell static void xennet_get_ethtool_stats(struct net_device *dev,
2370e0ce4af9SIan Campbell 				     struct ethtool_stats *stats, u64 * data)
2371e0ce4af9SIan Campbell {
2372e0ce4af9SIan Campbell 	void *np = netdev_priv(dev);
2373e0ce4af9SIan Campbell 	int i;
2374e0ce4af9SIan Campbell 
2375e0ce4af9SIan Campbell 	for (i = 0; i < ARRAY_SIZE(xennet_stats); i++)
23762688fcb7SAndrew J. Bennieston 		data[i] = atomic_read((atomic_t *)(np + xennet_stats[i].offset));
2377e0ce4af9SIan Campbell }
2378e0ce4af9SIan Campbell 
2379e0ce4af9SIan Campbell static void xennet_get_strings(struct net_device *dev, u32 stringset, u8 * data)
2380e0ce4af9SIan Campbell {
2381e0ce4af9SIan Campbell 	int i;
2382e0ce4af9SIan Campbell 
2383e0ce4af9SIan Campbell 	switch (stringset) {
2384e0ce4af9SIan Campbell 	case ETH_SS_STATS:
2385e0ce4af9SIan Campbell 		for (i = 0; i < ARRAY_SIZE(xennet_stats); i++)
2386e0ce4af9SIan Campbell 			memcpy(data + i * ETH_GSTRING_LEN,
2387e0ce4af9SIan Campbell 			       xennet_stats[i].name, ETH_GSTRING_LEN);
2388e0ce4af9SIan Campbell 		break;
2389e0ce4af9SIan Campbell 	}
2390e0ce4af9SIan Campbell }
2391e0ce4af9SIan Campbell 
23920fc0b732SStephen Hemminger static const struct ethtool_ops xennet_ethtool_ops =
23930d160211SJeremy Fitzhardinge {
23940d160211SJeremy Fitzhardinge 	.get_link = ethtool_op_get_link,
2395e0ce4af9SIan Campbell 
2396e0ce4af9SIan Campbell 	.get_sset_count = xennet_get_sset_count,
2397e0ce4af9SIan Campbell 	.get_ethtool_stats = xennet_get_ethtool_stats,
2398e0ce4af9SIan Campbell 	.get_strings = xennet_get_strings,
239991ffb9d3SDaniel Drown 	.get_ts_info = ethtool_op_get_ts_info,
24000d160211SJeremy Fitzhardinge };
24010d160211SJeremy Fitzhardinge 
24020d160211SJeremy Fitzhardinge #ifdef CONFIG_SYSFS
24031f3c2ebaSDavid Vrabel static ssize_t show_rxbuf(struct device *dev,
24040d160211SJeremy Fitzhardinge 			  struct device_attribute *attr, char *buf)
24050d160211SJeremy Fitzhardinge {
24061f3c2ebaSDavid Vrabel 	return sprintf(buf, "%lu\n", NET_RX_RING_SIZE);
24070d160211SJeremy Fitzhardinge }
24080d160211SJeremy Fitzhardinge 
24091f3c2ebaSDavid Vrabel static ssize_t store_rxbuf(struct device *dev,
24100d160211SJeremy Fitzhardinge 			   struct device_attribute *attr,
24110d160211SJeremy Fitzhardinge 			   const char *buf, size_t len)
24120d160211SJeremy Fitzhardinge {
24130d160211SJeremy Fitzhardinge 	char *endp;
24140d160211SJeremy Fitzhardinge 
24150d160211SJeremy Fitzhardinge 	if (!capable(CAP_NET_ADMIN))
24160d160211SJeremy Fitzhardinge 		return -EPERM;
24170d160211SJeremy Fitzhardinge 
24188ed7ec13SAndrew Lunn 	simple_strtoul(buf, &endp, 0);
24190d160211SJeremy Fitzhardinge 	if (endp == buf)
24200d160211SJeremy Fitzhardinge 		return -EBADMSG;
24210d160211SJeremy Fitzhardinge 
24221f3c2ebaSDavid Vrabel 	/* rxbuf_min and rxbuf_max are no longer configurable. */
24230d160211SJeremy Fitzhardinge 
24240d160211SJeremy Fitzhardinge 	return len;
24250d160211SJeremy Fitzhardinge }
24260d160211SJeremy Fitzhardinge 
2427d61e4038SJoe Perches static DEVICE_ATTR(rxbuf_min, 0644, show_rxbuf, store_rxbuf);
2428d61e4038SJoe Perches static DEVICE_ATTR(rxbuf_max, 0644, show_rxbuf, store_rxbuf);
2429d61e4038SJoe Perches static DEVICE_ATTR(rxbuf_cur, 0444, show_rxbuf, NULL);
243027b917e5STakashi Iwai 
243127b917e5STakashi Iwai static struct attribute *xennet_dev_attrs[] = {
243227b917e5STakashi Iwai 	&dev_attr_rxbuf_min.attr,
243327b917e5STakashi Iwai 	&dev_attr_rxbuf_max.attr,
243427b917e5STakashi Iwai 	&dev_attr_rxbuf_cur.attr,
243527b917e5STakashi Iwai 	NULL
24360d160211SJeremy Fitzhardinge };
24370d160211SJeremy Fitzhardinge 
243827b917e5STakashi Iwai static const struct attribute_group xennet_dev_group = {
243927b917e5STakashi Iwai 	.attrs = xennet_dev_attrs
244027b917e5STakashi Iwai };
24410d160211SJeremy Fitzhardinge #endif /* CONFIG_SYSFS */
24420d160211SJeremy Fitzhardinge 
2443c2c63310SAndrea Righi static void xennet_bus_close(struct xenbus_device *dev)
2444c2c63310SAndrea Righi {
2445c2c63310SAndrea Righi 	int ret;
2446c2c63310SAndrea Righi 
2447c2c63310SAndrea Righi 	if (xenbus_read_driver_state(dev->otherend) == XenbusStateClosed)
2448c2c63310SAndrea Righi 		return;
2449c2c63310SAndrea Righi 	do {
2450c2c63310SAndrea Righi 		xenbus_switch_state(dev, XenbusStateClosing);
2451c2c63310SAndrea Righi 		ret = wait_event_timeout(module_wq,
2452c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2453c2c63310SAndrea Righi 				   XenbusStateClosing ||
2454c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2455c2c63310SAndrea Righi 				   XenbusStateClosed ||
2456c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2457c2c63310SAndrea Righi 				   XenbusStateUnknown,
2458c2c63310SAndrea Righi 				   XENNET_TIMEOUT);
2459c2c63310SAndrea Righi 	} while (!ret);
2460c2c63310SAndrea Righi 
2461c2c63310SAndrea Righi 	if (xenbus_read_driver_state(dev->otherend) == XenbusStateClosed)
2462c2c63310SAndrea Righi 		return;
2463c2c63310SAndrea Righi 
2464c2c63310SAndrea Righi 	do {
2465c2c63310SAndrea Righi 		xenbus_switch_state(dev, XenbusStateClosed);
2466c2c63310SAndrea Righi 		ret = wait_event_timeout(module_wq,
2467c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2468c2c63310SAndrea Righi 				   XenbusStateClosed ||
2469c2c63310SAndrea Righi 				   xenbus_read_driver_state(dev->otherend) ==
2470c2c63310SAndrea Righi 				   XenbusStateUnknown,
2471c2c63310SAndrea Righi 				   XENNET_TIMEOUT);
2472c2c63310SAndrea Righi 	} while (!ret);
2473c2c63310SAndrea Righi }
2474c2c63310SAndrea Righi 
24758e0e46bbSBill Pemberton static int xennet_remove(struct xenbus_device *dev)
24760d160211SJeremy Fitzhardinge {
24771b713e00SGreg Kroah-Hartman 	struct netfront_info *info = dev_get_drvdata(&dev->dev);
24780d160211SJeremy Fitzhardinge 
2479c2c63310SAndrea Righi 	xennet_bus_close(dev);
24800d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
24810d160211SJeremy Fitzhardinge 
2482f599c64fSRoss Lagerwall 	if (info->netdev->reg_state == NETREG_REGISTERED)
24836bc96d04SIan Campbell 		unregister_netdev(info->netdev);
24846bc96d04SIan Campbell 
2485f599c64fSRoss Lagerwall 	if (info->queues) {
2486f599c64fSRoss Lagerwall 		rtnl_lock();
2487ad068118SDavid Vrabel 		xennet_destroy_queues(info);
2488f599c64fSRoss Lagerwall 		rtnl_unlock();
2489f599c64fSRoss Lagerwall 	}
2490900e1833SDavid Vrabel 	xennet_free_netdev(info->netdev);
24910d160211SJeremy Fitzhardinge 
24920d160211SJeremy Fitzhardinge 	return 0;
24930d160211SJeremy Fitzhardinge }
24940d160211SJeremy Fitzhardinge 
249595afae48SDavid Vrabel static const struct xenbus_device_id netfront_ids[] = {
249695afae48SDavid Vrabel 	{ "vif" },
249795afae48SDavid Vrabel 	{ "" }
249895afae48SDavid Vrabel };
249995afae48SDavid Vrabel 
250095afae48SDavid Vrabel static struct xenbus_driver netfront_driver = {
250195afae48SDavid Vrabel 	.ids = netfront_ids,
25020d160211SJeremy Fitzhardinge 	.probe = netfront_probe,
25038e0e46bbSBill Pemberton 	.remove = xennet_remove,
25040d160211SJeremy Fitzhardinge 	.resume = netfront_resume,
2505f502bf2bSIan Campbell 	.otherend_changed = netback_changed,
250695afae48SDavid Vrabel };
25070d160211SJeremy Fitzhardinge 
25080d160211SJeremy Fitzhardinge static int __init netif_init(void)
25090d160211SJeremy Fitzhardinge {
25106e833587SJeremy Fitzhardinge 	if (!xen_domain())
25110d160211SJeremy Fitzhardinge 		return -ENODEV;
25120d160211SJeremy Fitzhardinge 
251351c71a3bSKonrad Rzeszutek Wilk 	if (!xen_has_pv_nic_devices())
2514b9136d20SIgor Mammedov 		return -ENODEV;
2515b9136d20SIgor Mammedov 
2516383eda32SJoe Perches 	pr_info("Initialising Xen virtual ethernet driver\n");
25170d160211SJeremy Fitzhardinge 
2518034702a6SJuergen Gross 	/* Allow as many queues as there are CPUs inut max. 8 if user has not
251932a84405SWei Liu 	 * specified a value.
252032a84405SWei Liu 	 */
252132a84405SWei Liu 	if (xennet_max_queues == 0)
2522034702a6SJuergen Gross 		xennet_max_queues = min_t(unsigned int, MAX_QUEUES_DEFAULT,
2523034702a6SJuergen Gross 					  num_online_cpus());
252450ee6061SAndrew J. Bennieston 
2525ffb78a26SAl Viro 	return xenbus_register_frontend(&netfront_driver);
25260d160211SJeremy Fitzhardinge }
25270d160211SJeremy Fitzhardinge module_init(netif_init);
25280d160211SJeremy Fitzhardinge 
25290d160211SJeremy Fitzhardinge 
25300d160211SJeremy Fitzhardinge static void __exit netif_exit(void)
25310d160211SJeremy Fitzhardinge {
2532ffb78a26SAl Viro 	xenbus_unregister_driver(&netfront_driver);
25330d160211SJeremy Fitzhardinge }
25340d160211SJeremy Fitzhardinge module_exit(netif_exit);
25350d160211SJeremy Fitzhardinge 
25360d160211SJeremy Fitzhardinge MODULE_DESCRIPTION("Xen virtual network device frontend");
25370d160211SJeremy Fitzhardinge MODULE_LICENSE("GPL");
2538d2f0c52bSMark McLoughlin MODULE_ALIAS("xen:vif");
25394f93f09bSMark McLoughlin MODULE_ALIAS("xennet");
2540