xref: /openbmc/linux/drivers/net/xen-netfront.c (revision fc741216)
10d160211SJeremy Fitzhardinge /*
20d160211SJeremy Fitzhardinge  * Virtual network driver for conversing with remote driver backends.
30d160211SJeremy Fitzhardinge  *
40d160211SJeremy Fitzhardinge  * Copyright (c) 2002-2005, K A Fraser
50d160211SJeremy Fitzhardinge  * Copyright (c) 2005, XenSource Ltd
60d160211SJeremy Fitzhardinge  *
70d160211SJeremy Fitzhardinge  * This program is free software; you can redistribute it and/or
80d160211SJeremy Fitzhardinge  * modify it under the terms of the GNU General Public License version 2
90d160211SJeremy Fitzhardinge  * as published by the Free Software Foundation; or, when distributed
100d160211SJeremy Fitzhardinge  * separately from the Linux kernel or incorporated into other
110d160211SJeremy Fitzhardinge  * software packages, subject to the following license:
120d160211SJeremy Fitzhardinge  *
130d160211SJeremy Fitzhardinge  * Permission is hereby granted, free of charge, to any person obtaining a copy
140d160211SJeremy Fitzhardinge  * of this source file (the "Software"), to deal in the Software without
150d160211SJeremy Fitzhardinge  * restriction, including without limitation the rights to use, copy, modify,
160d160211SJeremy Fitzhardinge  * merge, publish, distribute, sublicense, and/or sell copies of the Software,
170d160211SJeremy Fitzhardinge  * and to permit persons to whom the Software is furnished to do so, subject to
180d160211SJeremy Fitzhardinge  * the following conditions:
190d160211SJeremy Fitzhardinge  *
200d160211SJeremy Fitzhardinge  * The above copyright notice and this permission notice shall be included in
210d160211SJeremy Fitzhardinge  * all copies or substantial portions of the Software.
220d160211SJeremy Fitzhardinge  *
230d160211SJeremy Fitzhardinge  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
240d160211SJeremy Fitzhardinge  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
250d160211SJeremy Fitzhardinge  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
260d160211SJeremy Fitzhardinge  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
270d160211SJeremy Fitzhardinge  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
280d160211SJeremy Fitzhardinge  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
290d160211SJeremy Fitzhardinge  * IN THE SOFTWARE.
300d160211SJeremy Fitzhardinge  */
310d160211SJeremy Fitzhardinge 
320d160211SJeremy Fitzhardinge #include <linux/module.h>
330d160211SJeremy Fitzhardinge #include <linux/kernel.h>
340d160211SJeremy Fitzhardinge #include <linux/netdevice.h>
350d160211SJeremy Fitzhardinge #include <linux/etherdevice.h>
360d160211SJeremy Fitzhardinge #include <linux/skbuff.h>
370d160211SJeremy Fitzhardinge #include <linux/ethtool.h>
380d160211SJeremy Fitzhardinge #include <linux/if_ether.h>
390d160211SJeremy Fitzhardinge #include <linux/tcp.h>
400d160211SJeremy Fitzhardinge #include <linux/udp.h>
410d160211SJeremy Fitzhardinge #include <linux/moduleparam.h>
420d160211SJeremy Fitzhardinge #include <linux/mm.h>
435a0e3ad6STejun Heo #include <linux/slab.h>
440d160211SJeremy Fitzhardinge #include <net/ip.h>
450d160211SJeremy Fitzhardinge 
461ccbf534SJeremy Fitzhardinge #include <xen/xen.h>
470d160211SJeremy Fitzhardinge #include <xen/xenbus.h>
480d160211SJeremy Fitzhardinge #include <xen/events.h>
490d160211SJeremy Fitzhardinge #include <xen/page.h>
500d160211SJeremy Fitzhardinge #include <xen/grant_table.h>
510d160211SJeremy Fitzhardinge 
520d160211SJeremy Fitzhardinge #include <xen/interface/io/netif.h>
530d160211SJeremy Fitzhardinge #include <xen/interface/memory.h>
540d160211SJeremy Fitzhardinge #include <xen/interface/grant_table.h>
550d160211SJeremy Fitzhardinge 
560fc0b732SStephen Hemminger static const struct ethtool_ops xennet_ethtool_ops;
570d160211SJeremy Fitzhardinge 
/*
 * Driver-private data overlaid on an skb's control buffer (skb->cb).
 * Always reach it through NETFRONT_SKB_CB().
 */
struct netfront_cb {
	struct page *page;
	unsigned int offset;
};

/* Interpret the control buffer of @skb as a struct netfront_cb. */
#define NETFRONT_SKB_CB(skb)	((struct netfront_cb *)((skb)->cb))
640d160211SJeremy Fitzhardinge 
/* Linear-area size (before NET_IP_ALIGN) requested for each receive skb. */
#define RX_COPY_THRESHOLD 256

/* Stored in grant_{tx,rx}_ref[] entries that currently hold no grant. */
#define GRANT_INVALID_REF	0

/* Number of slots in a tx / rx shared ring occupying PAGE_SIZE bytes. */
#define NET_TX_RING_SIZE __CONST_RING_SIZE(xen_netif_tx, PAGE_SIZE)
#define NET_RX_RING_SIZE __CONST_RING_SIZE(xen_netif_rx, PAGE_SIZE)

/*
 * Upper bound on outstanding tx requests, consulted by
 * netfront_tx_slot_available().  It limits the *transmit* ring, so it is
 * derived from the tx ring size (not the rx ring size).
 */
#define TX_MAX_TARGET min_t(int, NET_TX_RING_SIZE, 256)
720d160211SJeremy Fitzhardinge 
730d160211SJeremy Fitzhardinge struct netfront_info {
740d160211SJeremy Fitzhardinge 	struct list_head list;
750d160211SJeremy Fitzhardinge 	struct net_device *netdev;
760d160211SJeremy Fitzhardinge 
77bea3348eSStephen Hemminger 	struct napi_struct napi;
780d160211SJeremy Fitzhardinge 
7984284d3cSJeremy Fitzhardinge 	unsigned int evtchn;
8084284d3cSJeremy Fitzhardinge 	struct xenbus_device *xbdev;
810d160211SJeremy Fitzhardinge 
820d160211SJeremy Fitzhardinge 	spinlock_t   tx_lock;
8384284d3cSJeremy Fitzhardinge 	struct xen_netif_tx_front_ring tx;
8484284d3cSJeremy Fitzhardinge 	int tx_ring_ref;
850d160211SJeremy Fitzhardinge 
860d160211SJeremy Fitzhardinge 	/*
870d160211SJeremy Fitzhardinge 	 * {tx,rx}_skbs store outstanding skbuffs. Free tx_skb entries
880d160211SJeremy Fitzhardinge 	 * are linked from tx_skb_freelist through skb_entry.link.
890d160211SJeremy Fitzhardinge 	 *
900d160211SJeremy Fitzhardinge 	 *  NB. Freelist index entries are always going to be less than
910d160211SJeremy Fitzhardinge 	 *  PAGE_OFFSET, whereas pointers to skbs will always be equal or
920d160211SJeremy Fitzhardinge 	 *  greater than PAGE_OFFSET: we use this property to distinguish
930d160211SJeremy Fitzhardinge 	 *  them.
940d160211SJeremy Fitzhardinge 	 */
950d160211SJeremy Fitzhardinge 	union skb_entry {
960d160211SJeremy Fitzhardinge 		struct sk_buff *skb;
971ffb40b8SIsaku Yamahata 		unsigned long link;
980d160211SJeremy Fitzhardinge 	} tx_skbs[NET_TX_RING_SIZE];
990d160211SJeremy Fitzhardinge 	grant_ref_t gref_tx_head;
1000d160211SJeremy Fitzhardinge 	grant_ref_t grant_tx_ref[NET_TX_RING_SIZE];
1010d160211SJeremy Fitzhardinge 	unsigned tx_skb_freelist;
1020d160211SJeremy Fitzhardinge 
10384284d3cSJeremy Fitzhardinge 	spinlock_t   rx_lock ____cacheline_aligned_in_smp;
10484284d3cSJeremy Fitzhardinge 	struct xen_netif_rx_front_ring rx;
10584284d3cSJeremy Fitzhardinge 	int rx_ring_ref;
10684284d3cSJeremy Fitzhardinge 
10784284d3cSJeremy Fitzhardinge 	/* Receive-ring batched refills. */
10884284d3cSJeremy Fitzhardinge #define RX_MIN_TARGET 8
10984284d3cSJeremy Fitzhardinge #define RX_DFL_MIN_TARGET 64
11084284d3cSJeremy Fitzhardinge #define RX_MAX_TARGET min_t(int, NET_RX_RING_SIZE, 256)
11184284d3cSJeremy Fitzhardinge 	unsigned rx_min_target, rx_max_target, rx_target;
11284284d3cSJeremy Fitzhardinge 	struct sk_buff_head rx_batch;
11384284d3cSJeremy Fitzhardinge 
11484284d3cSJeremy Fitzhardinge 	struct timer_list rx_refill_timer;
11584284d3cSJeremy Fitzhardinge 
1160d160211SJeremy Fitzhardinge 	struct sk_buff *rx_skbs[NET_RX_RING_SIZE];
1170d160211SJeremy Fitzhardinge 	grant_ref_t gref_rx_head;
1180d160211SJeremy Fitzhardinge 	grant_ref_t grant_rx_ref[NET_RX_RING_SIZE];
1190d160211SJeremy Fitzhardinge 
1200d160211SJeremy Fitzhardinge 	unsigned long rx_pfn_array[NET_RX_RING_SIZE];
1210d160211SJeremy Fitzhardinge 	struct multicall_entry rx_mcl[NET_RX_RING_SIZE+1];
1220d160211SJeremy Fitzhardinge 	struct mmu_update rx_mmu[NET_RX_RING_SIZE];
1230d160211SJeremy Fitzhardinge };
1240d160211SJeremy Fitzhardinge 
1250d160211SJeremy Fitzhardinge struct netfront_rx_info {
1260d160211SJeremy Fitzhardinge 	struct xen_netif_rx_response rx;
1270d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info extras[XEN_NETIF_EXTRA_TYPE_MAX - 1];
1280d160211SJeremy Fitzhardinge };
1290d160211SJeremy Fitzhardinge 
1301ffb40b8SIsaku Yamahata static void skb_entry_set_link(union skb_entry *list, unsigned short id)
1311ffb40b8SIsaku Yamahata {
1321ffb40b8SIsaku Yamahata 	list->link = id;
1331ffb40b8SIsaku Yamahata }
1341ffb40b8SIsaku Yamahata 
1351ffb40b8SIsaku Yamahata static int skb_entry_is_link(const union skb_entry *list)
1361ffb40b8SIsaku Yamahata {
1371ffb40b8SIsaku Yamahata 	BUILD_BUG_ON(sizeof(list->skb) != sizeof(list->link));
138807540baSEric Dumazet 	return (unsigned long)list->skb < PAGE_OFFSET;
1391ffb40b8SIsaku Yamahata }
1401ffb40b8SIsaku Yamahata 
/*
 * Helpers for acquiring and freeing slots in tx_skbs[].
 */
1440d160211SJeremy Fitzhardinge 
1450d160211SJeremy Fitzhardinge static void add_id_to_freelist(unsigned *head, union skb_entry *list,
1460d160211SJeremy Fitzhardinge 			       unsigned short id)
1470d160211SJeremy Fitzhardinge {
1481ffb40b8SIsaku Yamahata 	skb_entry_set_link(&list[id], *head);
1490d160211SJeremy Fitzhardinge 	*head = id;
1500d160211SJeremy Fitzhardinge }
1510d160211SJeremy Fitzhardinge 
1520d160211SJeremy Fitzhardinge static unsigned short get_id_from_freelist(unsigned *head,
1530d160211SJeremy Fitzhardinge 					   union skb_entry *list)
1540d160211SJeremy Fitzhardinge {
1550d160211SJeremy Fitzhardinge 	unsigned int id = *head;
1560d160211SJeremy Fitzhardinge 	*head = list[id].link;
1570d160211SJeremy Fitzhardinge 	return id;
1580d160211SJeremy Fitzhardinge }
1590d160211SJeremy Fitzhardinge 
1600d160211SJeremy Fitzhardinge static int xennet_rxidx(RING_IDX idx)
1610d160211SJeremy Fitzhardinge {
1620d160211SJeremy Fitzhardinge 	return idx & (NET_RX_RING_SIZE - 1);
1630d160211SJeremy Fitzhardinge }
1640d160211SJeremy Fitzhardinge 
1650d160211SJeremy Fitzhardinge static struct sk_buff *xennet_get_rx_skb(struct netfront_info *np,
1660d160211SJeremy Fitzhardinge 					 RING_IDX ri)
1670d160211SJeremy Fitzhardinge {
1680d160211SJeremy Fitzhardinge 	int i = xennet_rxidx(ri);
1690d160211SJeremy Fitzhardinge 	struct sk_buff *skb = np->rx_skbs[i];
1700d160211SJeremy Fitzhardinge 	np->rx_skbs[i] = NULL;
1710d160211SJeremy Fitzhardinge 	return skb;
1720d160211SJeremy Fitzhardinge }
1730d160211SJeremy Fitzhardinge 
1740d160211SJeremy Fitzhardinge static grant_ref_t xennet_get_rx_ref(struct netfront_info *np,
1750d160211SJeremy Fitzhardinge 					    RING_IDX ri)
1760d160211SJeremy Fitzhardinge {
1770d160211SJeremy Fitzhardinge 	int i = xennet_rxidx(ri);
1780d160211SJeremy Fitzhardinge 	grant_ref_t ref = np->grant_rx_ref[i];
1790d160211SJeremy Fitzhardinge 	np->grant_rx_ref[i] = GRANT_INVALID_REF;
1800d160211SJeremy Fitzhardinge 	return ref;
1810d160211SJeremy Fitzhardinge }
1820d160211SJeremy Fitzhardinge 
/*
 * sysfs hooks.  When CONFIG_SYSFS is not set they collapse to stubs:
 * xennet_sysfs_addif() evaluates to 0 and xennet_sysfs_delif() to an
 * empty statement.
 */
#ifdef CONFIG_SYSFS
static int xennet_sysfs_addif(struct net_device *netdev);
static void xennet_sysfs_delif(struct net_device *netdev);
#else /* !CONFIG_SYSFS */
#define xennet_sysfs_addif(dev) (0)
#define xennet_sysfs_delif(dev) do { } while (0)
#endif
1900d160211SJeremy Fitzhardinge 
1910d160211SJeremy Fitzhardinge static int xennet_can_sg(struct net_device *dev)
1920d160211SJeremy Fitzhardinge {
1930d160211SJeremy Fitzhardinge 	return dev->features & NETIF_F_SG;
1940d160211SJeremy Fitzhardinge }
1950d160211SJeremy Fitzhardinge 
1960d160211SJeremy Fitzhardinge 
1970d160211SJeremy Fitzhardinge static void rx_refill_timeout(unsigned long data)
1980d160211SJeremy Fitzhardinge {
1990d160211SJeremy Fitzhardinge 	struct net_device *dev = (struct net_device *)data;
200bea3348eSStephen Hemminger 	struct netfront_info *np = netdev_priv(dev);
201288379f0SBen Hutchings 	napi_schedule(&np->napi);
2020d160211SJeremy Fitzhardinge }
2030d160211SJeremy Fitzhardinge 
2040d160211SJeremy Fitzhardinge static int netfront_tx_slot_available(struct netfront_info *np)
2050d160211SJeremy Fitzhardinge {
206807540baSEric Dumazet 	return (np->tx.req_prod_pvt - np->tx.rsp_cons) <
207807540baSEric Dumazet 		(TX_MAX_TARGET - MAX_SKB_FRAGS - 2);
2080d160211SJeremy Fitzhardinge }
2090d160211SJeremy Fitzhardinge 
/*
 * Restart the transmit queue, but only if it is stopped, the tx ring has
 * room again and the interface is running.
 */
static void xennet_maybe_wake_tx(struct net_device *dev)
{
	struct netfront_info *np = netdev_priv(dev);

	/* Common case: the queue was never stopped. */
	if (likely(!netif_queue_stopped(dev)))
		return;

	if (!netfront_tx_slot_available(np))
		return;

	if (unlikely(!netif_running(dev)))
		return;

	netif_wake_queue(dev);
}
2190d160211SJeremy Fitzhardinge 
2200d160211SJeremy Fitzhardinge static void xennet_alloc_rx_buffers(struct net_device *dev)
2210d160211SJeremy Fitzhardinge {
2220d160211SJeremy Fitzhardinge 	unsigned short id;
2230d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
2240d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
2250d160211SJeremy Fitzhardinge 	struct page *page;
2260d160211SJeremy Fitzhardinge 	int i, batch_target, notify;
2270d160211SJeremy Fitzhardinge 	RING_IDX req_prod = np->rx.req_prod_pvt;
2280d160211SJeremy Fitzhardinge 	grant_ref_t ref;
2290d160211SJeremy Fitzhardinge 	unsigned long pfn;
2300d160211SJeremy Fitzhardinge 	void *vaddr;
2310d160211SJeremy Fitzhardinge 	struct xen_netif_rx_request *req;
2320d160211SJeremy Fitzhardinge 
2330d160211SJeremy Fitzhardinge 	if (unlikely(!netif_carrier_ok(dev)))
2340d160211SJeremy Fitzhardinge 		return;
2350d160211SJeremy Fitzhardinge 
2360d160211SJeremy Fitzhardinge 	/*
2370d160211SJeremy Fitzhardinge 	 * Allocate skbuffs greedily, even though we batch updates to the
2380d160211SJeremy Fitzhardinge 	 * receive ring. This creates a less bursty demand on the memory
2390d160211SJeremy Fitzhardinge 	 * allocator, so should reduce the chance of failed allocation requests
2400d160211SJeremy Fitzhardinge 	 * both for ourself and for other kernel subsystems.
2410d160211SJeremy Fitzhardinge 	 */
2420d160211SJeremy Fitzhardinge 	batch_target = np->rx_target - (req_prod - np->rx.rsp_cons);
2430d160211SJeremy Fitzhardinge 	for (i = skb_queue_len(&np->rx_batch); i < batch_target; i++) {
244617a20bbSIsaku Yamahata 		skb = __netdev_alloc_skb(dev, RX_COPY_THRESHOLD + NET_IP_ALIGN,
2450d160211SJeremy Fitzhardinge 					 GFP_ATOMIC | __GFP_NOWARN);
2460d160211SJeremy Fitzhardinge 		if (unlikely(!skb))
2470d160211SJeremy Fitzhardinge 			goto no_skb;
2480d160211SJeremy Fitzhardinge 
249617a20bbSIsaku Yamahata 		/* Align ip header to a 16 bytes boundary */
250617a20bbSIsaku Yamahata 		skb_reserve(skb, NET_IP_ALIGN);
251617a20bbSIsaku Yamahata 
2520d160211SJeremy Fitzhardinge 		page = alloc_page(GFP_ATOMIC | __GFP_NOWARN);
2530d160211SJeremy Fitzhardinge 		if (!page) {
2540d160211SJeremy Fitzhardinge 			kfree_skb(skb);
2550d160211SJeremy Fitzhardinge no_skb:
2560d160211SJeremy Fitzhardinge 			/* Any skbuffs queued for refill? Force them out. */
2570d160211SJeremy Fitzhardinge 			if (i != 0)
2580d160211SJeremy Fitzhardinge 				goto refill;
2590d160211SJeremy Fitzhardinge 			/* Could not allocate any skbuffs. Try again later. */
2600d160211SJeremy Fitzhardinge 			mod_timer(&np->rx_refill_timer,
2610d160211SJeremy Fitzhardinge 				  jiffies + (HZ/10));
2620d160211SJeremy Fitzhardinge 			break;
2630d160211SJeremy Fitzhardinge 		}
2640d160211SJeremy Fitzhardinge 
2650d160211SJeremy Fitzhardinge 		skb_shinfo(skb)->frags[0].page = page;
2660d160211SJeremy Fitzhardinge 		skb_shinfo(skb)->nr_frags = 1;
2670d160211SJeremy Fitzhardinge 		__skb_queue_tail(&np->rx_batch, skb);
2680d160211SJeremy Fitzhardinge 	}
2690d160211SJeremy Fitzhardinge 
2700d160211SJeremy Fitzhardinge 	/* Is the batch large enough to be worthwhile? */
2710d160211SJeremy Fitzhardinge 	if (i < (np->rx_target/2)) {
2720d160211SJeremy Fitzhardinge 		if (req_prod > np->rx.sring->req_prod)
2730d160211SJeremy Fitzhardinge 			goto push;
2740d160211SJeremy Fitzhardinge 		return;
2750d160211SJeremy Fitzhardinge 	}
2760d160211SJeremy Fitzhardinge 
2770d160211SJeremy Fitzhardinge 	/* Adjust our fill target if we risked running out of buffers. */
2780d160211SJeremy Fitzhardinge 	if (((req_prod - np->rx.sring->rsp_prod) < (np->rx_target / 4)) &&
2790d160211SJeremy Fitzhardinge 	    ((np->rx_target *= 2) > np->rx_max_target))
2800d160211SJeremy Fitzhardinge 		np->rx_target = np->rx_max_target;
2810d160211SJeremy Fitzhardinge 
2820d160211SJeremy Fitzhardinge  refill:
2835dcddfaeSJeremy Fitzhardinge 	for (i = 0; ; i++) {
2840d160211SJeremy Fitzhardinge 		skb = __skb_dequeue(&np->rx_batch);
2850d160211SJeremy Fitzhardinge 		if (skb == NULL)
2860d160211SJeremy Fitzhardinge 			break;
2870d160211SJeremy Fitzhardinge 
2880d160211SJeremy Fitzhardinge 		skb->dev = dev;
2890d160211SJeremy Fitzhardinge 
2900d160211SJeremy Fitzhardinge 		id = xennet_rxidx(req_prod + i);
2910d160211SJeremy Fitzhardinge 
2920d160211SJeremy Fitzhardinge 		BUG_ON(np->rx_skbs[id]);
2930d160211SJeremy Fitzhardinge 		np->rx_skbs[id] = skb;
2940d160211SJeremy Fitzhardinge 
2950d160211SJeremy Fitzhardinge 		ref = gnttab_claim_grant_reference(&np->gref_rx_head);
2960d160211SJeremy Fitzhardinge 		BUG_ON((signed short)ref < 0);
2970d160211SJeremy Fitzhardinge 		np->grant_rx_ref[id] = ref;
2980d160211SJeremy Fitzhardinge 
2990d160211SJeremy Fitzhardinge 		pfn = page_to_pfn(skb_shinfo(skb)->frags[0].page);
3000d160211SJeremy Fitzhardinge 		vaddr = page_address(skb_shinfo(skb)->frags[0].page);
3010d160211SJeremy Fitzhardinge 
3020d160211SJeremy Fitzhardinge 		req = RING_GET_REQUEST(&np->rx, req_prod + i);
3030d160211SJeremy Fitzhardinge 		gnttab_grant_foreign_access_ref(ref,
3040d160211SJeremy Fitzhardinge 						np->xbdev->otherend_id,
3050d160211SJeremy Fitzhardinge 						pfn_to_mfn(pfn),
3060d160211SJeremy Fitzhardinge 						0);
3070d160211SJeremy Fitzhardinge 
3080d160211SJeremy Fitzhardinge 		req->id = id;
3090d160211SJeremy Fitzhardinge 		req->gref = ref;
3100d160211SJeremy Fitzhardinge 	}
3110d160211SJeremy Fitzhardinge 
3120d160211SJeremy Fitzhardinge 	wmb();		/* barrier so backend seens requests */
3130d160211SJeremy Fitzhardinge 
3140d160211SJeremy Fitzhardinge 	/* Above is a suitable barrier to ensure backend will see requests. */
3150d160211SJeremy Fitzhardinge 	np->rx.req_prod_pvt = req_prod + i;
3160d160211SJeremy Fitzhardinge  push:
3170d160211SJeremy Fitzhardinge 	RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&np->rx, notify);
3180d160211SJeremy Fitzhardinge 	if (notify)
3190d160211SJeremy Fitzhardinge 		notify_remote_via_irq(np->netdev->irq);
3200d160211SJeremy Fitzhardinge }
3210d160211SJeremy Fitzhardinge 
3220d160211SJeremy Fitzhardinge static int xennet_open(struct net_device *dev)
3230d160211SJeremy Fitzhardinge {
3240d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
3250d160211SJeremy Fitzhardinge 
326bea3348eSStephen Hemminger 	napi_enable(&np->napi);
327bea3348eSStephen Hemminger 
3280d160211SJeremy Fitzhardinge 	spin_lock_bh(&np->rx_lock);
3290d160211SJeremy Fitzhardinge 	if (netif_carrier_ok(dev)) {
3300d160211SJeremy Fitzhardinge 		xennet_alloc_rx_buffers(dev);
3310d160211SJeremy Fitzhardinge 		np->rx.sring->rsp_event = np->rx.rsp_cons + 1;
3320d160211SJeremy Fitzhardinge 		if (RING_HAS_UNCONSUMED_RESPONSES(&np->rx))
333288379f0SBen Hutchings 			napi_schedule(&np->napi);
3340d160211SJeremy Fitzhardinge 	}
3350d160211SJeremy Fitzhardinge 	spin_unlock_bh(&np->rx_lock);
3360d160211SJeremy Fitzhardinge 
3370b1ab1b8SEduardo Habkost 	netif_start_queue(dev);
3380d160211SJeremy Fitzhardinge 
3390d160211SJeremy Fitzhardinge 	return 0;
3400d160211SJeremy Fitzhardinge }
3410d160211SJeremy Fitzhardinge 
3420d160211SJeremy Fitzhardinge static void xennet_tx_buf_gc(struct net_device *dev)
3430d160211SJeremy Fitzhardinge {
3440d160211SJeremy Fitzhardinge 	RING_IDX cons, prod;
3450d160211SJeremy Fitzhardinge 	unsigned short id;
3460d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
3470d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
3480d160211SJeremy Fitzhardinge 
3490d160211SJeremy Fitzhardinge 	BUG_ON(!netif_carrier_ok(dev));
3500d160211SJeremy Fitzhardinge 
3510d160211SJeremy Fitzhardinge 	do {
3520d160211SJeremy Fitzhardinge 		prod = np->tx.sring->rsp_prod;
3530d160211SJeremy Fitzhardinge 		rmb(); /* Ensure we see responses up to 'rp'. */
3540d160211SJeremy Fitzhardinge 
3550d160211SJeremy Fitzhardinge 		for (cons = np->tx.rsp_cons; cons != prod; cons++) {
3560d160211SJeremy Fitzhardinge 			struct xen_netif_tx_response *txrsp;
3570d160211SJeremy Fitzhardinge 
3580d160211SJeremy Fitzhardinge 			txrsp = RING_GET_RESPONSE(&np->tx, cons);
3590d160211SJeremy Fitzhardinge 			if (txrsp->status == NETIF_RSP_NULL)
3600d160211SJeremy Fitzhardinge 				continue;
3610d160211SJeremy Fitzhardinge 
3620d160211SJeremy Fitzhardinge 			id  = txrsp->id;
3630d160211SJeremy Fitzhardinge 			skb = np->tx_skbs[id].skb;
3640d160211SJeremy Fitzhardinge 			if (unlikely(gnttab_query_foreign_access(
3650d160211SJeremy Fitzhardinge 				np->grant_tx_ref[id]) != 0)) {
3660d160211SJeremy Fitzhardinge 				printk(KERN_ALERT "xennet_tx_buf_gc: warning "
3670d160211SJeremy Fitzhardinge 				       "-- grant still in use by backend "
3680d160211SJeremy Fitzhardinge 				       "domain.\n");
3690d160211SJeremy Fitzhardinge 				BUG();
3700d160211SJeremy Fitzhardinge 			}
3710d160211SJeremy Fitzhardinge 			gnttab_end_foreign_access_ref(
3720d160211SJeremy Fitzhardinge 				np->grant_tx_ref[id], GNTMAP_readonly);
3730d160211SJeremy Fitzhardinge 			gnttab_release_grant_reference(
3740d160211SJeremy Fitzhardinge 				&np->gref_tx_head, np->grant_tx_ref[id]);
3750d160211SJeremy Fitzhardinge 			np->grant_tx_ref[id] = GRANT_INVALID_REF;
3760d160211SJeremy Fitzhardinge 			add_id_to_freelist(&np->tx_skb_freelist, np->tx_skbs, id);
3770d160211SJeremy Fitzhardinge 			dev_kfree_skb_irq(skb);
3780d160211SJeremy Fitzhardinge 		}
3790d160211SJeremy Fitzhardinge 
3800d160211SJeremy Fitzhardinge 		np->tx.rsp_cons = prod;
3810d160211SJeremy Fitzhardinge 
3820d160211SJeremy Fitzhardinge 		/*
3830d160211SJeremy Fitzhardinge 		 * Set a new event, then check for race with update of tx_cons.
3840d160211SJeremy Fitzhardinge 		 * Note that it is essential to schedule a callback, no matter
3850d160211SJeremy Fitzhardinge 		 * how few buffers are pending. Even if there is space in the
3860d160211SJeremy Fitzhardinge 		 * transmit ring, higher layers may be blocked because too much
3870d160211SJeremy Fitzhardinge 		 * data is outstanding: in such cases notification from Xen is
3880d160211SJeremy Fitzhardinge 		 * likely to be the only kick that we'll get.
3890d160211SJeremy Fitzhardinge 		 */
3900d160211SJeremy Fitzhardinge 		np->tx.sring->rsp_event =
3910d160211SJeremy Fitzhardinge 			prod + ((np->tx.sring->req_prod - prod) >> 1) + 1;
3920d160211SJeremy Fitzhardinge 		mb();		/* update shared area */
3930d160211SJeremy Fitzhardinge 	} while ((cons == prod) && (prod != np->tx.sring->rsp_prod));
3940d160211SJeremy Fitzhardinge 
3950d160211SJeremy Fitzhardinge 	xennet_maybe_wake_tx(dev);
3960d160211SJeremy Fitzhardinge }
3970d160211SJeremy Fitzhardinge 
3980d160211SJeremy Fitzhardinge static void xennet_make_frags(struct sk_buff *skb, struct net_device *dev,
3990d160211SJeremy Fitzhardinge 			      struct xen_netif_tx_request *tx)
4000d160211SJeremy Fitzhardinge {
4010d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
4020d160211SJeremy Fitzhardinge 	char *data = skb->data;
4030d160211SJeremy Fitzhardinge 	unsigned long mfn;
4040d160211SJeremy Fitzhardinge 	RING_IDX prod = np->tx.req_prod_pvt;
4050d160211SJeremy Fitzhardinge 	int frags = skb_shinfo(skb)->nr_frags;
4060d160211SJeremy Fitzhardinge 	unsigned int offset = offset_in_page(data);
4070d160211SJeremy Fitzhardinge 	unsigned int len = skb_headlen(skb);
4080d160211SJeremy Fitzhardinge 	unsigned int id;
4090d160211SJeremy Fitzhardinge 	grant_ref_t ref;
4100d160211SJeremy Fitzhardinge 	int i;
4110d160211SJeremy Fitzhardinge 
4120d160211SJeremy Fitzhardinge 	/* While the header overlaps a page boundary (including being
4130d160211SJeremy Fitzhardinge 	   larger than a page), split it it into page-sized chunks. */
4140d160211SJeremy Fitzhardinge 	while (len > PAGE_SIZE - offset) {
4150d160211SJeremy Fitzhardinge 		tx->size = PAGE_SIZE - offset;
4160d160211SJeremy Fitzhardinge 		tx->flags |= NETTXF_more_data;
4170d160211SJeremy Fitzhardinge 		len -= tx->size;
4180d160211SJeremy Fitzhardinge 		data += tx->size;
4190d160211SJeremy Fitzhardinge 		offset = 0;
4200d160211SJeremy Fitzhardinge 
4210d160211SJeremy Fitzhardinge 		id = get_id_from_freelist(&np->tx_skb_freelist, np->tx_skbs);
4220d160211SJeremy Fitzhardinge 		np->tx_skbs[id].skb = skb_get(skb);
4230d160211SJeremy Fitzhardinge 		tx = RING_GET_REQUEST(&np->tx, prod++);
4240d160211SJeremy Fitzhardinge 		tx->id = id;
4250d160211SJeremy Fitzhardinge 		ref = gnttab_claim_grant_reference(&np->gref_tx_head);
4260d160211SJeremy Fitzhardinge 		BUG_ON((signed short)ref < 0);
4270d160211SJeremy Fitzhardinge 
4280d160211SJeremy Fitzhardinge 		mfn = virt_to_mfn(data);
4290d160211SJeremy Fitzhardinge 		gnttab_grant_foreign_access_ref(ref, np->xbdev->otherend_id,
4300d160211SJeremy Fitzhardinge 						mfn, GNTMAP_readonly);
4310d160211SJeremy Fitzhardinge 
4320d160211SJeremy Fitzhardinge 		tx->gref = np->grant_tx_ref[id] = ref;
4330d160211SJeremy Fitzhardinge 		tx->offset = offset;
4340d160211SJeremy Fitzhardinge 		tx->size = len;
4350d160211SJeremy Fitzhardinge 		tx->flags = 0;
4360d160211SJeremy Fitzhardinge 	}
4370d160211SJeremy Fitzhardinge 
4380d160211SJeremy Fitzhardinge 	/* Grant backend access to each skb fragment page. */
4390d160211SJeremy Fitzhardinge 	for (i = 0; i < frags; i++) {
4400d160211SJeremy Fitzhardinge 		skb_frag_t *frag = skb_shinfo(skb)->frags + i;
4410d160211SJeremy Fitzhardinge 
4420d160211SJeremy Fitzhardinge 		tx->flags |= NETTXF_more_data;
4430d160211SJeremy Fitzhardinge 
4440d160211SJeremy Fitzhardinge 		id = get_id_from_freelist(&np->tx_skb_freelist, np->tx_skbs);
4450d160211SJeremy Fitzhardinge 		np->tx_skbs[id].skb = skb_get(skb);
4460d160211SJeremy Fitzhardinge 		tx = RING_GET_REQUEST(&np->tx, prod++);
4470d160211SJeremy Fitzhardinge 		tx->id = id;
4480d160211SJeremy Fitzhardinge 		ref = gnttab_claim_grant_reference(&np->gref_tx_head);
4490d160211SJeremy Fitzhardinge 		BUG_ON((signed short)ref < 0);
4500d160211SJeremy Fitzhardinge 
4510d160211SJeremy Fitzhardinge 		mfn = pfn_to_mfn(page_to_pfn(frag->page));
4520d160211SJeremy Fitzhardinge 		gnttab_grant_foreign_access_ref(ref, np->xbdev->otherend_id,
4530d160211SJeremy Fitzhardinge 						mfn, GNTMAP_readonly);
4540d160211SJeremy Fitzhardinge 
4550d160211SJeremy Fitzhardinge 		tx->gref = np->grant_tx_ref[id] = ref;
4560d160211SJeremy Fitzhardinge 		tx->offset = frag->page_offset;
4570d160211SJeremy Fitzhardinge 		tx->size = frag->size;
4580d160211SJeremy Fitzhardinge 		tx->flags = 0;
4590d160211SJeremy Fitzhardinge 	}
4600d160211SJeremy Fitzhardinge 
4610d160211SJeremy Fitzhardinge 	np->tx.req_prod_pvt = prod;
4620d160211SJeremy Fitzhardinge }
4630d160211SJeremy Fitzhardinge 
4640d160211SJeremy Fitzhardinge static int xennet_start_xmit(struct sk_buff *skb, struct net_device *dev)
4650d160211SJeremy Fitzhardinge {
4660d160211SJeremy Fitzhardinge 	unsigned short id;
4670d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
4680d160211SJeremy Fitzhardinge 	struct xen_netif_tx_request *tx;
4690d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info *extra;
4700d160211SJeremy Fitzhardinge 	char *data = skb->data;
4710d160211SJeremy Fitzhardinge 	RING_IDX i;
4720d160211SJeremy Fitzhardinge 	grant_ref_t ref;
4730d160211SJeremy Fitzhardinge 	unsigned long mfn;
4740d160211SJeremy Fitzhardinge 	int notify;
4750d160211SJeremy Fitzhardinge 	int frags = skb_shinfo(skb)->nr_frags;
4760d160211SJeremy Fitzhardinge 	unsigned int offset = offset_in_page(data);
4770d160211SJeremy Fitzhardinge 	unsigned int len = skb_headlen(skb);
4780d160211SJeremy Fitzhardinge 
47943526370SJulia Lawall 	frags += DIV_ROUND_UP(offset + len, PAGE_SIZE);
4800d160211SJeremy Fitzhardinge 	if (unlikely(frags > MAX_SKB_FRAGS + 1)) {
4810d160211SJeremy Fitzhardinge 		printk(KERN_ALERT "xennet: skb rides the rocket: %d frags\n",
4820d160211SJeremy Fitzhardinge 		       frags);
4830d160211SJeremy Fitzhardinge 		dump_stack();
4840d160211SJeremy Fitzhardinge 		goto drop;
4850d160211SJeremy Fitzhardinge 	}
4860d160211SJeremy Fitzhardinge 
4870d160211SJeremy Fitzhardinge 	spin_lock_irq(&np->tx_lock);
4880d160211SJeremy Fitzhardinge 
4890d160211SJeremy Fitzhardinge 	if (unlikely(!netif_carrier_ok(dev) ||
4900d160211SJeremy Fitzhardinge 		     (frags > 1 && !xennet_can_sg(dev)) ||
491fc741216SJesse Gross 		     netif_needs_gso(skb, netif_skb_features(skb)))) {
4920d160211SJeremy Fitzhardinge 		spin_unlock_irq(&np->tx_lock);
4930d160211SJeremy Fitzhardinge 		goto drop;
4940d160211SJeremy Fitzhardinge 	}
4950d160211SJeremy Fitzhardinge 
4960d160211SJeremy Fitzhardinge 	i = np->tx.req_prod_pvt;
4970d160211SJeremy Fitzhardinge 
4980d160211SJeremy Fitzhardinge 	id = get_id_from_freelist(&np->tx_skb_freelist, np->tx_skbs);
4990d160211SJeremy Fitzhardinge 	np->tx_skbs[id].skb = skb;
5000d160211SJeremy Fitzhardinge 
5010d160211SJeremy Fitzhardinge 	tx = RING_GET_REQUEST(&np->tx, i);
5020d160211SJeremy Fitzhardinge 
5030d160211SJeremy Fitzhardinge 	tx->id   = id;
5040d160211SJeremy Fitzhardinge 	ref = gnttab_claim_grant_reference(&np->gref_tx_head);
5050d160211SJeremy Fitzhardinge 	BUG_ON((signed short)ref < 0);
5060d160211SJeremy Fitzhardinge 	mfn = virt_to_mfn(data);
5070d160211SJeremy Fitzhardinge 	gnttab_grant_foreign_access_ref(
5080d160211SJeremy Fitzhardinge 		ref, np->xbdev->otherend_id, mfn, GNTMAP_readonly);
5090d160211SJeremy Fitzhardinge 	tx->gref = np->grant_tx_ref[id] = ref;
5100d160211SJeremy Fitzhardinge 	tx->offset = offset;
5110d160211SJeremy Fitzhardinge 	tx->size = len;
5120d160211SJeremy Fitzhardinge 	extra = NULL;
5130d160211SJeremy Fitzhardinge 
5140d160211SJeremy Fitzhardinge 	tx->flags = 0;
5150d160211SJeremy Fitzhardinge 	if (skb->ip_summed == CHECKSUM_PARTIAL)
5160d160211SJeremy Fitzhardinge 		/* local packet? */
5170d160211SJeremy Fitzhardinge 		tx->flags |= NETTXF_csum_blank | NETTXF_data_validated;
5180d160211SJeremy Fitzhardinge 	else if (skb->ip_summed == CHECKSUM_UNNECESSARY)
5190d160211SJeremy Fitzhardinge 		/* remote but checksummed. */
5200d160211SJeremy Fitzhardinge 		tx->flags |= NETTXF_data_validated;
5210d160211SJeremy Fitzhardinge 
5220d160211SJeremy Fitzhardinge 	if (skb_shinfo(skb)->gso_size) {
5230d160211SJeremy Fitzhardinge 		struct xen_netif_extra_info *gso;
5240d160211SJeremy Fitzhardinge 
5250d160211SJeremy Fitzhardinge 		gso = (struct xen_netif_extra_info *)
5260d160211SJeremy Fitzhardinge 			RING_GET_REQUEST(&np->tx, ++i);
5270d160211SJeremy Fitzhardinge 
5280d160211SJeremy Fitzhardinge 		if (extra)
5290d160211SJeremy Fitzhardinge 			extra->flags |= XEN_NETIF_EXTRA_FLAG_MORE;
5300d160211SJeremy Fitzhardinge 		else
5310d160211SJeremy Fitzhardinge 			tx->flags |= NETTXF_extra_info;
5320d160211SJeremy Fitzhardinge 
5330d160211SJeremy Fitzhardinge 		gso->u.gso.size = skb_shinfo(skb)->gso_size;
5340d160211SJeremy Fitzhardinge 		gso->u.gso.type = XEN_NETIF_GSO_TYPE_TCPV4;
5350d160211SJeremy Fitzhardinge 		gso->u.gso.pad = 0;
5360d160211SJeremy Fitzhardinge 		gso->u.gso.features = 0;
5370d160211SJeremy Fitzhardinge 
5380d160211SJeremy Fitzhardinge 		gso->type = XEN_NETIF_EXTRA_TYPE_GSO;
5390d160211SJeremy Fitzhardinge 		gso->flags = 0;
5400d160211SJeremy Fitzhardinge 		extra = gso;
5410d160211SJeremy Fitzhardinge 	}
5420d160211SJeremy Fitzhardinge 
5430d160211SJeremy Fitzhardinge 	np->tx.req_prod_pvt = i + 1;
5440d160211SJeremy Fitzhardinge 
5450d160211SJeremy Fitzhardinge 	xennet_make_frags(skb, dev, tx);
5460d160211SJeremy Fitzhardinge 	tx->size = skb->len;
5470d160211SJeremy Fitzhardinge 
5480d160211SJeremy Fitzhardinge 	RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&np->tx, notify);
5490d160211SJeremy Fitzhardinge 	if (notify)
5500d160211SJeremy Fitzhardinge 		notify_remote_via_irq(np->netdev->irq);
5510d160211SJeremy Fitzhardinge 
55209f75cd7SJeff Garzik 	dev->stats.tx_bytes += skb->len;
55309f75cd7SJeff Garzik 	dev->stats.tx_packets++;
55410a273a6SJeremy Fitzhardinge 
55510a273a6SJeremy Fitzhardinge 	/* Note: It is not safe to access skb after xennet_tx_buf_gc()! */
5560d160211SJeremy Fitzhardinge 	xennet_tx_buf_gc(dev);
5570d160211SJeremy Fitzhardinge 
5580d160211SJeremy Fitzhardinge 	if (!netfront_tx_slot_available(np))
5590d160211SJeremy Fitzhardinge 		netif_stop_queue(dev);
5600d160211SJeremy Fitzhardinge 
5610d160211SJeremy Fitzhardinge 	spin_unlock_irq(&np->tx_lock);
5620d160211SJeremy Fitzhardinge 
5636ed10654SPatrick McHardy 	return NETDEV_TX_OK;
5640d160211SJeremy Fitzhardinge 
5650d160211SJeremy Fitzhardinge  drop:
56609f75cd7SJeff Garzik 	dev->stats.tx_dropped++;
5670d160211SJeremy Fitzhardinge 	dev_kfree_skb(skb);
5686ed10654SPatrick McHardy 	return NETDEV_TX_OK;
5690d160211SJeremy Fitzhardinge }
5700d160211SJeremy Fitzhardinge 
5710d160211SJeremy Fitzhardinge static int xennet_close(struct net_device *dev)
5720d160211SJeremy Fitzhardinge {
5730d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
5740d160211SJeremy Fitzhardinge 	netif_stop_queue(np->netdev);
575bea3348eSStephen Hemminger 	napi_disable(&np->napi);
5760d160211SJeremy Fitzhardinge 	return 0;
5770d160211SJeremy Fitzhardinge }
5780d160211SJeremy Fitzhardinge 
5790d160211SJeremy Fitzhardinge static void xennet_move_rx_slot(struct netfront_info *np, struct sk_buff *skb,
5800d160211SJeremy Fitzhardinge 				grant_ref_t ref)
5810d160211SJeremy Fitzhardinge {
5820d160211SJeremy Fitzhardinge 	int new = xennet_rxidx(np->rx.req_prod_pvt);
5830d160211SJeremy Fitzhardinge 
5840d160211SJeremy Fitzhardinge 	BUG_ON(np->rx_skbs[new]);
5850d160211SJeremy Fitzhardinge 	np->rx_skbs[new] = skb;
5860d160211SJeremy Fitzhardinge 	np->grant_rx_ref[new] = ref;
5870d160211SJeremy Fitzhardinge 	RING_GET_REQUEST(&np->rx, np->rx.req_prod_pvt)->id = new;
5880d160211SJeremy Fitzhardinge 	RING_GET_REQUEST(&np->rx, np->rx.req_prod_pvt)->gref = ref;
5890d160211SJeremy Fitzhardinge 	np->rx.req_prod_pvt++;
5900d160211SJeremy Fitzhardinge }
5910d160211SJeremy Fitzhardinge 
5920d160211SJeremy Fitzhardinge static int xennet_get_extras(struct netfront_info *np,
5930d160211SJeremy Fitzhardinge 			     struct xen_netif_extra_info *extras,
5940d160211SJeremy Fitzhardinge 			     RING_IDX rp)
5950d160211SJeremy Fitzhardinge 
5960d160211SJeremy Fitzhardinge {
5970d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info *extra;
5980d160211SJeremy Fitzhardinge 	struct device *dev = &np->netdev->dev;
5990d160211SJeremy Fitzhardinge 	RING_IDX cons = np->rx.rsp_cons;
6000d160211SJeremy Fitzhardinge 	int err = 0;
6010d160211SJeremy Fitzhardinge 
6020d160211SJeremy Fitzhardinge 	do {
6030d160211SJeremy Fitzhardinge 		struct sk_buff *skb;
6040d160211SJeremy Fitzhardinge 		grant_ref_t ref;
6050d160211SJeremy Fitzhardinge 
6060d160211SJeremy Fitzhardinge 		if (unlikely(cons + 1 == rp)) {
6070d160211SJeremy Fitzhardinge 			if (net_ratelimit())
6080d160211SJeremy Fitzhardinge 				dev_warn(dev, "Missing extra info\n");
6090d160211SJeremy Fitzhardinge 			err = -EBADR;
6100d160211SJeremy Fitzhardinge 			break;
6110d160211SJeremy Fitzhardinge 		}
6120d160211SJeremy Fitzhardinge 
6130d160211SJeremy Fitzhardinge 		extra = (struct xen_netif_extra_info *)
6140d160211SJeremy Fitzhardinge 			RING_GET_RESPONSE(&np->rx, ++cons);
6150d160211SJeremy Fitzhardinge 
6160d160211SJeremy Fitzhardinge 		if (unlikely(!extra->type ||
6170d160211SJeremy Fitzhardinge 			     extra->type >= XEN_NETIF_EXTRA_TYPE_MAX)) {
6180d160211SJeremy Fitzhardinge 			if (net_ratelimit())
6190d160211SJeremy Fitzhardinge 				dev_warn(dev, "Invalid extra type: %d\n",
6200d160211SJeremy Fitzhardinge 					extra->type);
6210d160211SJeremy Fitzhardinge 			err = -EINVAL;
6220d160211SJeremy Fitzhardinge 		} else {
6230d160211SJeremy Fitzhardinge 			memcpy(&extras[extra->type - 1], extra,
6240d160211SJeremy Fitzhardinge 			       sizeof(*extra));
6250d160211SJeremy Fitzhardinge 		}
6260d160211SJeremy Fitzhardinge 
6270d160211SJeremy Fitzhardinge 		skb = xennet_get_rx_skb(np, cons);
6280d160211SJeremy Fitzhardinge 		ref = xennet_get_rx_ref(np, cons);
6290d160211SJeremy Fitzhardinge 		xennet_move_rx_slot(np, skb, ref);
6300d160211SJeremy Fitzhardinge 	} while (extra->flags & XEN_NETIF_EXTRA_FLAG_MORE);
6310d160211SJeremy Fitzhardinge 
6320d160211SJeremy Fitzhardinge 	np->rx.rsp_cons = cons;
6330d160211SJeremy Fitzhardinge 	return err;
6340d160211SJeremy Fitzhardinge }
6350d160211SJeremy Fitzhardinge 
6360d160211SJeremy Fitzhardinge static int xennet_get_responses(struct netfront_info *np,
6370d160211SJeremy Fitzhardinge 				struct netfront_rx_info *rinfo, RING_IDX rp,
6380d160211SJeremy Fitzhardinge 				struct sk_buff_head *list)
6390d160211SJeremy Fitzhardinge {
6400d160211SJeremy Fitzhardinge 	struct xen_netif_rx_response *rx = &rinfo->rx;
6410d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info *extras = rinfo->extras;
6420d160211SJeremy Fitzhardinge 	struct device *dev = &np->netdev->dev;
6430d160211SJeremy Fitzhardinge 	RING_IDX cons = np->rx.rsp_cons;
6440d160211SJeremy Fitzhardinge 	struct sk_buff *skb = xennet_get_rx_skb(np, cons);
6450d160211SJeremy Fitzhardinge 	grant_ref_t ref = xennet_get_rx_ref(np, cons);
6460d160211SJeremy Fitzhardinge 	int max = MAX_SKB_FRAGS + (rx->status <= RX_COPY_THRESHOLD);
6470d160211SJeremy Fitzhardinge 	int frags = 1;
6480d160211SJeremy Fitzhardinge 	int err = 0;
6490d160211SJeremy Fitzhardinge 	unsigned long ret;
6500d160211SJeremy Fitzhardinge 
6510d160211SJeremy Fitzhardinge 	if (rx->flags & NETRXF_extra_info) {
6520d160211SJeremy Fitzhardinge 		err = xennet_get_extras(np, extras, rp);
6530d160211SJeremy Fitzhardinge 		cons = np->rx.rsp_cons;
6540d160211SJeremy Fitzhardinge 	}
6550d160211SJeremy Fitzhardinge 
6560d160211SJeremy Fitzhardinge 	for (;;) {
6570d160211SJeremy Fitzhardinge 		if (unlikely(rx->status < 0 ||
6580d160211SJeremy Fitzhardinge 			     rx->offset + rx->status > PAGE_SIZE)) {
6590d160211SJeremy Fitzhardinge 			if (net_ratelimit())
6600d160211SJeremy Fitzhardinge 				dev_warn(dev, "rx->offset: %x, size: %u\n",
6610d160211SJeremy Fitzhardinge 					 rx->offset, rx->status);
6620d160211SJeremy Fitzhardinge 			xennet_move_rx_slot(np, skb, ref);
6630d160211SJeremy Fitzhardinge 			err = -EINVAL;
6640d160211SJeremy Fitzhardinge 			goto next;
6650d160211SJeremy Fitzhardinge 		}
6660d160211SJeremy Fitzhardinge 
6670d160211SJeremy Fitzhardinge 		/*
6680d160211SJeremy Fitzhardinge 		 * This definitely indicates a bug, either in this driver or in
6690d160211SJeremy Fitzhardinge 		 * the backend driver. In future this should flag the bad
6700d160211SJeremy Fitzhardinge 		 * situation to the system controller to reboot the backed.
6710d160211SJeremy Fitzhardinge 		 */
6720d160211SJeremy Fitzhardinge 		if (ref == GRANT_INVALID_REF) {
6730d160211SJeremy Fitzhardinge 			if (net_ratelimit())
6740d160211SJeremy Fitzhardinge 				dev_warn(dev, "Bad rx response id %d.\n",
6750d160211SJeremy Fitzhardinge 					 rx->id);
6760d160211SJeremy Fitzhardinge 			err = -EINVAL;
6770d160211SJeremy Fitzhardinge 			goto next;
6780d160211SJeremy Fitzhardinge 		}
6790d160211SJeremy Fitzhardinge 
6800d160211SJeremy Fitzhardinge 		ret = gnttab_end_foreign_access_ref(ref, 0);
6810d160211SJeremy Fitzhardinge 		BUG_ON(!ret);
6820d160211SJeremy Fitzhardinge 
6830d160211SJeremy Fitzhardinge 		gnttab_release_grant_reference(&np->gref_rx_head, ref);
6840d160211SJeremy Fitzhardinge 
6850d160211SJeremy Fitzhardinge 		__skb_queue_tail(list, skb);
6860d160211SJeremy Fitzhardinge 
6870d160211SJeremy Fitzhardinge next:
6880d160211SJeremy Fitzhardinge 		if (!(rx->flags & NETRXF_more_data))
6890d160211SJeremy Fitzhardinge 			break;
6900d160211SJeremy Fitzhardinge 
6910d160211SJeremy Fitzhardinge 		if (cons + frags == rp) {
6920d160211SJeremy Fitzhardinge 			if (net_ratelimit())
6930d160211SJeremy Fitzhardinge 				dev_warn(dev, "Need more frags\n");
6940d160211SJeremy Fitzhardinge 			err = -ENOENT;
6950d160211SJeremy Fitzhardinge 			break;
6960d160211SJeremy Fitzhardinge 		}
6970d160211SJeremy Fitzhardinge 
6980d160211SJeremy Fitzhardinge 		rx = RING_GET_RESPONSE(&np->rx, cons + frags);
6990d160211SJeremy Fitzhardinge 		skb = xennet_get_rx_skb(np, cons + frags);
7000d160211SJeremy Fitzhardinge 		ref = xennet_get_rx_ref(np, cons + frags);
7010d160211SJeremy Fitzhardinge 		frags++;
7020d160211SJeremy Fitzhardinge 	}
7030d160211SJeremy Fitzhardinge 
7040d160211SJeremy Fitzhardinge 	if (unlikely(frags > max)) {
7050d160211SJeremy Fitzhardinge 		if (net_ratelimit())
7060d160211SJeremy Fitzhardinge 			dev_warn(dev, "Too many frags\n");
7070d160211SJeremy Fitzhardinge 		err = -E2BIG;
7080d160211SJeremy Fitzhardinge 	}
7090d160211SJeremy Fitzhardinge 
7100d160211SJeremy Fitzhardinge 	if (unlikely(err))
7110d160211SJeremy Fitzhardinge 		np->rx.rsp_cons = cons + frags;
7120d160211SJeremy Fitzhardinge 
7130d160211SJeremy Fitzhardinge 	return err;
7140d160211SJeremy Fitzhardinge }
7150d160211SJeremy Fitzhardinge 
7160d160211SJeremy Fitzhardinge static int xennet_set_skb_gso(struct sk_buff *skb,
7170d160211SJeremy Fitzhardinge 			      struct xen_netif_extra_info *gso)
7180d160211SJeremy Fitzhardinge {
7190d160211SJeremy Fitzhardinge 	if (!gso->u.gso.size) {
7200d160211SJeremy Fitzhardinge 		if (net_ratelimit())
7210d160211SJeremy Fitzhardinge 			printk(KERN_WARNING "GSO size must not be zero.\n");
7220d160211SJeremy Fitzhardinge 		return -EINVAL;
7230d160211SJeremy Fitzhardinge 	}
7240d160211SJeremy Fitzhardinge 
7250d160211SJeremy Fitzhardinge 	/* Currently only TCPv4 S.O. is supported. */
7260d160211SJeremy Fitzhardinge 	if (gso->u.gso.type != XEN_NETIF_GSO_TYPE_TCPV4) {
7270d160211SJeremy Fitzhardinge 		if (net_ratelimit())
7280d160211SJeremy Fitzhardinge 			printk(KERN_WARNING "Bad GSO type %d.\n", gso->u.gso.type);
7290d160211SJeremy Fitzhardinge 		return -EINVAL;
7300d160211SJeremy Fitzhardinge 	}
7310d160211SJeremy Fitzhardinge 
7320d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_size = gso->u.gso.size;
7330d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
7340d160211SJeremy Fitzhardinge 
7350d160211SJeremy Fitzhardinge 	/* Header must be checked, and gso_segs computed. */
7360d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
7370d160211SJeremy Fitzhardinge 	skb_shinfo(skb)->gso_segs = 0;
7380d160211SJeremy Fitzhardinge 
7390d160211SJeremy Fitzhardinge 	return 0;
7400d160211SJeremy Fitzhardinge }
7410d160211SJeremy Fitzhardinge 
7420d160211SJeremy Fitzhardinge static RING_IDX xennet_fill_frags(struct netfront_info *np,
7430d160211SJeremy Fitzhardinge 				  struct sk_buff *skb,
7440d160211SJeremy Fitzhardinge 				  struct sk_buff_head *list)
7450d160211SJeremy Fitzhardinge {
7460d160211SJeremy Fitzhardinge 	struct skb_shared_info *shinfo = skb_shinfo(skb);
7470d160211SJeremy Fitzhardinge 	int nr_frags = shinfo->nr_frags;
7480d160211SJeremy Fitzhardinge 	RING_IDX cons = np->rx.rsp_cons;
7490d160211SJeremy Fitzhardinge 	skb_frag_t *frag = shinfo->frags + nr_frags;
7500d160211SJeremy Fitzhardinge 	struct sk_buff *nskb;
7510d160211SJeremy Fitzhardinge 
7520d160211SJeremy Fitzhardinge 	while ((nskb = __skb_dequeue(list))) {
7530d160211SJeremy Fitzhardinge 		struct xen_netif_rx_response *rx =
7540d160211SJeremy Fitzhardinge 			RING_GET_RESPONSE(&np->rx, ++cons);
7550d160211SJeremy Fitzhardinge 
7560d160211SJeremy Fitzhardinge 		frag->page = skb_shinfo(nskb)->frags[0].page;
7570d160211SJeremy Fitzhardinge 		frag->page_offset = rx->offset;
7580d160211SJeremy Fitzhardinge 		frag->size = rx->status;
7590d160211SJeremy Fitzhardinge 
7600d160211SJeremy Fitzhardinge 		skb->data_len += rx->status;
7610d160211SJeremy Fitzhardinge 
7620d160211SJeremy Fitzhardinge 		skb_shinfo(nskb)->nr_frags = 0;
7630d160211SJeremy Fitzhardinge 		kfree_skb(nskb);
7640d160211SJeremy Fitzhardinge 
7650d160211SJeremy Fitzhardinge 		frag++;
7660d160211SJeremy Fitzhardinge 		nr_frags++;
7670d160211SJeremy Fitzhardinge 	}
7680d160211SJeremy Fitzhardinge 
7690d160211SJeremy Fitzhardinge 	shinfo->nr_frags = nr_frags;
7700d160211SJeremy Fitzhardinge 	return cons;
7710d160211SJeremy Fitzhardinge }
7720d160211SJeremy Fitzhardinge 
7730d160211SJeremy Fitzhardinge static int skb_checksum_setup(struct sk_buff *skb)
7740d160211SJeremy Fitzhardinge {
7750d160211SJeremy Fitzhardinge 	struct iphdr *iph;
7760d160211SJeremy Fitzhardinge 	unsigned char *th;
7770d160211SJeremy Fitzhardinge 	int err = -EPROTO;
7780d160211SJeremy Fitzhardinge 
7790d160211SJeremy Fitzhardinge 	if (skb->protocol != htons(ETH_P_IP))
7800d160211SJeremy Fitzhardinge 		goto out;
7810d160211SJeremy Fitzhardinge 
7820d160211SJeremy Fitzhardinge 	iph = (void *)skb->data;
7830d160211SJeremy Fitzhardinge 	th = skb->data + 4 * iph->ihl;
7840d160211SJeremy Fitzhardinge 	if (th >= skb_tail_pointer(skb))
7850d160211SJeremy Fitzhardinge 		goto out;
7860d160211SJeremy Fitzhardinge 
7870d160211SJeremy Fitzhardinge 	skb->csum_start = th - skb->head;
7880d160211SJeremy Fitzhardinge 	switch (iph->protocol) {
7890d160211SJeremy Fitzhardinge 	case IPPROTO_TCP:
7900d160211SJeremy Fitzhardinge 		skb->csum_offset = offsetof(struct tcphdr, check);
7910d160211SJeremy Fitzhardinge 		break;
7920d160211SJeremy Fitzhardinge 	case IPPROTO_UDP:
7930d160211SJeremy Fitzhardinge 		skb->csum_offset = offsetof(struct udphdr, check);
7940d160211SJeremy Fitzhardinge 		break;
7950d160211SJeremy Fitzhardinge 	default:
7960d160211SJeremy Fitzhardinge 		if (net_ratelimit())
7970d160211SJeremy Fitzhardinge 			printk(KERN_ERR "Attempting to checksum a non-"
7980d160211SJeremy Fitzhardinge 			       "TCP/UDP packet, dropping a protocol"
7990d160211SJeremy Fitzhardinge 			       " %d packet", iph->protocol);
8000d160211SJeremy Fitzhardinge 		goto out;
8010d160211SJeremy Fitzhardinge 	}
8020d160211SJeremy Fitzhardinge 
8030d160211SJeremy Fitzhardinge 	if ((th + skb->csum_offset + 2) > skb_tail_pointer(skb))
8040d160211SJeremy Fitzhardinge 		goto out;
8050d160211SJeremy Fitzhardinge 
8060d160211SJeremy Fitzhardinge 	err = 0;
8070d160211SJeremy Fitzhardinge 
8080d160211SJeremy Fitzhardinge out:
8090d160211SJeremy Fitzhardinge 	return err;
8100d160211SJeremy Fitzhardinge }
8110d160211SJeremy Fitzhardinge 
8120d160211SJeremy Fitzhardinge static int handle_incoming_queue(struct net_device *dev,
8130d160211SJeremy Fitzhardinge 				 struct sk_buff_head *rxq)
8140d160211SJeremy Fitzhardinge {
8150d160211SJeremy Fitzhardinge 	int packets_dropped = 0;
8160d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
8170d160211SJeremy Fitzhardinge 
8180d160211SJeremy Fitzhardinge 	while ((skb = __skb_dequeue(rxq)) != NULL) {
8190d160211SJeremy Fitzhardinge 		struct page *page = NETFRONT_SKB_CB(skb)->page;
8200d160211SJeremy Fitzhardinge 		void *vaddr = page_address(page);
8210d160211SJeremy Fitzhardinge 		unsigned offset = NETFRONT_SKB_CB(skb)->offset;
8220d160211SJeremy Fitzhardinge 
8230d160211SJeremy Fitzhardinge 		memcpy(skb->data, vaddr + offset,
8240d160211SJeremy Fitzhardinge 		       skb_headlen(skb));
8250d160211SJeremy Fitzhardinge 
8260d160211SJeremy Fitzhardinge 		if (page != skb_shinfo(skb)->frags[0].page)
8270d160211SJeremy Fitzhardinge 			__free_page(page);
8280d160211SJeremy Fitzhardinge 
8290d160211SJeremy Fitzhardinge 		/* Ethernet work: Delayed to here as it peeks the header. */
8300d160211SJeremy Fitzhardinge 		skb->protocol = eth_type_trans(skb, dev);
8310d160211SJeremy Fitzhardinge 
8320d160211SJeremy Fitzhardinge 		if (skb->ip_summed == CHECKSUM_PARTIAL) {
8330d160211SJeremy Fitzhardinge 			if (skb_checksum_setup(skb)) {
8340d160211SJeremy Fitzhardinge 				kfree_skb(skb);
8350d160211SJeremy Fitzhardinge 				packets_dropped++;
83609f75cd7SJeff Garzik 				dev->stats.rx_errors++;
8370d160211SJeremy Fitzhardinge 				continue;
8380d160211SJeremy Fitzhardinge 			}
8390d160211SJeremy Fitzhardinge 		}
8400d160211SJeremy Fitzhardinge 
84109f75cd7SJeff Garzik 		dev->stats.rx_packets++;
84209f75cd7SJeff Garzik 		dev->stats.rx_bytes += skb->len;
8430d160211SJeremy Fitzhardinge 
8440d160211SJeremy Fitzhardinge 		/* Pass it up. */
8450d160211SJeremy Fitzhardinge 		netif_receive_skb(skb);
8460d160211SJeremy Fitzhardinge 	}
8470d160211SJeremy Fitzhardinge 
8480d160211SJeremy Fitzhardinge 	return packets_dropped;
8490d160211SJeremy Fitzhardinge }
8500d160211SJeremy Fitzhardinge 
/*
 * xennet_poll - NAPI poll handler for the receive ring.
 *
 * Runs under np->rx_lock. Walks the rx responses from np->rx.rsp_cons up
 * to a snapshot of the shared response producer, handling at most
 * @budget packets:
 *   - xennet_get_responses() collects the skbs of one packet on tmpq;
 *     on failure those skbs are moved to errq (purged later) and
 *     rx_errors is bumped;
 *   - an optional GSO extra is applied with xennet_set_skb_gso();
 *   - up to RX_COPY_THRESHOLD bytes are reserved in the linear area
 *     (the copy itself happens in handle_incoming_queue()), the
 *     remainder stays in page fragments added by xennet_fill_frags();
 *   - the finished skb is queued on rxq.
 * Afterwards rxq is delivered via handle_incoming_queue(), the rx fill
 * target is possibly lowered, xennet_alloc_rx_buffers() is called, and
 * NAPI is completed if the budget was not exhausted and no further
 * responses are pending.
 *
 * Returns the number of packets processed minus the number dropped by
 * handle_incoming_queue().
 */
851bea3348eSStephen Hemminger static int xennet_poll(struct napi_struct *napi, int budget)
8520d160211SJeremy Fitzhardinge {
853bea3348eSStephen Hemminger 	struct netfront_info *np = container_of(napi, struct netfront_info, napi);
854bea3348eSStephen Hemminger 	struct net_device *dev = np->netdev;
8550d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
8560d160211SJeremy Fitzhardinge 	struct netfront_rx_info rinfo;
8570d160211SJeremy Fitzhardinge 	struct xen_netif_rx_response *rx = &rinfo.rx;
8580d160211SJeremy Fitzhardinge 	struct xen_netif_extra_info *extras = rinfo.extras;
8590d160211SJeremy Fitzhardinge 	RING_IDX i, rp;
860bea3348eSStephen Hemminger 	int work_done;
8610d160211SJeremy Fitzhardinge 	struct sk_buff_head rxq;
8620d160211SJeremy Fitzhardinge 	struct sk_buff_head errq;
8630d160211SJeremy Fitzhardinge 	struct sk_buff_head tmpq;
8640d160211SJeremy Fitzhardinge 	unsigned long flags;
8650d160211SJeremy Fitzhardinge 	unsigned int len;
8660d160211SJeremy Fitzhardinge 	int err;
8670d160211SJeremy Fitzhardinge 
8680d160211SJeremy Fitzhardinge 	spin_lock(&np->rx_lock);
8690d160211SJeremy Fitzhardinge 
	/* rxq: packets to deliver; errq: skbs to discard; tmpq: one packet. */
8700d160211SJeremy Fitzhardinge 	skb_queue_head_init(&rxq);
8710d160211SJeremy Fitzhardinge 	skb_queue_head_init(&errq);
8720d160211SJeremy Fitzhardinge 	skb_queue_head_init(&tmpq);
8730d160211SJeremy Fitzhardinge 
8740d160211SJeremy Fitzhardinge 	rp = np->rx.sring->rsp_prod;
8750d160211SJeremy Fitzhardinge 	rmb(); /* Ensure we see queued responses up to 'rp'. */
8760d160211SJeremy Fitzhardinge 
8770d160211SJeremy Fitzhardinge 	i = np->rx.rsp_cons;
8780d160211SJeremy Fitzhardinge 	work_done = 0;
8790d160211SJeremy Fitzhardinge 	while ((i != rp) && (work_done < budget)) {
		/* Work on a private copy of the first response of the packet. */
8800d160211SJeremy Fitzhardinge 		memcpy(rx, RING_GET_RESPONSE(&np->rx, i), sizeof(*rx));
8810d160211SJeremy Fitzhardinge 		memset(extras, 0, sizeof(rinfo.extras));
8820d160211SJeremy Fitzhardinge 
8830d160211SJeremy Fitzhardinge 		err = xennet_get_responses(np, &rinfo, rp, &tmpq);
8840d160211SJeremy Fitzhardinge 
8850d160211SJeremy Fitzhardinge 		if (unlikely(err)) {
			/*
			 * Also entered via "goto err" from the GSO check
			 * below. Discard whatever was gathered and resume at
			 * the consumer index the failing path left behind.
			 * Errors do not count towards work_done.
			 */
8860d160211SJeremy Fitzhardinge err:
8870d160211SJeremy Fitzhardinge 			while ((skb = __skb_dequeue(&tmpq)))
8880d160211SJeremy Fitzhardinge 				__skb_queue_tail(&errq, skb);
88909f75cd7SJeff Garzik 			dev->stats.rx_errors++;
8900d160211SJeremy Fitzhardinge 			i = np->rx.rsp_cons;
8910d160211SJeremy Fitzhardinge 			continue;
8920d160211SJeremy Fitzhardinge 		}
8930d160211SJeremy Fitzhardinge 
		/* First skb of the packet becomes the head; rest are frags. */
8940d160211SJeremy Fitzhardinge 		skb = __skb_dequeue(&tmpq);
8950d160211SJeremy Fitzhardinge 
8960d160211SJeremy Fitzhardinge 		if (extras[XEN_NETIF_EXTRA_TYPE_GSO - 1].type) {
8970d160211SJeremy Fitzhardinge 			struct xen_netif_extra_info *gso;
8980d160211SJeremy Fitzhardinge 			gso = &extras[XEN_NETIF_EXTRA_TYPE_GSO - 1];
8990d160211SJeremy Fitzhardinge 
9000d160211SJeremy Fitzhardinge 			if (unlikely(xennet_set_skb_gso(skb, gso))) {
				/*
				 * Put the head back so the whole packet is
				 * discarded, and skip one response per skb.
				 */
9010d160211SJeremy Fitzhardinge 				__skb_queue_head(&tmpq, skb);
9020d160211SJeremy Fitzhardinge 				np->rx.rsp_cons += skb_queue_len(&tmpq);
9030d160211SJeremy Fitzhardinge 				goto err;
9040d160211SJeremy Fitzhardinge 			}
9050d160211SJeremy Fitzhardinge 		}
9060d160211SJeremy Fitzhardinge 
		/* Remember where the header lives; copied in handle_incoming_queue(). */
9070d160211SJeremy Fitzhardinge 		NETFRONT_SKB_CB(skb)->page = skb_shinfo(skb)->frags[0].page;
9080d160211SJeremy Fitzhardinge 		NETFRONT_SKB_CB(skb)->offset = rx->offset;
9090d160211SJeremy Fitzhardinge 
		/* Linear area takes at most RX_COPY_THRESHOLD bytes. */
9100d160211SJeremy Fitzhardinge 		len = rx->status;
9110d160211SJeremy Fitzhardinge 		if (len > RX_COPY_THRESHOLD)
9120d160211SJeremy Fitzhardinge 			len = RX_COPY_THRESHOLD;
9130d160211SJeremy Fitzhardinge 		skb_put(skb, len);
9140d160211SJeremy Fitzhardinge 
9150d160211SJeremy Fitzhardinge 		if (rx->status > len) {
			/* Remainder of the first chunk stays in frags[0]. */
9160d160211SJeremy Fitzhardinge 			skb_shinfo(skb)->frags[0].page_offset =
9170d160211SJeremy Fitzhardinge 				rx->offset + len;
9180d160211SJeremy Fitzhardinge 			skb_shinfo(skb)->frags[0].size = rx->status - len;
9190d160211SJeremy Fitzhardinge 			skb->data_len = rx->status - len;
9200d160211SJeremy Fitzhardinge 		} else {
			/* Everything fits the linear area: drop the fragment. */
9210d160211SJeremy Fitzhardinge 			skb_shinfo(skb)->frags[0].page = NULL;
9220d160211SJeremy Fitzhardinge 			skb_shinfo(skb)->nr_frags = 0;
9230d160211SJeremy Fitzhardinge 		}
9240d160211SJeremy Fitzhardinge 
9250d160211SJeremy Fitzhardinge 		i = xennet_fill_frags(np, skb, &tmpq);
9260d160211SJeremy Fitzhardinge 
9270d160211SJeremy Fitzhardinge 		/*
9280d160211SJeremy Fitzhardinge 		 * Truesize approximates the size of true data plus
9290d160211SJeremy Fitzhardinge 		 * any supervisor overheads. Adding hypervisor
9300d160211SJeremy Fitzhardinge 		 * overheads has been shown to significantly reduce
9310d160211SJeremy Fitzhardinge 		 * achievable bandwidth with the default receive
9320d160211SJeremy Fitzhardinge 		 * buffer size. It is therefore not wise to account
9330d160211SJeremy Fitzhardinge 		 * for it here.
9340d160211SJeremy Fitzhardinge 		 *
9350d160211SJeremy Fitzhardinge 		 * After alloc_skb(RX_COPY_THRESHOLD), truesize is set
9360d160211SJeremy Fitzhardinge 		 * to RX_COPY_THRESHOLD + the supervisor
9370d160211SJeremy Fitzhardinge 		 * overheads. Here, we add the size of the data pulled
9380d160211SJeremy Fitzhardinge 		 * in xennet_fill_frags().
9390d160211SJeremy Fitzhardinge 		 *
9400d160211SJeremy Fitzhardinge 		 * We also adjust for any unused space in the main
9410d160211SJeremy Fitzhardinge 		 * data area by subtracting (RX_COPY_THRESHOLD -
9420d160211SJeremy Fitzhardinge 		 * len). This is especially important with drivers
9430d160211SJeremy Fitzhardinge 		 * which split incoming packets into header and data,
9440d160211SJeremy Fitzhardinge 		 * using only 66 bytes of the main data area (see the
9450d160211SJeremy Fitzhardinge 		 * e1000 driver for example.)  On such systems,
9460d160211SJeremy Fitzhardinge 		 * without this last adjustment, our achievable
9470d160211SJeremy Fitzhardinge 		 * receive throughput using the standard receive
9480d160211SJeremy Fitzhardinge 		 * buffer size was cut by 25%(!!!).
9490d160211SJeremy Fitzhardinge 		 */
9500d160211SJeremy Fitzhardinge 		skb->truesize += skb->data_len - (RX_COPY_THRESHOLD - len);
9510d160211SJeremy Fitzhardinge 		skb->len += skb->data_len;
9520d160211SJeremy Fitzhardinge 
9530d160211SJeremy Fitzhardinge 		if (rx->flags & NETRXF_csum_blank)
9540d160211SJeremy Fitzhardinge 			skb->ip_summed = CHECKSUM_PARTIAL;
9550d160211SJeremy Fitzhardinge 		else if (rx->flags & NETRXF_data_validated)
9560d160211SJeremy Fitzhardinge 			skb->ip_summed = CHECKSUM_UNNECESSARY;
9570d160211SJeremy Fitzhardinge 
9580d160211SJeremy Fitzhardinge 		__skb_queue_tail(&rxq, skb);
9590d160211SJeremy Fitzhardinge 
		/* i was the last response used; step past it. */
9600d160211SJeremy Fitzhardinge 		np->rx.rsp_cons = ++i;
9610d160211SJeremy Fitzhardinge 		work_done++;
9620d160211SJeremy Fitzhardinge 	}
9630d160211SJeremy Fitzhardinge 
96456cfe5d0SWang Chen 	__skb_queue_purge(&errq);
9650d160211SJeremy Fitzhardinge 
	/* Packets dropped during delivery do not count as work done. */
9660d160211SJeremy Fitzhardinge 	work_done -= handle_incoming_queue(dev, &rxq);
9670d160211SJeremy Fitzhardinge 
9680d160211SJeremy Fitzhardinge 	/* If we get a callback with very few responses, reduce fill target. */
9690d160211SJeremy Fitzhardinge 	/* NB. Note exponential increase, linear decrease. */
9700d160211SJeremy Fitzhardinge 	if (((np->rx.req_prod_pvt - np->rx.sring->rsp_prod) >
9710d160211SJeremy Fitzhardinge 	     ((3*np->rx_target) / 4)) &&
9720d160211SJeremy Fitzhardinge 	    (--np->rx_target < np->rx_min_target))
9730d160211SJeremy Fitzhardinge 		np->rx_target = np->rx_min_target;
9740d160211SJeremy Fitzhardinge 
9750d160211SJeremy Fitzhardinge 	xennet_alloc_rx_buffers(dev);
9760d160211SJeremy Fitzhardinge 
9770d160211SJeremy Fitzhardinge 	if (work_done < budget) {
978bea3348eSStephen Hemminger 		int more_to_do = 0;
979bea3348eSStephen Hemminger 
		/*
		 * Re-check the ring and complete NAPI with local interrupts
		 * off, so the two steps are not separated by an interrupt
		 * on this CPU.
		 */
9800d160211SJeremy Fitzhardinge 		local_irq_save(flags);
9810d160211SJeremy Fitzhardinge 
9820d160211SJeremy Fitzhardinge 		RING_FINAL_CHECK_FOR_RESPONSES(&np->rx, more_to_do);
9830d160211SJeremy Fitzhardinge 		if (!more_to_do)
984288379f0SBen Hutchings 			__napi_complete(napi);
9850d160211SJeremy Fitzhardinge 
9860d160211SJeremy Fitzhardinge 		local_irq_restore(flags);
9870d160211SJeremy Fitzhardinge 	}
9880d160211SJeremy Fitzhardinge 
9890d160211SJeremy Fitzhardinge 	spin_unlock(&np->rx_lock);
9900d160211SJeremy Fitzhardinge 
991bea3348eSStephen Hemminger 	return work_done;
9920d160211SJeremy Fitzhardinge }
9930d160211SJeremy Fitzhardinge 
9940d160211SJeremy Fitzhardinge static int xennet_change_mtu(struct net_device *dev, int mtu)
9950d160211SJeremy Fitzhardinge {
9960d160211SJeremy Fitzhardinge 	int max = xennet_can_sg(dev) ? 65535 - ETH_HLEN : ETH_DATA_LEN;
9970d160211SJeremy Fitzhardinge 
9980d160211SJeremy Fitzhardinge 	if (mtu > max)
9990d160211SJeremy Fitzhardinge 		return -EINVAL;
10000d160211SJeremy Fitzhardinge 	dev->mtu = mtu;
10010d160211SJeremy Fitzhardinge 	return 0;
10020d160211SJeremy Fitzhardinge }
10030d160211SJeremy Fitzhardinge 
10040d160211SJeremy Fitzhardinge static void xennet_release_tx_bufs(struct netfront_info *np)
10050d160211SJeremy Fitzhardinge {
10060d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
10070d160211SJeremy Fitzhardinge 	int i;
10080d160211SJeremy Fitzhardinge 
10090d160211SJeremy Fitzhardinge 	for (i = 0; i < NET_TX_RING_SIZE; i++) {
10100d160211SJeremy Fitzhardinge 		/* Skip over entries which are actually freelist references */
10111ffb40b8SIsaku Yamahata 		if (skb_entry_is_link(&np->tx_skbs[i]))
10120d160211SJeremy Fitzhardinge 			continue;
10130d160211SJeremy Fitzhardinge 
10140d160211SJeremy Fitzhardinge 		skb = np->tx_skbs[i].skb;
10150d160211SJeremy Fitzhardinge 		gnttab_end_foreign_access_ref(np->grant_tx_ref[i],
10160d160211SJeremy Fitzhardinge 					      GNTMAP_readonly);
10170d160211SJeremy Fitzhardinge 		gnttab_release_grant_reference(&np->gref_tx_head,
10180d160211SJeremy Fitzhardinge 					       np->grant_tx_ref[i]);
10190d160211SJeremy Fitzhardinge 		np->grant_tx_ref[i] = GRANT_INVALID_REF;
10200d160211SJeremy Fitzhardinge 		add_id_to_freelist(&np->tx_skb_freelist, np->tx_skbs, i);
10210d160211SJeremy Fitzhardinge 		dev_kfree_skb_irq(skb);
10220d160211SJeremy Fitzhardinge 	}
10230d160211SJeremy Fitzhardinge }
10240d160211SJeremy Fitzhardinge 
/*
 * xennet_release_rx_bufs - release the rx buffers posted to the backend.
 *
 * NOTE: as written this function is a stub. It logs a "fix me for
 * copying receiver" warning and returns immediately, so no rx buffer or
 * grant reference is actually released here. Everything after the
 * early return is unreachable; it walks grant_rx_ref[] using the
 * foreign-transfer grant calls and remaps transferred pages.
 * NOTE(review): presumably kept as a reference for a future
 * copying-receiver implementation -- confirm before deleting.
 */
10250d160211SJeremy Fitzhardinge static void xennet_release_rx_bufs(struct netfront_info *np)
10260d160211SJeremy Fitzhardinge {
10270d160211SJeremy Fitzhardinge 	struct mmu_update      *mmu = np->rx_mmu;
10280d160211SJeremy Fitzhardinge 	struct multicall_entry *mcl = np->rx_mcl;
10290d160211SJeremy Fitzhardinge 	struct sk_buff_head free_list;
10300d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
10310d160211SJeremy Fitzhardinge 	unsigned long mfn;
10320d160211SJeremy Fitzhardinge 	int xfer = 0, noxfer = 0, unused = 0;
10330d160211SJeremy Fitzhardinge 	int id, ref;
10340d160211SJeremy Fitzhardinge 
10350d160211SJeremy Fitzhardinge 	dev_warn(&np->netdev->dev, "%s: fix me for copying receiver.\n",
10360d160211SJeremy Fitzhardinge 			 __func__);
	/* Unconditional bail-out: nothing below this line is executed. */
10370d160211SJeremy Fitzhardinge 	return;
10380d160211SJeremy Fitzhardinge 
10390d160211SJeremy Fitzhardinge 	skb_queue_head_init(&free_list);
10400d160211SJeremy Fitzhardinge 
10410d160211SJeremy Fitzhardinge 	spin_lock_bh(&np->rx_lock);
10420d160211SJeremy Fitzhardinge 
10430d160211SJeremy Fitzhardinge 	for (id = 0; id < NET_RX_RING_SIZE; id++) {
10440d160211SJeremy Fitzhardinge 		ref = np->grant_rx_ref[id];
10450d160211SJeremy Fitzhardinge 		if (ref == GRANT_INVALID_REF) {
10460d160211SJeremy Fitzhardinge 			unused++;
10470d160211SJeremy Fitzhardinge 			continue;
10480d160211SJeremy Fitzhardinge 		}
10490d160211SJeremy Fitzhardinge 
10500d160211SJeremy Fitzhardinge 		skb = np->rx_skbs[id];
10510d160211SJeremy Fitzhardinge 		mfn = gnttab_end_foreign_transfer_ref(ref);
10520d160211SJeremy Fitzhardinge 		gnttab_release_grant_reference(&np->gref_rx_head, ref);
10530d160211SJeremy Fitzhardinge 		np->grant_rx_ref[id] = GRANT_INVALID_REF;
10540d160211SJeremy Fitzhardinge 
		/* mfn == 0: no frame came back for this slot; just free the skb. */
10550d160211SJeremy Fitzhardinge 		if (0 == mfn) {
10560d160211SJeremy Fitzhardinge 			skb_shinfo(skb)->nr_frags = 0;
10570d160211SJeremy Fitzhardinge 			dev_kfree_skb(skb);
10580d160211SJeremy Fitzhardinge 			noxfer++;
10590d160211SJeremy Fitzhardinge 			continue;
10600d160211SJeremy Fitzhardinge 		}
10610d160211SJeremy Fitzhardinge 
10620d160211SJeremy Fitzhardinge 		if (!xen_feature(XENFEAT_auto_translated_physmap)) {
10630d160211SJeremy Fitzhardinge 			/* Remap the page. */
10640d160211SJeremy Fitzhardinge 			struct page *page = skb_shinfo(skb)->frags[0].page;
10650d160211SJeremy Fitzhardinge 			unsigned long pfn = page_to_pfn(page);
10660d160211SJeremy Fitzhardinge 			void *vaddr = page_address(page);
10670d160211SJeremy Fitzhardinge 
10680d160211SJeremy Fitzhardinge 			MULTI_update_va_mapping(mcl, (unsigned long)vaddr,
10690d160211SJeremy Fitzhardinge 						mfn_pte(mfn, PAGE_KERNEL),
10700d160211SJeremy Fitzhardinge 						0);
10710d160211SJeremy Fitzhardinge 			mcl++;
10720d160211SJeremy Fitzhardinge 			mmu->ptr = ((u64)mfn << PAGE_SHIFT)
10730d160211SJeremy Fitzhardinge 				| MMU_MACHPHYS_UPDATE;
10740d160211SJeremy Fitzhardinge 			mmu->val = pfn;
10750d160211SJeremy Fitzhardinge 			mmu++;
10760d160211SJeremy Fitzhardinge 
10770d160211SJeremy Fitzhardinge 			set_phys_to_machine(pfn, mfn);
10780d160211SJeremy Fitzhardinge 		}
10790d160211SJeremy Fitzhardinge 		__skb_queue_tail(&free_list, skb);
10800d160211SJeremy Fitzhardinge 		xfer++;
10810d160211SJeremy Fitzhardinge 	}
10820d160211SJeremy Fitzhardinge 
10830d160211SJeremy Fitzhardinge 	dev_info(&np->netdev->dev, "%s: %d xfer, %d noxfer, %d unused\n",
10840d160211SJeremy Fitzhardinge 		 __func__, xfer, noxfer, unused);
10850d160211SJeremy Fitzhardinge 
10860d160211SJeremy Fitzhardinge 	if (xfer) {
10870d160211SJeremy Fitzhardinge 		if (!xen_feature(XENFEAT_auto_translated_physmap)) {
10880d160211SJeremy Fitzhardinge 			/* Do all the remapping work and M2P updates. */
10890d160211SJeremy Fitzhardinge 			MULTI_mmu_update(mcl, np->rx_mmu, mmu - np->rx_mmu,
109079ea13ceSAl Viro 					 NULL, DOMID_SELF);
10910d160211SJeremy Fitzhardinge 			mcl++;
10920d160211SJeremy Fitzhardinge 			HYPERVISOR_multicall(np->rx_mcl, mcl - np->rx_mcl);
10930d160211SJeremy Fitzhardinge 		}
10940d160211SJeremy Fitzhardinge 	}
10950d160211SJeremy Fitzhardinge 
109656cfe5d0SWang Chen 	__skb_queue_purge(&free_list);
10970d160211SJeremy Fitzhardinge 
10980d160211SJeremy Fitzhardinge 	spin_unlock_bh(&np->rx_lock);
10990d160211SJeremy Fitzhardinge }
11000d160211SJeremy Fitzhardinge 
11010d160211SJeremy Fitzhardinge static void xennet_uninit(struct net_device *dev)
11020d160211SJeremy Fitzhardinge {
11030d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
11040d160211SJeremy Fitzhardinge 	xennet_release_tx_bufs(np);
11050d160211SJeremy Fitzhardinge 	xennet_release_rx_bufs(np);
11060d160211SJeremy Fitzhardinge 	gnttab_free_grant_references(np->gref_tx_head);
11070d160211SJeremy Fitzhardinge 	gnttab_free_grant_references(np->gref_rx_head);
11080d160211SJeremy Fitzhardinge }
11090d160211SJeremy Fitzhardinge 
11100a0b9d2eSStephen Hemminger static const struct net_device_ops xennet_netdev_ops = {
11110a0b9d2eSStephen Hemminger 	.ndo_open            = xennet_open,
11120a0b9d2eSStephen Hemminger 	.ndo_uninit          = xennet_uninit,
11130a0b9d2eSStephen Hemminger 	.ndo_stop            = xennet_close,
11140a0b9d2eSStephen Hemminger 	.ndo_start_xmit      = xennet_start_xmit,
11150a0b9d2eSStephen Hemminger 	.ndo_change_mtu	     = xennet_change_mtu,
11160a0b9d2eSStephen Hemminger 	.ndo_set_mac_address = eth_mac_addr,
11170a0b9d2eSStephen Hemminger 	.ndo_validate_addr   = eth_validate_addr,
11180a0b9d2eSStephen Hemminger };
11190a0b9d2eSStephen Hemminger 
11200d160211SJeremy Fitzhardinge static struct net_device * __devinit xennet_create_dev(struct xenbus_device *dev)
11210d160211SJeremy Fitzhardinge {
11220d160211SJeremy Fitzhardinge 	int i, err;
11230d160211SJeremy Fitzhardinge 	struct net_device *netdev;
11240d160211SJeremy Fitzhardinge 	struct netfront_info *np;
11250d160211SJeremy Fitzhardinge 
11260d160211SJeremy Fitzhardinge 	netdev = alloc_etherdev(sizeof(struct netfront_info));
11270d160211SJeremy Fitzhardinge 	if (!netdev) {
11280d160211SJeremy Fitzhardinge 		printk(KERN_WARNING "%s> alloc_etherdev failed.\n",
11290d160211SJeremy Fitzhardinge 		       __func__);
11300d160211SJeremy Fitzhardinge 		return ERR_PTR(-ENOMEM);
11310d160211SJeremy Fitzhardinge 	}
11320d160211SJeremy Fitzhardinge 
11330d160211SJeremy Fitzhardinge 	np                   = netdev_priv(netdev);
11340d160211SJeremy Fitzhardinge 	np->xbdev            = dev;
11350d160211SJeremy Fitzhardinge 
11360d160211SJeremy Fitzhardinge 	spin_lock_init(&np->tx_lock);
11370d160211SJeremy Fitzhardinge 	spin_lock_init(&np->rx_lock);
11380d160211SJeremy Fitzhardinge 
11390d160211SJeremy Fitzhardinge 	skb_queue_head_init(&np->rx_batch);
11400d160211SJeremy Fitzhardinge 	np->rx_target     = RX_DFL_MIN_TARGET;
11410d160211SJeremy Fitzhardinge 	np->rx_min_target = RX_DFL_MIN_TARGET;
11420d160211SJeremy Fitzhardinge 	np->rx_max_target = RX_MAX_TARGET;
11430d160211SJeremy Fitzhardinge 
11440d160211SJeremy Fitzhardinge 	init_timer(&np->rx_refill_timer);
11450d160211SJeremy Fitzhardinge 	np->rx_refill_timer.data = (unsigned long)netdev;
11460d160211SJeremy Fitzhardinge 	np->rx_refill_timer.function = rx_refill_timeout;
11470d160211SJeremy Fitzhardinge 
11480d160211SJeremy Fitzhardinge 	/* Initialise tx_skbs as a free chain containing every entry. */
11490d160211SJeremy Fitzhardinge 	np->tx_skb_freelist = 0;
11500d160211SJeremy Fitzhardinge 	for (i = 0; i < NET_TX_RING_SIZE; i++) {
11511ffb40b8SIsaku Yamahata 		skb_entry_set_link(&np->tx_skbs[i], i+1);
11520d160211SJeremy Fitzhardinge 		np->grant_tx_ref[i] = GRANT_INVALID_REF;
11530d160211SJeremy Fitzhardinge 	}
11540d160211SJeremy Fitzhardinge 
11550d160211SJeremy Fitzhardinge 	/* Clear out rx_skbs */
11560d160211SJeremy Fitzhardinge 	for (i = 0; i < NET_RX_RING_SIZE; i++) {
11570d160211SJeremy Fitzhardinge 		np->rx_skbs[i] = NULL;
11580d160211SJeremy Fitzhardinge 		np->grant_rx_ref[i] = GRANT_INVALID_REF;
11590d160211SJeremy Fitzhardinge 	}
11600d160211SJeremy Fitzhardinge 
11610d160211SJeremy Fitzhardinge 	/* A grant for every tx ring slot */
11620d160211SJeremy Fitzhardinge 	if (gnttab_alloc_grant_references(TX_MAX_TARGET,
11630d160211SJeremy Fitzhardinge 					  &np->gref_tx_head) < 0) {
11640d160211SJeremy Fitzhardinge 		printk(KERN_ALERT "#### netfront can't alloc tx grant refs\n");
11650d160211SJeremy Fitzhardinge 		err = -ENOMEM;
11660d160211SJeremy Fitzhardinge 		goto exit;
11670d160211SJeremy Fitzhardinge 	}
11680d160211SJeremy Fitzhardinge 	/* A grant for every rx ring slot */
11690d160211SJeremy Fitzhardinge 	if (gnttab_alloc_grant_references(RX_MAX_TARGET,
11700d160211SJeremy Fitzhardinge 					  &np->gref_rx_head) < 0) {
11710d160211SJeremy Fitzhardinge 		printk(KERN_ALERT "#### netfront can't alloc rx grant refs\n");
11720d160211SJeremy Fitzhardinge 		err = -ENOMEM;
11730d160211SJeremy Fitzhardinge 		goto exit_free_tx;
11740d160211SJeremy Fitzhardinge 	}
11750d160211SJeremy Fitzhardinge 
11760a0b9d2eSStephen Hemminger 	netdev->netdev_ops	= &xennet_netdev_ops;
11770a0b9d2eSStephen Hemminger 
1178bea3348eSStephen Hemminger 	netif_napi_add(netdev, &np->napi, xennet_poll, 64);
11790d160211SJeremy Fitzhardinge 	netdev->features        = NETIF_F_IP_CSUM;
11800d160211SJeremy Fitzhardinge 
11810d160211SJeremy Fitzhardinge 	SET_ETHTOOL_OPS(netdev, &xennet_ethtool_ops);
11820d160211SJeremy Fitzhardinge 	SET_NETDEV_DEV(netdev, &dev->dev);
11830d160211SJeremy Fitzhardinge 
11840d160211SJeremy Fitzhardinge 	np->netdev = netdev;
11850d160211SJeremy Fitzhardinge 
11860d160211SJeremy Fitzhardinge 	netif_carrier_off(netdev);
11870d160211SJeremy Fitzhardinge 
11880d160211SJeremy Fitzhardinge 	return netdev;
11890d160211SJeremy Fitzhardinge 
11900d160211SJeremy Fitzhardinge  exit_free_tx:
11910d160211SJeremy Fitzhardinge 	gnttab_free_grant_references(np->gref_tx_head);
11920d160211SJeremy Fitzhardinge  exit:
11930d160211SJeremy Fitzhardinge 	free_netdev(netdev);
11940d160211SJeremy Fitzhardinge 	return ERR_PTR(err);
11950d160211SJeremy Fitzhardinge }
11960d160211SJeremy Fitzhardinge 
11970d160211SJeremy Fitzhardinge /**
11980d160211SJeremy Fitzhardinge  * Entry point to this code when a new device is created.  Allocate the basic
11990d160211SJeremy Fitzhardinge  * structures and the ring buffers for communication with the backend, and
12000d160211SJeremy Fitzhardinge  * inform the backend of the appropriate details for those.
12010d160211SJeremy Fitzhardinge  */
12020d160211SJeremy Fitzhardinge static int __devinit netfront_probe(struct xenbus_device *dev,
12030d160211SJeremy Fitzhardinge 				    const struct xenbus_device_id *id)
12040d160211SJeremy Fitzhardinge {
12050d160211SJeremy Fitzhardinge 	int err;
12060d160211SJeremy Fitzhardinge 	struct net_device *netdev;
12070d160211SJeremy Fitzhardinge 	struct netfront_info *info;
12080d160211SJeremy Fitzhardinge 
12090d160211SJeremy Fitzhardinge 	netdev = xennet_create_dev(dev);
12100d160211SJeremy Fitzhardinge 	if (IS_ERR(netdev)) {
12110d160211SJeremy Fitzhardinge 		err = PTR_ERR(netdev);
12120d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "creating netdev");
12130d160211SJeremy Fitzhardinge 		return err;
12140d160211SJeremy Fitzhardinge 	}
12150d160211SJeremy Fitzhardinge 
12160d160211SJeremy Fitzhardinge 	info = netdev_priv(netdev);
12171b713e00SGreg Kroah-Hartman 	dev_set_drvdata(&dev->dev, info);
12180d160211SJeremy Fitzhardinge 
12190d160211SJeremy Fitzhardinge 	err = register_netdev(info->netdev);
12200d160211SJeremy Fitzhardinge 	if (err) {
12210d160211SJeremy Fitzhardinge 		printk(KERN_WARNING "%s: register_netdev err=%d\n",
12220d160211SJeremy Fitzhardinge 		       __func__, err);
12230d160211SJeremy Fitzhardinge 		goto fail;
12240d160211SJeremy Fitzhardinge 	}
12250d160211SJeremy Fitzhardinge 
12260d160211SJeremy Fitzhardinge 	err = xennet_sysfs_addif(info->netdev);
12270d160211SJeremy Fitzhardinge 	if (err) {
12280d160211SJeremy Fitzhardinge 		unregister_netdev(info->netdev);
12290d160211SJeremy Fitzhardinge 		printk(KERN_WARNING "%s: add sysfs failed err=%d\n",
12300d160211SJeremy Fitzhardinge 		       __func__, err);
12310d160211SJeremy Fitzhardinge 		goto fail;
12320d160211SJeremy Fitzhardinge 	}
12330d160211SJeremy Fitzhardinge 
12340d160211SJeremy Fitzhardinge 	return 0;
12350d160211SJeremy Fitzhardinge 
12360d160211SJeremy Fitzhardinge  fail:
12370d160211SJeremy Fitzhardinge 	free_netdev(netdev);
12381b713e00SGreg Kroah-Hartman 	dev_set_drvdata(&dev->dev, NULL);
12390d160211SJeremy Fitzhardinge 	return err;
12400d160211SJeremy Fitzhardinge }
12410d160211SJeremy Fitzhardinge 
12420d160211SJeremy Fitzhardinge static void xennet_end_access(int ref, void *page)
12430d160211SJeremy Fitzhardinge {
12440d160211SJeremy Fitzhardinge 	/* This frees the page as a side-effect */
12450d160211SJeremy Fitzhardinge 	if (ref != GRANT_INVALID_REF)
12460d160211SJeremy Fitzhardinge 		gnttab_end_foreign_access(ref, 0, (unsigned long)page);
12470d160211SJeremy Fitzhardinge }
12480d160211SJeremy Fitzhardinge 
12490d160211SJeremy Fitzhardinge static void xennet_disconnect_backend(struct netfront_info *info)
12500d160211SJeremy Fitzhardinge {
12510d160211SJeremy Fitzhardinge 	/* Stop old i/f to prevent errors whilst we rebuild the state. */
12520d160211SJeremy Fitzhardinge 	spin_lock_bh(&info->rx_lock);
12530d160211SJeremy Fitzhardinge 	spin_lock_irq(&info->tx_lock);
12540d160211SJeremy Fitzhardinge 	netif_carrier_off(info->netdev);
12550d160211SJeremy Fitzhardinge 	spin_unlock_irq(&info->tx_lock);
12560d160211SJeremy Fitzhardinge 	spin_unlock_bh(&info->rx_lock);
12570d160211SJeremy Fitzhardinge 
12580d160211SJeremy Fitzhardinge 	if (info->netdev->irq)
12590d160211SJeremy Fitzhardinge 		unbind_from_irqhandler(info->netdev->irq, info->netdev);
12600d160211SJeremy Fitzhardinge 	info->evtchn = info->netdev->irq = 0;
12610d160211SJeremy Fitzhardinge 
12620d160211SJeremy Fitzhardinge 	/* End access and free the pages */
12630d160211SJeremy Fitzhardinge 	xennet_end_access(info->tx_ring_ref, info->tx.sring);
12640d160211SJeremy Fitzhardinge 	xennet_end_access(info->rx_ring_ref, info->rx.sring);
12650d160211SJeremy Fitzhardinge 
12660d160211SJeremy Fitzhardinge 	info->tx_ring_ref = GRANT_INVALID_REF;
12670d160211SJeremy Fitzhardinge 	info->rx_ring_ref = GRANT_INVALID_REF;
12680d160211SJeremy Fitzhardinge 	info->tx.sring = NULL;
12690d160211SJeremy Fitzhardinge 	info->rx.sring = NULL;
12700d160211SJeremy Fitzhardinge }
12710d160211SJeremy Fitzhardinge 
12720d160211SJeremy Fitzhardinge /**
12730d160211SJeremy Fitzhardinge  * We are reconnecting to the backend, due to a suspend/resume, or a backend
12740d160211SJeremy Fitzhardinge  * driver restart.  We tear down our netif structure and recreate it, but
12750d160211SJeremy Fitzhardinge  * leave the device-layer structures intact so that this is transparent to the
12760d160211SJeremy Fitzhardinge  * rest of the kernel.
12770d160211SJeremy Fitzhardinge  */
12780d160211SJeremy Fitzhardinge static int netfront_resume(struct xenbus_device *dev)
12790d160211SJeremy Fitzhardinge {
12801b713e00SGreg Kroah-Hartman 	struct netfront_info *info = dev_get_drvdata(&dev->dev);
12810d160211SJeremy Fitzhardinge 
12820d160211SJeremy Fitzhardinge 	dev_dbg(&dev->dev, "%s\n", dev->nodename);
12830d160211SJeremy Fitzhardinge 
12840d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
12850d160211SJeremy Fitzhardinge 	return 0;
12860d160211SJeremy Fitzhardinge }
12870d160211SJeremy Fitzhardinge 
12880d160211SJeremy Fitzhardinge static int xen_net_read_mac(struct xenbus_device *dev, u8 mac[])
12890d160211SJeremy Fitzhardinge {
12900d160211SJeremy Fitzhardinge 	char *s, *e, *macstr;
12910d160211SJeremy Fitzhardinge 	int i;
12920d160211SJeremy Fitzhardinge 
12930d160211SJeremy Fitzhardinge 	macstr = s = xenbus_read(XBT_NIL, dev->nodename, "mac", NULL);
12940d160211SJeremy Fitzhardinge 	if (IS_ERR(macstr))
12950d160211SJeremy Fitzhardinge 		return PTR_ERR(macstr);
12960d160211SJeremy Fitzhardinge 
12970d160211SJeremy Fitzhardinge 	for (i = 0; i < ETH_ALEN; i++) {
12980d160211SJeremy Fitzhardinge 		mac[i] = simple_strtoul(s, &e, 16);
12990d160211SJeremy Fitzhardinge 		if ((s == e) || (*e != ((i == ETH_ALEN-1) ? '\0' : ':'))) {
13000d160211SJeremy Fitzhardinge 			kfree(macstr);
13010d160211SJeremy Fitzhardinge 			return -ENOENT;
13020d160211SJeremy Fitzhardinge 		}
13030d160211SJeremy Fitzhardinge 		s = e+1;
13040d160211SJeremy Fitzhardinge 	}
13050d160211SJeremy Fitzhardinge 
13060d160211SJeremy Fitzhardinge 	kfree(macstr);
13070d160211SJeremy Fitzhardinge 	return 0;
13080d160211SJeremy Fitzhardinge }
13090d160211SJeremy Fitzhardinge 
13100d160211SJeremy Fitzhardinge static irqreturn_t xennet_interrupt(int irq, void *dev_id)
13110d160211SJeremy Fitzhardinge {
13120d160211SJeremy Fitzhardinge 	struct net_device *dev = dev_id;
13130d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
13140d160211SJeremy Fitzhardinge 	unsigned long flags;
13150d160211SJeremy Fitzhardinge 
13160d160211SJeremy Fitzhardinge 	spin_lock_irqsave(&np->tx_lock, flags);
13170d160211SJeremy Fitzhardinge 
13180d160211SJeremy Fitzhardinge 	if (likely(netif_carrier_ok(dev))) {
13190d160211SJeremy Fitzhardinge 		xennet_tx_buf_gc(dev);
13200d160211SJeremy Fitzhardinge 		/* Under tx_lock: protects access to rx shared-ring indexes. */
13210d160211SJeremy Fitzhardinge 		if (RING_HAS_UNCONSUMED_RESPONSES(&np->rx))
1322288379f0SBen Hutchings 			napi_schedule(&np->napi);
13230d160211SJeremy Fitzhardinge 	}
13240d160211SJeremy Fitzhardinge 
13250d160211SJeremy Fitzhardinge 	spin_unlock_irqrestore(&np->tx_lock, flags);
13260d160211SJeremy Fitzhardinge 
13270d160211SJeremy Fitzhardinge 	return IRQ_HANDLED;
13280d160211SJeremy Fitzhardinge }
13290d160211SJeremy Fitzhardinge 
13300d160211SJeremy Fitzhardinge static int setup_netfront(struct xenbus_device *dev, struct netfront_info *info)
13310d160211SJeremy Fitzhardinge {
13320d160211SJeremy Fitzhardinge 	struct xen_netif_tx_sring *txs;
13330d160211SJeremy Fitzhardinge 	struct xen_netif_rx_sring *rxs;
13340d160211SJeremy Fitzhardinge 	int err;
13350d160211SJeremy Fitzhardinge 	struct net_device *netdev = info->netdev;
13360d160211SJeremy Fitzhardinge 
13370d160211SJeremy Fitzhardinge 	info->tx_ring_ref = GRANT_INVALID_REF;
13380d160211SJeremy Fitzhardinge 	info->rx_ring_ref = GRANT_INVALID_REF;
13390d160211SJeremy Fitzhardinge 	info->rx.sring = NULL;
13400d160211SJeremy Fitzhardinge 	info->tx.sring = NULL;
13410d160211SJeremy Fitzhardinge 	netdev->irq = 0;
13420d160211SJeremy Fitzhardinge 
13430d160211SJeremy Fitzhardinge 	err = xen_net_read_mac(dev, netdev->dev_addr);
13440d160211SJeremy Fitzhardinge 	if (err) {
13450d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "parsing %s/mac", dev->nodename);
13460d160211SJeremy Fitzhardinge 		goto fail;
13470d160211SJeremy Fitzhardinge 	}
13480d160211SJeremy Fitzhardinge 
1349a144ff09SIan Campbell 	txs = (struct xen_netif_tx_sring *)get_zeroed_page(GFP_NOIO | __GFP_HIGH);
13500d160211SJeremy Fitzhardinge 	if (!txs) {
13510d160211SJeremy Fitzhardinge 		err = -ENOMEM;
13520d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "allocating tx ring page");
13530d160211SJeremy Fitzhardinge 		goto fail;
13540d160211SJeremy Fitzhardinge 	}
13550d160211SJeremy Fitzhardinge 	SHARED_RING_INIT(txs);
13560d160211SJeremy Fitzhardinge 	FRONT_RING_INIT(&info->tx, txs, PAGE_SIZE);
13570d160211SJeremy Fitzhardinge 
13580d160211SJeremy Fitzhardinge 	err = xenbus_grant_ring(dev, virt_to_mfn(txs));
13590d160211SJeremy Fitzhardinge 	if (err < 0) {
13600d160211SJeremy Fitzhardinge 		free_page((unsigned long)txs);
13610d160211SJeremy Fitzhardinge 		goto fail;
13620d160211SJeremy Fitzhardinge 	}
13630d160211SJeremy Fitzhardinge 
13640d160211SJeremy Fitzhardinge 	info->tx_ring_ref = err;
1365a144ff09SIan Campbell 	rxs = (struct xen_netif_rx_sring *)get_zeroed_page(GFP_NOIO | __GFP_HIGH);
13660d160211SJeremy Fitzhardinge 	if (!rxs) {
13670d160211SJeremy Fitzhardinge 		err = -ENOMEM;
13680d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "allocating rx ring page");
13690d160211SJeremy Fitzhardinge 		goto fail;
13700d160211SJeremy Fitzhardinge 	}
13710d160211SJeremy Fitzhardinge 	SHARED_RING_INIT(rxs);
13720d160211SJeremy Fitzhardinge 	FRONT_RING_INIT(&info->rx, rxs, PAGE_SIZE);
13730d160211SJeremy Fitzhardinge 
13740d160211SJeremy Fitzhardinge 	err = xenbus_grant_ring(dev, virt_to_mfn(rxs));
13750d160211SJeremy Fitzhardinge 	if (err < 0) {
13760d160211SJeremy Fitzhardinge 		free_page((unsigned long)rxs);
13770d160211SJeremy Fitzhardinge 		goto fail;
13780d160211SJeremy Fitzhardinge 	}
13790d160211SJeremy Fitzhardinge 	info->rx_ring_ref = err;
13800d160211SJeremy Fitzhardinge 
13810d160211SJeremy Fitzhardinge 	err = xenbus_alloc_evtchn(dev, &info->evtchn);
13820d160211SJeremy Fitzhardinge 	if (err)
13830d160211SJeremy Fitzhardinge 		goto fail;
13840d160211SJeremy Fitzhardinge 
13850d160211SJeremy Fitzhardinge 	err = bind_evtchn_to_irqhandler(info->evtchn, xennet_interrupt,
13860d160211SJeremy Fitzhardinge 					IRQF_SAMPLE_RANDOM, netdev->name,
13870d160211SJeremy Fitzhardinge 					netdev);
13880d160211SJeremy Fitzhardinge 	if (err < 0)
13890d160211SJeremy Fitzhardinge 		goto fail;
13900d160211SJeremy Fitzhardinge 	netdev->irq = err;
13910d160211SJeremy Fitzhardinge 	return 0;
13920d160211SJeremy Fitzhardinge 
13930d160211SJeremy Fitzhardinge  fail:
13940d160211SJeremy Fitzhardinge 	return err;
13950d160211SJeremy Fitzhardinge }
13960d160211SJeremy Fitzhardinge 
13970d160211SJeremy Fitzhardinge /* Common code used when first setting up, and when resuming. */
1398f502bf2bSIan Campbell static int talk_to_netback(struct xenbus_device *dev,
13990d160211SJeremy Fitzhardinge 			   struct netfront_info *info)
14000d160211SJeremy Fitzhardinge {
14010d160211SJeremy Fitzhardinge 	const char *message;
14020d160211SJeremy Fitzhardinge 	struct xenbus_transaction xbt;
14030d160211SJeremy Fitzhardinge 	int err;
14040d160211SJeremy Fitzhardinge 
14050d160211SJeremy Fitzhardinge 	/* Create shared ring, alloc event channel. */
14060d160211SJeremy Fitzhardinge 	err = setup_netfront(dev, info);
14070d160211SJeremy Fitzhardinge 	if (err)
14080d160211SJeremy Fitzhardinge 		goto out;
14090d160211SJeremy Fitzhardinge 
14100d160211SJeremy Fitzhardinge again:
14110d160211SJeremy Fitzhardinge 	err = xenbus_transaction_start(&xbt);
14120d160211SJeremy Fitzhardinge 	if (err) {
14130d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "starting transaction");
14140d160211SJeremy Fitzhardinge 		goto destroy_ring;
14150d160211SJeremy Fitzhardinge 	}
14160d160211SJeremy Fitzhardinge 
14170d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "tx-ring-ref", "%u",
14180d160211SJeremy Fitzhardinge 			    info->tx_ring_ref);
14190d160211SJeremy Fitzhardinge 	if (err) {
14200d160211SJeremy Fitzhardinge 		message = "writing tx ring-ref";
14210d160211SJeremy Fitzhardinge 		goto abort_transaction;
14220d160211SJeremy Fitzhardinge 	}
14230d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "rx-ring-ref", "%u",
14240d160211SJeremy Fitzhardinge 			    info->rx_ring_ref);
14250d160211SJeremy Fitzhardinge 	if (err) {
14260d160211SJeremy Fitzhardinge 		message = "writing rx ring-ref";
14270d160211SJeremy Fitzhardinge 		goto abort_transaction;
14280d160211SJeremy Fitzhardinge 	}
14290d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename,
14300d160211SJeremy Fitzhardinge 			    "event-channel", "%u", info->evtchn);
14310d160211SJeremy Fitzhardinge 	if (err) {
14320d160211SJeremy Fitzhardinge 		message = "writing event-channel";
14330d160211SJeremy Fitzhardinge 		goto abort_transaction;
14340d160211SJeremy Fitzhardinge 	}
14350d160211SJeremy Fitzhardinge 
14360d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "request-rx-copy", "%u",
14370d160211SJeremy Fitzhardinge 			    1);
14380d160211SJeremy Fitzhardinge 	if (err) {
14390d160211SJeremy Fitzhardinge 		message = "writing request-rx-copy";
14400d160211SJeremy Fitzhardinge 		goto abort_transaction;
14410d160211SJeremy Fitzhardinge 	}
14420d160211SJeremy Fitzhardinge 
14430d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-rx-notify", "%d", 1);
14440d160211SJeremy Fitzhardinge 	if (err) {
14450d160211SJeremy Fitzhardinge 		message = "writing feature-rx-notify";
14460d160211SJeremy Fitzhardinge 		goto abort_transaction;
14470d160211SJeremy Fitzhardinge 	}
14480d160211SJeremy Fitzhardinge 
14490d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-sg", "%d", 1);
14500d160211SJeremy Fitzhardinge 	if (err) {
14510d160211SJeremy Fitzhardinge 		message = "writing feature-sg";
14520d160211SJeremy Fitzhardinge 		goto abort_transaction;
14530d160211SJeremy Fitzhardinge 	}
14540d160211SJeremy Fitzhardinge 
14550d160211SJeremy Fitzhardinge 	err = xenbus_printf(xbt, dev->nodename, "feature-gso-tcpv4", "%d", 1);
14560d160211SJeremy Fitzhardinge 	if (err) {
14570d160211SJeremy Fitzhardinge 		message = "writing feature-gso-tcpv4";
14580d160211SJeremy Fitzhardinge 		goto abort_transaction;
14590d160211SJeremy Fitzhardinge 	}
14600d160211SJeremy Fitzhardinge 
14610d160211SJeremy Fitzhardinge 	err = xenbus_transaction_end(xbt, 0);
14620d160211SJeremy Fitzhardinge 	if (err) {
14630d160211SJeremy Fitzhardinge 		if (err == -EAGAIN)
14640d160211SJeremy Fitzhardinge 			goto again;
14650d160211SJeremy Fitzhardinge 		xenbus_dev_fatal(dev, err, "completing transaction");
14660d160211SJeremy Fitzhardinge 		goto destroy_ring;
14670d160211SJeremy Fitzhardinge 	}
14680d160211SJeremy Fitzhardinge 
14690d160211SJeremy Fitzhardinge 	return 0;
14700d160211SJeremy Fitzhardinge 
14710d160211SJeremy Fitzhardinge  abort_transaction:
14720d160211SJeremy Fitzhardinge 	xenbus_transaction_end(xbt, 1);
14730d160211SJeremy Fitzhardinge 	xenbus_dev_fatal(dev, err, "%s", message);
14740d160211SJeremy Fitzhardinge  destroy_ring:
14750d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
14760d160211SJeremy Fitzhardinge  out:
14770d160211SJeremy Fitzhardinge 	return err;
14780d160211SJeremy Fitzhardinge }
14790d160211SJeremy Fitzhardinge 
14800d160211SJeremy Fitzhardinge static int xennet_set_sg(struct net_device *dev, u32 data)
14810d160211SJeremy Fitzhardinge {
14820d160211SJeremy Fitzhardinge 	if (data) {
14830d160211SJeremy Fitzhardinge 		struct netfront_info *np = netdev_priv(dev);
14840d160211SJeremy Fitzhardinge 		int val;
14850d160211SJeremy Fitzhardinge 
14860d160211SJeremy Fitzhardinge 		if (xenbus_scanf(XBT_NIL, np->xbdev->otherend, "feature-sg",
14870d160211SJeremy Fitzhardinge 				 "%d", &val) < 0)
14880d160211SJeremy Fitzhardinge 			val = 0;
14890d160211SJeremy Fitzhardinge 		if (!val)
14900d160211SJeremy Fitzhardinge 			return -ENOSYS;
14910d160211SJeremy Fitzhardinge 	} else if (dev->mtu > ETH_DATA_LEN)
14920d160211SJeremy Fitzhardinge 		dev->mtu = ETH_DATA_LEN;
14930d160211SJeremy Fitzhardinge 
14940d160211SJeremy Fitzhardinge 	return ethtool_op_set_sg(dev, data);
14950d160211SJeremy Fitzhardinge }
14960d160211SJeremy Fitzhardinge 
14970d160211SJeremy Fitzhardinge static int xennet_set_tso(struct net_device *dev, u32 data)
14980d160211SJeremy Fitzhardinge {
14990d160211SJeremy Fitzhardinge 	if (data) {
15000d160211SJeremy Fitzhardinge 		struct netfront_info *np = netdev_priv(dev);
15010d160211SJeremy Fitzhardinge 		int val;
15020d160211SJeremy Fitzhardinge 
15030d160211SJeremy Fitzhardinge 		if (xenbus_scanf(XBT_NIL, np->xbdev->otherend,
15040d160211SJeremy Fitzhardinge 				 "feature-gso-tcpv4", "%d", &val) < 0)
15050d160211SJeremy Fitzhardinge 			val = 0;
15060d160211SJeremy Fitzhardinge 		if (!val)
15070d160211SJeremy Fitzhardinge 			return -ENOSYS;
15080d160211SJeremy Fitzhardinge 	}
15090d160211SJeremy Fitzhardinge 
15100d160211SJeremy Fitzhardinge 	return ethtool_op_set_tso(dev, data);
15110d160211SJeremy Fitzhardinge }
15120d160211SJeremy Fitzhardinge 
15130d160211SJeremy Fitzhardinge static void xennet_set_features(struct net_device *dev)
15140d160211SJeremy Fitzhardinge {
15150d160211SJeremy Fitzhardinge 	/* Turn off all GSO bits except ROBUST. */
151643eb99c5SChris Leech 	dev->features &= ~NETIF_F_GSO_MASK;
15170d160211SJeremy Fitzhardinge 	dev->features |= NETIF_F_GSO_ROBUST;
15180d160211SJeremy Fitzhardinge 	xennet_set_sg(dev, 0);
15190d160211SJeremy Fitzhardinge 
15200d160211SJeremy Fitzhardinge 	/* We need checksum offload to enable scatter/gather and TSO. */
15210d160211SJeremy Fitzhardinge 	if (!(dev->features & NETIF_F_IP_CSUM))
15220d160211SJeremy Fitzhardinge 		return;
15230d160211SJeremy Fitzhardinge 
15240d160211SJeremy Fitzhardinge 	if (!xennet_set_sg(dev, 1))
15250d160211SJeremy Fitzhardinge 		xennet_set_tso(dev, 1);
15260d160211SJeremy Fitzhardinge }
15270d160211SJeremy Fitzhardinge 
15280d160211SJeremy Fitzhardinge static int xennet_connect(struct net_device *dev)
15290d160211SJeremy Fitzhardinge {
15300d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(dev);
15310d160211SJeremy Fitzhardinge 	int i, requeue_idx, err;
15320d160211SJeremy Fitzhardinge 	struct sk_buff *skb;
15330d160211SJeremy Fitzhardinge 	grant_ref_t ref;
15340d160211SJeremy Fitzhardinge 	struct xen_netif_rx_request *req;
15350d160211SJeremy Fitzhardinge 	unsigned int feature_rx_copy;
15360d160211SJeremy Fitzhardinge 
15370d160211SJeremy Fitzhardinge 	err = xenbus_scanf(XBT_NIL, np->xbdev->otherend,
15380d160211SJeremy Fitzhardinge 			   "feature-rx-copy", "%u", &feature_rx_copy);
15390d160211SJeremy Fitzhardinge 	if (err != 1)
15400d160211SJeremy Fitzhardinge 		feature_rx_copy = 0;
15410d160211SJeremy Fitzhardinge 
15420d160211SJeremy Fitzhardinge 	if (!feature_rx_copy) {
15430d160211SJeremy Fitzhardinge 		dev_info(&dev->dev,
1544898eb71cSJoe Perches 			 "backend does not support copying receive path\n");
15450d160211SJeremy Fitzhardinge 		return -ENODEV;
15460d160211SJeremy Fitzhardinge 	}
15470d160211SJeremy Fitzhardinge 
1548f502bf2bSIan Campbell 	err = talk_to_netback(np->xbdev, np);
15490d160211SJeremy Fitzhardinge 	if (err)
15500d160211SJeremy Fitzhardinge 		return err;
15510d160211SJeremy Fitzhardinge 
15520d160211SJeremy Fitzhardinge 	xennet_set_features(dev);
15530d160211SJeremy Fitzhardinge 
15540d160211SJeremy Fitzhardinge 	spin_lock_bh(&np->rx_lock);
15550d160211SJeremy Fitzhardinge 	spin_lock_irq(&np->tx_lock);
15560d160211SJeremy Fitzhardinge 
15570d160211SJeremy Fitzhardinge 	/* Step 1: Discard all pending TX packet fragments. */
15580d160211SJeremy Fitzhardinge 	xennet_release_tx_bufs(np);
15590d160211SJeremy Fitzhardinge 
15600d160211SJeremy Fitzhardinge 	/* Step 2: Rebuild the RX buffer freelist and the RX ring itself. */
15610d160211SJeremy Fitzhardinge 	for (requeue_idx = 0, i = 0; i < NET_RX_RING_SIZE; i++) {
15620d160211SJeremy Fitzhardinge 		if (!np->rx_skbs[i])
15630d160211SJeremy Fitzhardinge 			continue;
15640d160211SJeremy Fitzhardinge 
15650d160211SJeremy Fitzhardinge 		skb = np->rx_skbs[requeue_idx] = xennet_get_rx_skb(np, i);
15660d160211SJeremy Fitzhardinge 		ref = np->grant_rx_ref[requeue_idx] = xennet_get_rx_ref(np, i);
15670d160211SJeremy Fitzhardinge 		req = RING_GET_REQUEST(&np->rx, requeue_idx);
15680d160211SJeremy Fitzhardinge 
15690d160211SJeremy Fitzhardinge 		gnttab_grant_foreign_access_ref(
15700d160211SJeremy Fitzhardinge 			ref, np->xbdev->otherend_id,
15710d160211SJeremy Fitzhardinge 			pfn_to_mfn(page_to_pfn(skb_shinfo(skb)->
15720d160211SJeremy Fitzhardinge 					       frags->page)),
15730d160211SJeremy Fitzhardinge 			0);
15740d160211SJeremy Fitzhardinge 		req->gref = ref;
15750d160211SJeremy Fitzhardinge 		req->id   = requeue_idx;
15760d160211SJeremy Fitzhardinge 
15770d160211SJeremy Fitzhardinge 		requeue_idx++;
15780d160211SJeremy Fitzhardinge 	}
15790d160211SJeremy Fitzhardinge 
15800d160211SJeremy Fitzhardinge 	np->rx.req_prod_pvt = requeue_idx;
15810d160211SJeremy Fitzhardinge 
15820d160211SJeremy Fitzhardinge 	/*
15830d160211SJeremy Fitzhardinge 	 * Step 3: All public and private state should now be sane.  Get
15840d160211SJeremy Fitzhardinge 	 * ready to start sending and receiving packets and give the driver
15850d160211SJeremy Fitzhardinge 	 * domain a kick because we've probably just requeued some
15860d160211SJeremy Fitzhardinge 	 * packets.
15870d160211SJeremy Fitzhardinge 	 */
15880d160211SJeremy Fitzhardinge 	netif_carrier_on(np->netdev);
15890d160211SJeremy Fitzhardinge 	notify_remote_via_irq(np->netdev->irq);
15900d160211SJeremy Fitzhardinge 	xennet_tx_buf_gc(dev);
15910d160211SJeremy Fitzhardinge 	xennet_alloc_rx_buffers(dev);
15920d160211SJeremy Fitzhardinge 
15930d160211SJeremy Fitzhardinge 	spin_unlock_irq(&np->tx_lock);
15940d160211SJeremy Fitzhardinge 	spin_unlock_bh(&np->rx_lock);
15950d160211SJeremy Fitzhardinge 
15960d160211SJeremy Fitzhardinge 	return 0;
15970d160211SJeremy Fitzhardinge }
15980d160211SJeremy Fitzhardinge 
15990d160211SJeremy Fitzhardinge /**
16000d160211SJeremy Fitzhardinge  * Callback received when the backend's state changes.
16010d160211SJeremy Fitzhardinge  */
1602f502bf2bSIan Campbell static void netback_changed(struct xenbus_device *dev,
16030d160211SJeremy Fitzhardinge 			    enum xenbus_state backend_state)
16040d160211SJeremy Fitzhardinge {
16051b713e00SGreg Kroah-Hartman 	struct netfront_info *np = dev_get_drvdata(&dev->dev);
16060d160211SJeremy Fitzhardinge 	struct net_device *netdev = np->netdev;
16070d160211SJeremy Fitzhardinge 
16080d160211SJeremy Fitzhardinge 	dev_dbg(&dev->dev, "%s\n", xenbus_strstate(backend_state));
16090d160211SJeremy Fitzhardinge 
16100d160211SJeremy Fitzhardinge 	switch (backend_state) {
16110d160211SJeremy Fitzhardinge 	case XenbusStateInitialising:
16120d160211SJeremy Fitzhardinge 	case XenbusStateInitialised:
1613b78c9512SNoboru Iwamatsu 	case XenbusStateReconfiguring:
1614b78c9512SNoboru Iwamatsu 	case XenbusStateReconfigured:
16150d160211SJeremy Fitzhardinge 	case XenbusStateConnected:
16160d160211SJeremy Fitzhardinge 	case XenbusStateUnknown:
16170d160211SJeremy Fitzhardinge 	case XenbusStateClosed:
16180d160211SJeremy Fitzhardinge 		break;
16190d160211SJeremy Fitzhardinge 
16200d160211SJeremy Fitzhardinge 	case XenbusStateInitWait:
16210d160211SJeremy Fitzhardinge 		if (dev->state != XenbusStateInitialising)
16220d160211SJeremy Fitzhardinge 			break;
16230d160211SJeremy Fitzhardinge 		if (xennet_connect(netdev) != 0)
16240d160211SJeremy Fitzhardinge 			break;
16250d160211SJeremy Fitzhardinge 		xenbus_switch_state(dev, XenbusStateConnected);
162659297067SIan Campbell 		netif_notify_peers(netdev);
16270d160211SJeremy Fitzhardinge 		break;
16280d160211SJeremy Fitzhardinge 
16290d160211SJeremy Fitzhardinge 	case XenbusStateClosing:
16300d160211SJeremy Fitzhardinge 		xenbus_frontend_closed(dev);
16310d160211SJeremy Fitzhardinge 		break;
16320d160211SJeremy Fitzhardinge 	}
16330d160211SJeremy Fitzhardinge }
16340d160211SJeremy Fitzhardinge 
16350fc0b732SStephen Hemminger static const struct ethtool_ops xennet_ethtool_ops =
16360d160211SJeremy Fitzhardinge {
16370d160211SJeremy Fitzhardinge 	.set_tx_csum = ethtool_op_set_tx_csum,
16380d160211SJeremy Fitzhardinge 	.set_sg = xennet_set_sg,
16390d160211SJeremy Fitzhardinge 	.set_tso = xennet_set_tso,
16400d160211SJeremy Fitzhardinge 	.get_link = ethtool_op_get_link,
16410d160211SJeremy Fitzhardinge };
16420d160211SJeremy Fitzhardinge 
16430d160211SJeremy Fitzhardinge #ifdef CONFIG_SYSFS
16440d160211SJeremy Fitzhardinge static ssize_t show_rxbuf_min(struct device *dev,
16450d160211SJeremy Fitzhardinge 			      struct device_attribute *attr, char *buf)
16460d160211SJeremy Fitzhardinge {
16470d160211SJeremy Fitzhardinge 	struct net_device *netdev = to_net_dev(dev);
16480d160211SJeremy Fitzhardinge 	struct netfront_info *info = netdev_priv(netdev);
16490d160211SJeremy Fitzhardinge 
16500d160211SJeremy Fitzhardinge 	return sprintf(buf, "%u\n", info->rx_min_target);
16510d160211SJeremy Fitzhardinge }
16520d160211SJeremy Fitzhardinge 
16530d160211SJeremy Fitzhardinge static ssize_t store_rxbuf_min(struct device *dev,
16540d160211SJeremy Fitzhardinge 			       struct device_attribute *attr,
16550d160211SJeremy Fitzhardinge 			       const char *buf, size_t len)
16560d160211SJeremy Fitzhardinge {
16570d160211SJeremy Fitzhardinge 	struct net_device *netdev = to_net_dev(dev);
16580d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(netdev);
16590d160211SJeremy Fitzhardinge 	char *endp;
16600d160211SJeremy Fitzhardinge 	unsigned long target;
16610d160211SJeremy Fitzhardinge 
16620d160211SJeremy Fitzhardinge 	if (!capable(CAP_NET_ADMIN))
16630d160211SJeremy Fitzhardinge 		return -EPERM;
16640d160211SJeremy Fitzhardinge 
16650d160211SJeremy Fitzhardinge 	target = simple_strtoul(buf, &endp, 0);
16660d160211SJeremy Fitzhardinge 	if (endp == buf)
16670d160211SJeremy Fitzhardinge 		return -EBADMSG;
16680d160211SJeremy Fitzhardinge 
16690d160211SJeremy Fitzhardinge 	if (target < RX_MIN_TARGET)
16700d160211SJeremy Fitzhardinge 		target = RX_MIN_TARGET;
16710d160211SJeremy Fitzhardinge 	if (target > RX_MAX_TARGET)
16720d160211SJeremy Fitzhardinge 		target = RX_MAX_TARGET;
16730d160211SJeremy Fitzhardinge 
16740d160211SJeremy Fitzhardinge 	spin_lock_bh(&np->rx_lock);
16750d160211SJeremy Fitzhardinge 	if (target > np->rx_max_target)
16760d160211SJeremy Fitzhardinge 		np->rx_max_target = target;
16770d160211SJeremy Fitzhardinge 	np->rx_min_target = target;
16780d160211SJeremy Fitzhardinge 	if (target > np->rx_target)
16790d160211SJeremy Fitzhardinge 		np->rx_target = target;
16800d160211SJeremy Fitzhardinge 
16810d160211SJeremy Fitzhardinge 	xennet_alloc_rx_buffers(netdev);
16820d160211SJeremy Fitzhardinge 
16830d160211SJeremy Fitzhardinge 	spin_unlock_bh(&np->rx_lock);
16840d160211SJeremy Fitzhardinge 	return len;
16850d160211SJeremy Fitzhardinge }
16860d160211SJeremy Fitzhardinge 
16870d160211SJeremy Fitzhardinge static ssize_t show_rxbuf_max(struct device *dev,
16880d160211SJeremy Fitzhardinge 			      struct device_attribute *attr, char *buf)
16890d160211SJeremy Fitzhardinge {
16900d160211SJeremy Fitzhardinge 	struct net_device *netdev = to_net_dev(dev);
16910d160211SJeremy Fitzhardinge 	struct netfront_info *info = netdev_priv(netdev);
16920d160211SJeremy Fitzhardinge 
16930d160211SJeremy Fitzhardinge 	return sprintf(buf, "%u\n", info->rx_max_target);
16940d160211SJeremy Fitzhardinge }
16950d160211SJeremy Fitzhardinge 
16960d160211SJeremy Fitzhardinge static ssize_t store_rxbuf_max(struct device *dev,
16970d160211SJeremy Fitzhardinge 			       struct device_attribute *attr,
16980d160211SJeremy Fitzhardinge 			       const char *buf, size_t len)
16990d160211SJeremy Fitzhardinge {
17000d160211SJeremy Fitzhardinge 	struct net_device *netdev = to_net_dev(dev);
17010d160211SJeremy Fitzhardinge 	struct netfront_info *np = netdev_priv(netdev);
17020d160211SJeremy Fitzhardinge 	char *endp;
17030d160211SJeremy Fitzhardinge 	unsigned long target;
17040d160211SJeremy Fitzhardinge 
17050d160211SJeremy Fitzhardinge 	if (!capable(CAP_NET_ADMIN))
17060d160211SJeremy Fitzhardinge 		return -EPERM;
17070d160211SJeremy Fitzhardinge 
17080d160211SJeremy Fitzhardinge 	target = simple_strtoul(buf, &endp, 0);
17090d160211SJeremy Fitzhardinge 	if (endp == buf)
17100d160211SJeremy Fitzhardinge 		return -EBADMSG;
17110d160211SJeremy Fitzhardinge 
17120d160211SJeremy Fitzhardinge 	if (target < RX_MIN_TARGET)
17130d160211SJeremy Fitzhardinge 		target = RX_MIN_TARGET;
17140d160211SJeremy Fitzhardinge 	if (target > RX_MAX_TARGET)
17150d160211SJeremy Fitzhardinge 		target = RX_MAX_TARGET;
17160d160211SJeremy Fitzhardinge 
17170d160211SJeremy Fitzhardinge 	spin_lock_bh(&np->rx_lock);
17180d160211SJeremy Fitzhardinge 	if (target < np->rx_min_target)
17190d160211SJeremy Fitzhardinge 		np->rx_min_target = target;
17200d160211SJeremy Fitzhardinge 	np->rx_max_target = target;
17210d160211SJeremy Fitzhardinge 	if (target < np->rx_target)
17220d160211SJeremy Fitzhardinge 		np->rx_target = target;
17230d160211SJeremy Fitzhardinge 
17240d160211SJeremy Fitzhardinge 	xennet_alloc_rx_buffers(netdev);
17250d160211SJeremy Fitzhardinge 
17260d160211SJeremy Fitzhardinge 	spin_unlock_bh(&np->rx_lock);
17270d160211SJeremy Fitzhardinge 	return len;
17280d160211SJeremy Fitzhardinge }
17290d160211SJeremy Fitzhardinge 
17300d160211SJeremy Fitzhardinge static ssize_t show_rxbuf_cur(struct device *dev,
17310d160211SJeremy Fitzhardinge 			      struct device_attribute *attr, char *buf)
17320d160211SJeremy Fitzhardinge {
17330d160211SJeremy Fitzhardinge 	struct net_device *netdev = to_net_dev(dev);
17340d160211SJeremy Fitzhardinge 	struct netfront_info *info = netdev_priv(netdev);
17350d160211SJeremy Fitzhardinge 
17360d160211SJeremy Fitzhardinge 	return sprintf(buf, "%u\n", info->rx_target);
17370d160211SJeremy Fitzhardinge }
17380d160211SJeremy Fitzhardinge 
17390d160211SJeremy Fitzhardinge static struct device_attribute xennet_attrs[] = {
17400d160211SJeremy Fitzhardinge 	__ATTR(rxbuf_min, S_IRUGO|S_IWUSR, show_rxbuf_min, store_rxbuf_min),
17410d160211SJeremy Fitzhardinge 	__ATTR(rxbuf_max, S_IRUGO|S_IWUSR, show_rxbuf_max, store_rxbuf_max),
17420d160211SJeremy Fitzhardinge 	__ATTR(rxbuf_cur, S_IRUGO, show_rxbuf_cur, NULL),
17430d160211SJeremy Fitzhardinge };
17440d160211SJeremy Fitzhardinge 
17450d160211SJeremy Fitzhardinge static int xennet_sysfs_addif(struct net_device *netdev)
17460d160211SJeremy Fitzhardinge {
17470d160211SJeremy Fitzhardinge 	int i;
17480d160211SJeremy Fitzhardinge 	int err;
17490d160211SJeremy Fitzhardinge 
17500d160211SJeremy Fitzhardinge 	for (i = 0; i < ARRAY_SIZE(xennet_attrs); i++) {
17510d160211SJeremy Fitzhardinge 		err = device_create_file(&netdev->dev,
17520d160211SJeremy Fitzhardinge 					   &xennet_attrs[i]);
17530d160211SJeremy Fitzhardinge 		if (err)
17540d160211SJeremy Fitzhardinge 			goto fail;
17550d160211SJeremy Fitzhardinge 	}
17560d160211SJeremy Fitzhardinge 	return 0;
17570d160211SJeremy Fitzhardinge 
17580d160211SJeremy Fitzhardinge  fail:
17590d160211SJeremy Fitzhardinge 	while (--i >= 0)
17600d160211SJeremy Fitzhardinge 		device_remove_file(&netdev->dev, &xennet_attrs[i]);
17610d160211SJeremy Fitzhardinge 	return err;
17620d160211SJeremy Fitzhardinge }
17630d160211SJeremy Fitzhardinge 
17640d160211SJeremy Fitzhardinge static void xennet_sysfs_delif(struct net_device *netdev)
17650d160211SJeremy Fitzhardinge {
17660d160211SJeremy Fitzhardinge 	int i;
17670d160211SJeremy Fitzhardinge 
17680d160211SJeremy Fitzhardinge 	for (i = 0; i < ARRAY_SIZE(xennet_attrs); i++)
17690d160211SJeremy Fitzhardinge 		device_remove_file(&netdev->dev, &xennet_attrs[i]);
17700d160211SJeremy Fitzhardinge }
17710d160211SJeremy Fitzhardinge 
17720d160211SJeremy Fitzhardinge #endif /* CONFIG_SYSFS */
17730d160211SJeremy Fitzhardinge 
17740d160211SJeremy Fitzhardinge static struct xenbus_device_id netfront_ids[] = {
17750d160211SJeremy Fitzhardinge 	{ "vif" },
17760d160211SJeremy Fitzhardinge 	{ "" }
17770d160211SJeremy Fitzhardinge };
17780d160211SJeremy Fitzhardinge 
17790d160211SJeremy Fitzhardinge 
17800d160211SJeremy Fitzhardinge static int __devexit xennet_remove(struct xenbus_device *dev)
17810d160211SJeremy Fitzhardinge {
17821b713e00SGreg Kroah-Hartman 	struct netfront_info *info = dev_get_drvdata(&dev->dev);
17830d160211SJeremy Fitzhardinge 
17840d160211SJeremy Fitzhardinge 	dev_dbg(&dev->dev, "%s\n", dev->nodename);
17850d160211SJeremy Fitzhardinge 
17860d160211SJeremy Fitzhardinge 	unregister_netdev(info->netdev);
17870d160211SJeremy Fitzhardinge 
17880d160211SJeremy Fitzhardinge 	xennet_disconnect_backend(info);
17890d160211SJeremy Fitzhardinge 
17900d160211SJeremy Fitzhardinge 	del_timer_sync(&info->rx_refill_timer);
17910d160211SJeremy Fitzhardinge 
17920d160211SJeremy Fitzhardinge 	xennet_sysfs_delif(info->netdev);
17930d160211SJeremy Fitzhardinge 
17940d160211SJeremy Fitzhardinge 	free_netdev(info->netdev);
17950d160211SJeremy Fitzhardinge 
17960d160211SJeremy Fitzhardinge 	return 0;
17970d160211SJeremy Fitzhardinge }
17980d160211SJeremy Fitzhardinge 
1799ffb78a26SAl Viro static struct xenbus_driver netfront_driver = {
18000d160211SJeremy Fitzhardinge 	.name = "vif",
18010d160211SJeremy Fitzhardinge 	.owner = THIS_MODULE,
18020d160211SJeremy Fitzhardinge 	.ids = netfront_ids,
18030d160211SJeremy Fitzhardinge 	.probe = netfront_probe,
18040d160211SJeremy Fitzhardinge 	.remove = __devexit_p(xennet_remove),
18050d160211SJeremy Fitzhardinge 	.resume = netfront_resume,
1806f502bf2bSIan Campbell 	.otherend_changed = netback_changed,
18070d160211SJeremy Fitzhardinge };
18080d160211SJeremy Fitzhardinge 
18090d160211SJeremy Fitzhardinge static int __init netif_init(void)
18100d160211SJeremy Fitzhardinge {
18116e833587SJeremy Fitzhardinge 	if (!xen_domain())
18120d160211SJeremy Fitzhardinge 		return -ENODEV;
18130d160211SJeremy Fitzhardinge 
18146e833587SJeremy Fitzhardinge 	if (xen_initial_domain())
18150d160211SJeremy Fitzhardinge 		return 0;
18160d160211SJeremy Fitzhardinge 
18170d160211SJeremy Fitzhardinge 	printk(KERN_INFO "Initialising Xen virtual ethernet driver.\n");
18180d160211SJeremy Fitzhardinge 
1819ffb78a26SAl Viro 	return xenbus_register_frontend(&netfront_driver);
18200d160211SJeremy Fitzhardinge }
18210d160211SJeremy Fitzhardinge module_init(netif_init);
18220d160211SJeremy Fitzhardinge 
18230d160211SJeremy Fitzhardinge 
18240d160211SJeremy Fitzhardinge static void __exit netif_exit(void)
18250d160211SJeremy Fitzhardinge {
18266e833587SJeremy Fitzhardinge 	if (xen_initial_domain())
18270d160211SJeremy Fitzhardinge 		return;
18280d160211SJeremy Fitzhardinge 
1829ffb78a26SAl Viro 	xenbus_unregister_driver(&netfront_driver);
18300d160211SJeremy Fitzhardinge }
18310d160211SJeremy Fitzhardinge module_exit(netif_exit);
18320d160211SJeremy Fitzhardinge 
18330d160211SJeremy Fitzhardinge MODULE_DESCRIPTION("Xen virtual network device frontend");
18340d160211SJeremy Fitzhardinge MODULE_LICENSE("GPL");
1835d2f0c52bSMark McLoughlin MODULE_ALIAS("xen:vif");
18364f93f09bSMark McLoughlin MODULE_ALIAS("xennet");
1837