10d160211SJeremy Fitzhardinge /* 20d160211SJeremy Fitzhardinge * Virtual network driver for conversing with remote driver backends. 30d160211SJeremy Fitzhardinge * 40d160211SJeremy Fitzhardinge * Copyright (c) 2002-2005, K A Fraser 50d160211SJeremy Fitzhardinge * Copyright (c) 2005, XenSource Ltd 60d160211SJeremy Fitzhardinge * 70d160211SJeremy Fitzhardinge * This program is free software; you can redistribute it and/or 80d160211SJeremy Fitzhardinge * modify it under the terms of the GNU General Public License version 2 90d160211SJeremy Fitzhardinge * as published by the Free Software Foundation; or, when distributed 100d160211SJeremy Fitzhardinge * separately from the Linux kernel or incorporated into other 110d160211SJeremy Fitzhardinge * software packages, subject to the following license: 120d160211SJeremy Fitzhardinge * 130d160211SJeremy Fitzhardinge * Permission is hereby granted, free of charge, to any person obtaining a copy 140d160211SJeremy Fitzhardinge * of this source file (the "Software"), to deal in the Software without 150d160211SJeremy Fitzhardinge * restriction, including without limitation the rights to use, copy, modify, 160d160211SJeremy Fitzhardinge * merge, publish, distribute, sublicense, and/or sell copies of the Software, 170d160211SJeremy Fitzhardinge * and to permit persons to whom the Software is furnished to do so, subject to 180d160211SJeremy Fitzhardinge * the following conditions: 190d160211SJeremy Fitzhardinge * 200d160211SJeremy Fitzhardinge * The above copyright notice and this permission notice shall be included in 210d160211SJeremy Fitzhardinge * all copies or substantial portions of the Software. 220d160211SJeremy Fitzhardinge * 230d160211SJeremy Fitzhardinge * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 240d160211SJeremy Fitzhardinge * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 250d160211SJeremy Fitzhardinge * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 260d160211SJeremy Fitzhardinge * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 270d160211SJeremy Fitzhardinge * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 280d160211SJeremy Fitzhardinge * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS 290d160211SJeremy Fitzhardinge * IN THE SOFTWARE. 300d160211SJeremy Fitzhardinge */ 310d160211SJeremy Fitzhardinge 320d160211SJeremy Fitzhardinge #include <linux/module.h> 330d160211SJeremy Fitzhardinge #include <linux/kernel.h> 340d160211SJeremy Fitzhardinge #include <linux/netdevice.h> 350d160211SJeremy Fitzhardinge #include <linux/etherdevice.h> 360d160211SJeremy Fitzhardinge #include <linux/skbuff.h> 370d160211SJeremy Fitzhardinge #include <linux/ethtool.h> 380d160211SJeremy Fitzhardinge #include <linux/if_ether.h> 390d160211SJeremy Fitzhardinge #include <linux/tcp.h> 400d160211SJeremy Fitzhardinge #include <linux/udp.h> 410d160211SJeremy Fitzhardinge #include <linux/moduleparam.h> 420d160211SJeremy Fitzhardinge #include <linux/mm.h> 435a0e3ad6STejun Heo #include <linux/slab.h> 440d160211SJeremy Fitzhardinge #include <net/ip.h> 450d160211SJeremy Fitzhardinge 46ca981633SStefano Stabellini #include <asm/xen/page.h> 471ccbf534SJeremy Fitzhardinge #include <xen/xen.h> 480d160211SJeremy Fitzhardinge #include <xen/xenbus.h> 490d160211SJeremy Fitzhardinge #include <xen/events.h> 500d160211SJeremy Fitzhardinge #include <xen/page.h> 51b9136d20SIgor Mammedov #include <xen/platform_pci.h> 520d160211SJeremy Fitzhardinge #include <xen/grant_table.h> 530d160211SJeremy Fitzhardinge 540d160211SJeremy Fitzhardinge #include <xen/interface/io/netif.h> 550d160211SJeremy Fitzhardinge #include <xen/interface/memory.h> 560d160211SJeremy Fitzhardinge #include <xen/interface/grant_table.h> 570d160211SJeremy Fitzhardinge 580fc0b732SStephen Hemminger static const struct ethtool_ops xennet_ethtool_ops; 590d160211SJeremy Fitzhardinge 600d160211SJeremy Fitzhardinge struct netfront_cb { 613683243bSIan Campbell int pull_to; 620d160211SJeremy Fitzhardinge }; 630d160211SJeremy Fitzhardinge 640d160211SJeremy Fitzhardinge #define NETFRONT_SKB_CB(skb) ((struct netfront_cb *)((skb)->cb)) 650d160211SJeremy Fitzhardinge 660d160211SJeremy Fitzhardinge #define RX_COPY_THRESHOLD 256 670d160211SJeremy Fitzhardinge 680d160211SJeremy Fitzhardinge #define GRANT_INVALID_REF 0 690d160211SJeremy Fitzhardinge 70667c78afSJeremy Fitzhardinge #define NET_TX_RING_SIZE __CONST_RING_SIZE(xen_netif_tx, PAGE_SIZE) 71667c78afSJeremy Fitzhardinge #define NET_RX_RING_SIZE __CONST_RING_SIZE(xen_netif_rx, PAGE_SIZE) 7240206dd9SWei Liu #define TX_MAX_TARGET min_t(int, NET_TX_RING_SIZE, 256) 730d160211SJeremy Fitzhardinge 74e00f85beSstephen hemminger struct netfront_stats { 75e00f85beSstephen hemminger u64 rx_packets; 76e00f85beSstephen hemminger u64 tx_packets; 77e00f85beSstephen hemminger u64 rx_bytes; 78e00f85beSstephen hemminger u64 tx_bytes; 79e00f85beSstephen hemminger struct u64_stats_sync syncp; 80e00f85beSstephen hemminger }; 81e00f85beSstephen hemminger 820d160211SJeremy Fitzhardinge struct netfront_info { 830d160211SJeremy Fitzhardinge struct list_head list; 840d160211SJeremy Fitzhardinge struct net_device *netdev; 850d160211SJeremy Fitzhardinge 86bea3348eSStephen Hemminger struct napi_struct napi; 870d160211SJeremy Fitzhardinge 8884284d3cSJeremy Fitzhardinge unsigned int evtchn; 8984284d3cSJeremy Fitzhardinge struct xenbus_device *xbdev; 900d160211SJeremy Fitzhardinge 910d160211SJeremy Fitzhardinge spinlock_t tx_lock; 9284284d3cSJeremy Fitzhardinge struct xen_netif_tx_front_ring tx; 9384284d3cSJeremy Fitzhardinge int tx_ring_ref; 940d160211SJeremy Fitzhardinge 950d160211SJeremy Fitzhardinge /* 960d160211SJeremy Fitzhardinge * {tx,rx}_skbs store outstanding skbuffs. Free tx_skb entries 970d160211SJeremy Fitzhardinge * are linked from tx_skb_freelist through skb_entry.link. 980d160211SJeremy Fitzhardinge * 990d160211SJeremy Fitzhardinge * NB. Freelist index entries are always going to be less than 1000d160211SJeremy Fitzhardinge * PAGE_OFFSET, whereas pointers to skbs will always be equal or 1010d160211SJeremy Fitzhardinge * greater than PAGE_OFFSET: we use this property to distinguish 1020d160211SJeremy Fitzhardinge * them. 1030d160211SJeremy Fitzhardinge */ 1040d160211SJeremy Fitzhardinge union skb_entry { 1050d160211SJeremy Fitzhardinge struct sk_buff *skb; 1061ffb40b8SIsaku Yamahata unsigned long link; 1070d160211SJeremy Fitzhardinge } tx_skbs[NET_TX_RING_SIZE]; 1080d160211SJeremy Fitzhardinge grant_ref_t gref_tx_head; 1090d160211SJeremy Fitzhardinge grant_ref_t grant_tx_ref[NET_TX_RING_SIZE]; 1100d160211SJeremy Fitzhardinge unsigned tx_skb_freelist; 1110d160211SJeremy Fitzhardinge 11284284d3cSJeremy Fitzhardinge spinlock_t rx_lock ____cacheline_aligned_in_smp; 11384284d3cSJeremy Fitzhardinge struct xen_netif_rx_front_ring rx; 11484284d3cSJeremy Fitzhardinge int rx_ring_ref; 11584284d3cSJeremy Fitzhardinge 11684284d3cSJeremy Fitzhardinge /* Receive-ring batched refills. */ 11784284d3cSJeremy Fitzhardinge #define RX_MIN_TARGET 8 11884284d3cSJeremy Fitzhardinge #define RX_DFL_MIN_TARGET 64 11984284d3cSJeremy Fitzhardinge #define RX_MAX_TARGET min_t(int, NET_RX_RING_SIZE, 256) 12084284d3cSJeremy Fitzhardinge unsigned rx_min_target, rx_max_target, rx_target; 12184284d3cSJeremy Fitzhardinge struct sk_buff_head rx_batch; 12284284d3cSJeremy Fitzhardinge 12384284d3cSJeremy Fitzhardinge struct timer_list rx_refill_timer; 12484284d3cSJeremy Fitzhardinge 1250d160211SJeremy Fitzhardinge struct sk_buff *rx_skbs[NET_RX_RING_SIZE]; 1260d160211SJeremy Fitzhardinge grant_ref_t gref_rx_head; 1270d160211SJeremy Fitzhardinge grant_ref_t grant_rx_ref[NET_RX_RING_SIZE]; 1280d160211SJeremy Fitzhardinge 1290d160211SJeremy Fitzhardinge unsigned long rx_pfn_array[NET_RX_RING_SIZE]; 1300d160211SJeremy Fitzhardinge struct multicall_entry rx_mcl[NET_RX_RING_SIZE+1]; 1310d160211SJeremy Fitzhardinge struct mmu_update rx_mmu[NET_RX_RING_SIZE]; 132e0ce4af9SIan Campbell 133e0ce4af9SIan Campbell /* Statistics */ 134e00f85beSstephen hemminger struct netfront_stats __percpu *stats; 135e00f85beSstephen hemminger 136e9a799eaSIan Campbell unsigned long rx_gso_checksum_fixup; 1370d160211SJeremy Fitzhardinge }; 1380d160211SJeremy Fitzhardinge 1390d160211SJeremy Fitzhardinge struct netfront_rx_info { 1400d160211SJeremy Fitzhardinge struct xen_netif_rx_response rx; 1410d160211SJeremy Fitzhardinge struct xen_netif_extra_info extras[XEN_NETIF_EXTRA_TYPE_MAX - 1]; 1420d160211SJeremy Fitzhardinge }; 1430d160211SJeremy Fitzhardinge 1441ffb40b8SIsaku Yamahata static void skb_entry_set_link(union skb_entry *list, unsigned short id) 1451ffb40b8SIsaku Yamahata { 1461ffb40b8SIsaku Yamahata list->link = id; 1471ffb40b8SIsaku Yamahata } 1481ffb40b8SIsaku Yamahata 1491ffb40b8SIsaku Yamahata static int skb_entry_is_link(const union skb_entry *list) 1501ffb40b8SIsaku Yamahata { 1511ffb40b8SIsaku Yamahata BUILD_BUG_ON(sizeof(list->skb) != sizeof(list->link)); 152807540baSEric Dumazet return (unsigned long)list->skb < PAGE_OFFSET; 1531ffb40b8SIsaku Yamahata } 1541ffb40b8SIsaku Yamahata 1550d160211SJeremy Fitzhardinge /* 1560d160211SJeremy Fitzhardinge * Access macros for acquiring freeing slots in tx_skbs[]. 1570d160211SJeremy Fitzhardinge */ 1580d160211SJeremy Fitzhardinge 1590d160211SJeremy Fitzhardinge static void add_id_to_freelist(unsigned *head, union skb_entry *list, 1600d160211SJeremy Fitzhardinge unsigned short id) 1610d160211SJeremy Fitzhardinge { 1621ffb40b8SIsaku Yamahata skb_entry_set_link(&list[id], *head); 1630d160211SJeremy Fitzhardinge *head = id; 1640d160211SJeremy Fitzhardinge } 1650d160211SJeremy Fitzhardinge 1660d160211SJeremy Fitzhardinge static unsigned short get_id_from_freelist(unsigned *head, 1670d160211SJeremy Fitzhardinge union skb_entry *list) 1680d160211SJeremy Fitzhardinge { 1690d160211SJeremy Fitzhardinge unsigned int id = *head; 1700d160211SJeremy Fitzhardinge *head = list[id].link; 1710d160211SJeremy Fitzhardinge return id; 1720d160211SJeremy Fitzhardinge } 1730d160211SJeremy Fitzhardinge 1740d160211SJeremy Fitzhardinge static int xennet_rxidx(RING_IDX idx) 1750d160211SJeremy Fitzhardinge { 1760d160211SJeremy Fitzhardinge return idx & (NET_RX_RING_SIZE - 1); 1770d160211SJeremy Fitzhardinge } 1780d160211SJeremy Fitzhardinge 1790d160211SJeremy Fitzhardinge static struct sk_buff *xennet_get_rx_skb(struct netfront_info *np, 1800d160211SJeremy Fitzhardinge RING_IDX ri) 1810d160211SJeremy Fitzhardinge { 1820d160211SJeremy Fitzhardinge int i = xennet_rxidx(ri); 1830d160211SJeremy Fitzhardinge struct sk_buff *skb = np->rx_skbs[i]; 1840d160211SJeremy Fitzhardinge np->rx_skbs[i] = NULL; 1850d160211SJeremy Fitzhardinge return skb; 1860d160211SJeremy Fitzhardinge } 1870d160211SJeremy Fitzhardinge 1880d160211SJeremy Fitzhardinge static grant_ref_t xennet_get_rx_ref(struct netfront_info *np, 1890d160211SJeremy Fitzhardinge RING_IDX ri) 1900d160211SJeremy Fitzhardinge { 1910d160211SJeremy Fitzhardinge int i = xennet_rxidx(ri); 1920d160211SJeremy Fitzhardinge grant_ref_t ref = np->grant_rx_ref[i]; 1930d160211SJeremy Fitzhardinge np->grant_rx_ref[i] = GRANT_INVALID_REF; 1940d160211SJeremy Fitzhardinge return ref; 1950d160211SJeremy Fitzhardinge } 1960d160211SJeremy Fitzhardinge 1970d160211SJeremy Fitzhardinge #ifdef CONFIG_SYSFS 1980d160211SJeremy Fitzhardinge static int xennet_sysfs_addif(struct net_device *netdev); 1990d160211SJeremy Fitzhardinge static void xennet_sysfs_delif(struct net_device *netdev); 2000d160211SJeremy Fitzhardinge #else /* !CONFIG_SYSFS */ 2010d160211SJeremy Fitzhardinge #define xennet_sysfs_addif(dev) (0) 2020d160211SJeremy Fitzhardinge #define xennet_sysfs_delif(dev) do { } while (0) 2030d160211SJeremy Fitzhardinge #endif 2040d160211SJeremy Fitzhardinge 2053ad9b358SMichał Mirosław static bool xennet_can_sg(struct net_device *dev) 2060d160211SJeremy Fitzhardinge { 2073ad9b358SMichał Mirosław return dev->features & NETIF_F_SG; 2080d160211SJeremy Fitzhardinge } 2090d160211SJeremy Fitzhardinge 2100d160211SJeremy Fitzhardinge 2110d160211SJeremy Fitzhardinge static void rx_refill_timeout(unsigned long data) 2120d160211SJeremy Fitzhardinge { 2130d160211SJeremy Fitzhardinge struct net_device *dev = (struct net_device *)data; 214bea3348eSStephen Hemminger struct netfront_info *np = netdev_priv(dev); 215288379f0SBen Hutchings napi_schedule(&np->napi); 2160d160211SJeremy Fitzhardinge } 2170d160211SJeremy Fitzhardinge 2180d160211SJeremy Fitzhardinge static int netfront_tx_slot_available(struct netfront_info *np) 2190d160211SJeremy Fitzhardinge { 220807540baSEric Dumazet return (np->tx.req_prod_pvt - np->tx.rsp_cons) < 221807540baSEric Dumazet (TX_MAX_TARGET - MAX_SKB_FRAGS - 2); 2220d160211SJeremy Fitzhardinge } 2230d160211SJeremy Fitzhardinge 2240d160211SJeremy Fitzhardinge static void xennet_maybe_wake_tx(struct net_device *dev) 2250d160211SJeremy Fitzhardinge { 2260d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 2270d160211SJeremy Fitzhardinge 2280d160211SJeremy Fitzhardinge if (unlikely(netif_queue_stopped(dev)) && 2290d160211SJeremy Fitzhardinge netfront_tx_slot_available(np) && 2300d160211SJeremy Fitzhardinge likely(netif_running(dev))) 2310d160211SJeremy Fitzhardinge netif_wake_queue(dev); 2320d160211SJeremy Fitzhardinge } 2330d160211SJeremy Fitzhardinge 2340d160211SJeremy Fitzhardinge static void xennet_alloc_rx_buffers(struct net_device *dev) 2350d160211SJeremy Fitzhardinge { 2360d160211SJeremy Fitzhardinge unsigned short id; 2370d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 2380d160211SJeremy Fitzhardinge struct sk_buff *skb; 2390d160211SJeremy Fitzhardinge struct page *page; 2400d160211SJeremy Fitzhardinge int i, batch_target, notify; 2410d160211SJeremy Fitzhardinge RING_IDX req_prod = np->rx.req_prod_pvt; 2420d160211SJeremy Fitzhardinge grant_ref_t ref; 2430d160211SJeremy Fitzhardinge unsigned long pfn; 2440d160211SJeremy Fitzhardinge void *vaddr; 2450d160211SJeremy Fitzhardinge struct xen_netif_rx_request *req; 2460d160211SJeremy Fitzhardinge 2470d160211SJeremy Fitzhardinge if (unlikely(!netif_carrier_ok(dev))) 2480d160211SJeremy Fitzhardinge return; 2490d160211SJeremy Fitzhardinge 2500d160211SJeremy Fitzhardinge /* 2510d160211SJeremy Fitzhardinge * Allocate skbuffs greedily, even though we batch updates to the 2520d160211SJeremy Fitzhardinge * receive ring. This creates a less bursty demand on the memory 2530d160211SJeremy Fitzhardinge * allocator, so should reduce the chance of failed allocation requests 2540d160211SJeremy Fitzhardinge * both for ourself and for other kernel subsystems. 2550d160211SJeremy Fitzhardinge */ 2560d160211SJeremy Fitzhardinge batch_target = np->rx_target - (req_prod - np->rx.rsp_cons); 2570d160211SJeremy Fitzhardinge for (i = skb_queue_len(&np->rx_batch); i < batch_target; i++) { 258617a20bbSIsaku Yamahata skb = __netdev_alloc_skb(dev, RX_COPY_THRESHOLD + NET_IP_ALIGN, 2590d160211SJeremy Fitzhardinge GFP_ATOMIC | __GFP_NOWARN); 2600d160211SJeremy Fitzhardinge if (unlikely(!skb)) 2610d160211SJeremy Fitzhardinge goto no_skb; 2620d160211SJeremy Fitzhardinge 263617a20bbSIsaku Yamahata /* Align ip header to a 16 bytes boundary */ 264617a20bbSIsaku Yamahata skb_reserve(skb, NET_IP_ALIGN); 265617a20bbSIsaku Yamahata 2660d160211SJeremy Fitzhardinge page = alloc_page(GFP_ATOMIC | __GFP_NOWARN); 2670d160211SJeremy Fitzhardinge if (!page) { 2680d160211SJeremy Fitzhardinge kfree_skb(skb); 2690d160211SJeremy Fitzhardinge no_skb: 2700d160211SJeremy Fitzhardinge /* Any skbuffs queued for refill? Force them out. */ 2710d160211SJeremy Fitzhardinge if (i != 0) 2720d160211SJeremy Fitzhardinge goto refill; 2730d160211SJeremy Fitzhardinge /* Could not allocate any skbuffs. Try again later. */ 2740d160211SJeremy Fitzhardinge mod_timer(&np->rx_refill_timer, 2750d160211SJeremy Fitzhardinge jiffies + (HZ/10)); 2760d160211SJeremy Fitzhardinge break; 2770d160211SJeremy Fitzhardinge } 2780d160211SJeremy Fitzhardinge 27901c68026SIan Campbell __skb_fill_page_desc(skb, 0, page, 0, 0); 2800d160211SJeremy Fitzhardinge skb_shinfo(skb)->nr_frags = 1; 2810d160211SJeremy Fitzhardinge __skb_queue_tail(&np->rx_batch, skb); 2820d160211SJeremy Fitzhardinge } 2830d160211SJeremy Fitzhardinge 2840d160211SJeremy Fitzhardinge /* Is the batch large enough to be worthwhile? */ 2850d160211SJeremy Fitzhardinge if (i < (np->rx_target/2)) { 2860d160211SJeremy Fitzhardinge if (req_prod > np->rx.sring->req_prod) 2870d160211SJeremy Fitzhardinge goto push; 2880d160211SJeremy Fitzhardinge return; 2890d160211SJeremy Fitzhardinge } 2900d160211SJeremy Fitzhardinge 2910d160211SJeremy Fitzhardinge /* Adjust our fill target if we risked running out of buffers. */ 2920d160211SJeremy Fitzhardinge if (((req_prod - np->rx.sring->rsp_prod) < (np->rx_target / 4)) && 2930d160211SJeremy Fitzhardinge ((np->rx_target *= 2) > np->rx_max_target)) 2940d160211SJeremy Fitzhardinge np->rx_target = np->rx_max_target; 2950d160211SJeremy Fitzhardinge 2960d160211SJeremy Fitzhardinge refill: 2975dcddfaeSJeremy Fitzhardinge for (i = 0; ; i++) { 2980d160211SJeremy Fitzhardinge skb = __skb_dequeue(&np->rx_batch); 2990d160211SJeremy Fitzhardinge if (skb == NULL) 3000d160211SJeremy Fitzhardinge break; 3010d160211SJeremy Fitzhardinge 3020d160211SJeremy Fitzhardinge skb->dev = dev; 3030d160211SJeremy Fitzhardinge 3040d160211SJeremy Fitzhardinge id = xennet_rxidx(req_prod + i); 3050d160211SJeremy Fitzhardinge 3060d160211SJeremy Fitzhardinge BUG_ON(np->rx_skbs[id]); 3070d160211SJeremy Fitzhardinge np->rx_skbs[id] = skb; 3080d160211SJeremy Fitzhardinge 3090d160211SJeremy Fitzhardinge ref = gnttab_claim_grant_reference(&np->gref_rx_head); 3100d160211SJeremy Fitzhardinge BUG_ON((signed short)ref < 0); 3110d160211SJeremy Fitzhardinge np->grant_rx_ref[id] = ref; 3120d160211SJeremy Fitzhardinge 31301c68026SIan Campbell pfn = page_to_pfn(skb_frag_page(&skb_shinfo(skb)->frags[0])); 31401c68026SIan Campbell vaddr = page_address(skb_frag_page(&skb_shinfo(skb)->frags[0])); 3150d160211SJeremy Fitzhardinge 3160d160211SJeremy Fitzhardinge req = RING_GET_REQUEST(&np->rx, req_prod + i); 3170d160211SJeremy Fitzhardinge gnttab_grant_foreign_access_ref(ref, 3180d160211SJeremy Fitzhardinge np->xbdev->otherend_id, 3190d160211SJeremy Fitzhardinge pfn_to_mfn(pfn), 3200d160211SJeremy Fitzhardinge 0); 3210d160211SJeremy Fitzhardinge 3220d160211SJeremy Fitzhardinge req->id = id; 3230d160211SJeremy Fitzhardinge req->gref = ref; 3240d160211SJeremy Fitzhardinge } 3250d160211SJeremy Fitzhardinge 3260d160211SJeremy Fitzhardinge wmb(); /* barrier so backend seens requests */ 3270d160211SJeremy Fitzhardinge 3280d160211SJeremy Fitzhardinge /* Above is a suitable barrier to ensure backend will see requests. */ 3290d160211SJeremy Fitzhardinge np->rx.req_prod_pvt = req_prod + i; 3300d160211SJeremy Fitzhardinge push: 3310d160211SJeremy Fitzhardinge RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&np->rx, notify); 3320d160211SJeremy Fitzhardinge if (notify) 3330d160211SJeremy Fitzhardinge notify_remote_via_irq(np->netdev->irq); 3340d160211SJeremy Fitzhardinge } 3350d160211SJeremy Fitzhardinge 3360d160211SJeremy Fitzhardinge static int xennet_open(struct net_device *dev) 3370d160211SJeremy Fitzhardinge { 3380d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 3390d160211SJeremy Fitzhardinge 340bea3348eSStephen Hemminger napi_enable(&np->napi); 341bea3348eSStephen Hemminger 3420d160211SJeremy Fitzhardinge spin_lock_bh(&np->rx_lock); 3430d160211SJeremy Fitzhardinge if (netif_carrier_ok(dev)) { 3440d160211SJeremy Fitzhardinge xennet_alloc_rx_buffers(dev); 3450d160211SJeremy Fitzhardinge np->rx.sring->rsp_event = np->rx.rsp_cons + 1; 3460d160211SJeremy Fitzhardinge if (RING_HAS_UNCONSUMED_RESPONSES(&np->rx)) 347288379f0SBen Hutchings napi_schedule(&np->napi); 3480d160211SJeremy Fitzhardinge } 3490d160211SJeremy Fitzhardinge spin_unlock_bh(&np->rx_lock); 3500d160211SJeremy Fitzhardinge 3510b1ab1b8SEduardo Habkost netif_start_queue(dev); 3520d160211SJeremy Fitzhardinge 3530d160211SJeremy Fitzhardinge return 0; 3540d160211SJeremy Fitzhardinge } 3550d160211SJeremy Fitzhardinge 3560d160211SJeremy Fitzhardinge static void xennet_tx_buf_gc(struct net_device *dev) 3570d160211SJeremy Fitzhardinge { 3580d160211SJeremy Fitzhardinge RING_IDX cons, prod; 3590d160211SJeremy Fitzhardinge unsigned short id; 3600d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 3610d160211SJeremy Fitzhardinge struct sk_buff *skb; 3620d160211SJeremy Fitzhardinge 3630d160211SJeremy Fitzhardinge BUG_ON(!netif_carrier_ok(dev)); 3640d160211SJeremy Fitzhardinge 3650d160211SJeremy Fitzhardinge do { 3660d160211SJeremy Fitzhardinge prod = np->tx.sring->rsp_prod; 3670d160211SJeremy Fitzhardinge rmb(); /* Ensure we see responses up to 'rp'. */ 3680d160211SJeremy Fitzhardinge 3690d160211SJeremy Fitzhardinge for (cons = np->tx.rsp_cons; cons != prod; cons++) { 3700d160211SJeremy Fitzhardinge struct xen_netif_tx_response *txrsp; 3710d160211SJeremy Fitzhardinge 3720d160211SJeremy Fitzhardinge txrsp = RING_GET_RESPONSE(&np->tx, cons); 373f942dc25SIan Campbell if (txrsp->status == XEN_NETIF_RSP_NULL) 3740d160211SJeremy Fitzhardinge continue; 3750d160211SJeremy Fitzhardinge 3760d160211SJeremy Fitzhardinge id = txrsp->id; 3770d160211SJeremy Fitzhardinge skb = np->tx_skbs[id].skb; 3780d160211SJeremy Fitzhardinge if (unlikely(gnttab_query_foreign_access( 3790d160211SJeremy Fitzhardinge np->grant_tx_ref[id]) != 0)) { 3800d160211SJeremy Fitzhardinge printk(KERN_ALERT "xennet_tx_buf_gc: warning " 3810d160211SJeremy Fitzhardinge "-- grant still in use by backend " 3820d160211SJeremy Fitzhardinge "domain.\n"); 3830d160211SJeremy Fitzhardinge BUG(); 3840d160211SJeremy Fitzhardinge } 3850d160211SJeremy Fitzhardinge gnttab_end_foreign_access_ref( 3860d160211SJeremy Fitzhardinge np->grant_tx_ref[id], GNTMAP_readonly); 3870d160211SJeremy Fitzhardinge gnttab_release_grant_reference( 3880d160211SJeremy Fitzhardinge &np->gref_tx_head, np->grant_tx_ref[id]); 3890d160211SJeremy Fitzhardinge np->grant_tx_ref[id] = GRANT_INVALID_REF; 3900d160211SJeremy Fitzhardinge add_id_to_freelist(&np->tx_skb_freelist, np->tx_skbs, id); 3910d160211SJeremy Fitzhardinge dev_kfree_skb_irq(skb); 3920d160211SJeremy Fitzhardinge } 3930d160211SJeremy Fitzhardinge 3940d160211SJeremy Fitzhardinge np->tx.rsp_cons = prod; 3950d160211SJeremy Fitzhardinge 3960d160211SJeremy Fitzhardinge /* 3970d160211SJeremy Fitzhardinge * Set a new event, then check for race with update of tx_cons. 3980d160211SJeremy Fitzhardinge * Note that it is essential to schedule a callback, no matter 3990d160211SJeremy Fitzhardinge * how few buffers are pending. Even if there is space in the 4000d160211SJeremy Fitzhardinge * transmit ring, higher layers may be blocked because too much 4010d160211SJeremy Fitzhardinge * data is outstanding: in such cases notification from Xen is 4020d160211SJeremy Fitzhardinge * likely to be the only kick that we'll get. 4030d160211SJeremy Fitzhardinge */ 4040d160211SJeremy Fitzhardinge np->tx.sring->rsp_event = 4050d160211SJeremy Fitzhardinge prod + ((np->tx.sring->req_prod - prod) >> 1) + 1; 4060d160211SJeremy Fitzhardinge mb(); /* update shared area */ 4070d160211SJeremy Fitzhardinge } while ((cons == prod) && (prod != np->tx.sring->rsp_prod)); 4080d160211SJeremy Fitzhardinge 4090d160211SJeremy Fitzhardinge xennet_maybe_wake_tx(dev); 4100d160211SJeremy Fitzhardinge } 4110d160211SJeremy Fitzhardinge 4120d160211SJeremy Fitzhardinge static void xennet_make_frags(struct sk_buff *skb, struct net_device *dev, 4130d160211SJeremy Fitzhardinge struct xen_netif_tx_request *tx) 4140d160211SJeremy Fitzhardinge { 4150d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 4160d160211SJeremy Fitzhardinge char *data = skb->data; 4170d160211SJeremy Fitzhardinge unsigned long mfn; 4180d160211SJeremy Fitzhardinge RING_IDX prod = np->tx.req_prod_pvt; 4190d160211SJeremy Fitzhardinge int frags = skb_shinfo(skb)->nr_frags; 4200d160211SJeremy Fitzhardinge unsigned int offset = offset_in_page(data); 4210d160211SJeremy Fitzhardinge unsigned int len = skb_headlen(skb); 4220d160211SJeremy Fitzhardinge unsigned int id; 4230d160211SJeremy Fitzhardinge grant_ref_t ref; 4240d160211SJeremy Fitzhardinge int i; 4250d160211SJeremy Fitzhardinge 4260d160211SJeremy Fitzhardinge /* While the header overlaps a page boundary (including being 4270d160211SJeremy Fitzhardinge larger than a page), split it it into page-sized chunks. */ 4280d160211SJeremy Fitzhardinge while (len > PAGE_SIZE - offset) { 4290d160211SJeremy Fitzhardinge tx->size = PAGE_SIZE - offset; 430f942dc25SIan Campbell tx->flags |= XEN_NETTXF_more_data; 4310d160211SJeremy Fitzhardinge len -= tx->size; 4320d160211SJeremy Fitzhardinge data += tx->size; 4330d160211SJeremy Fitzhardinge offset = 0; 4340d160211SJeremy Fitzhardinge 4350d160211SJeremy Fitzhardinge id = get_id_from_freelist(&np->tx_skb_freelist, np->tx_skbs); 4360d160211SJeremy Fitzhardinge np->tx_skbs[id].skb = skb_get(skb); 4370d160211SJeremy Fitzhardinge tx = RING_GET_REQUEST(&np->tx, prod++); 4380d160211SJeremy Fitzhardinge tx->id = id; 4390d160211SJeremy Fitzhardinge ref = gnttab_claim_grant_reference(&np->gref_tx_head); 4400d160211SJeremy Fitzhardinge BUG_ON((signed short)ref < 0); 4410d160211SJeremy Fitzhardinge 4420d160211SJeremy Fitzhardinge mfn = virt_to_mfn(data); 4430d160211SJeremy Fitzhardinge gnttab_grant_foreign_access_ref(ref, np->xbdev->otherend_id, 4440d160211SJeremy Fitzhardinge mfn, GNTMAP_readonly); 4450d160211SJeremy Fitzhardinge 4460d160211SJeremy Fitzhardinge tx->gref = np->grant_tx_ref[id] = ref; 4470d160211SJeremy Fitzhardinge tx->offset = offset; 4480d160211SJeremy Fitzhardinge tx->size = len; 4490d160211SJeremy Fitzhardinge tx->flags = 0; 4500d160211SJeremy Fitzhardinge } 4510d160211SJeremy Fitzhardinge 4520d160211SJeremy Fitzhardinge /* Grant backend access to each skb fragment page. */ 4530d160211SJeremy Fitzhardinge for (i = 0; i < frags; i++) { 4540d160211SJeremy Fitzhardinge skb_frag_t *frag = skb_shinfo(skb)->frags + i; 4550d160211SJeremy Fitzhardinge 456f942dc25SIan Campbell tx->flags |= XEN_NETTXF_more_data; 4570d160211SJeremy Fitzhardinge 4580d160211SJeremy Fitzhardinge id = get_id_from_freelist(&np->tx_skb_freelist, np->tx_skbs); 4590d160211SJeremy Fitzhardinge np->tx_skbs[id].skb = skb_get(skb); 4600d160211SJeremy Fitzhardinge tx = RING_GET_REQUEST(&np->tx, prod++); 4610d160211SJeremy Fitzhardinge tx->id = id; 4620d160211SJeremy Fitzhardinge ref = gnttab_claim_grant_reference(&np->gref_tx_head); 4630d160211SJeremy Fitzhardinge BUG_ON((signed short)ref < 0); 4640d160211SJeremy Fitzhardinge 46501c68026SIan Campbell mfn = pfn_to_mfn(page_to_pfn(skb_frag_page(frag))); 4660d160211SJeremy Fitzhardinge gnttab_grant_foreign_access_ref(ref, np->xbdev->otherend_id, 4670d160211SJeremy Fitzhardinge mfn, GNTMAP_readonly); 4680d160211SJeremy Fitzhardinge 4690d160211SJeremy Fitzhardinge tx->gref = np->grant_tx_ref[id] = ref; 4700d160211SJeremy Fitzhardinge tx->offset = frag->page_offset; 4719e903e08SEric Dumazet tx->size = skb_frag_size(frag); 4720d160211SJeremy Fitzhardinge tx->flags = 0; 4730d160211SJeremy Fitzhardinge } 4740d160211SJeremy Fitzhardinge 4750d160211SJeremy Fitzhardinge np->tx.req_prod_pvt = prod; 4760d160211SJeremy Fitzhardinge } 4770d160211SJeremy Fitzhardinge 4780d160211SJeremy Fitzhardinge static int xennet_start_xmit(struct sk_buff *skb, struct net_device *dev) 4790d160211SJeremy Fitzhardinge { 4800d160211SJeremy Fitzhardinge unsigned short id; 4810d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 482e00f85beSstephen hemminger struct netfront_stats *stats = this_cpu_ptr(np->stats); 4830d160211SJeremy Fitzhardinge struct xen_netif_tx_request *tx; 4840d160211SJeremy Fitzhardinge struct xen_netif_extra_info *extra; 4850d160211SJeremy Fitzhardinge char *data = skb->data; 4860d160211SJeremy Fitzhardinge RING_IDX i; 4870d160211SJeremy Fitzhardinge grant_ref_t ref; 4880d160211SJeremy Fitzhardinge unsigned long mfn; 4890d160211SJeremy Fitzhardinge int notify; 4900d160211SJeremy Fitzhardinge int frags = skb_shinfo(skb)->nr_frags; 4910d160211SJeremy Fitzhardinge unsigned int offset = offset_in_page(data); 4920d160211SJeremy Fitzhardinge unsigned int len = skb_headlen(skb); 493cf66f9d4SKonrad Rzeszutek Wilk unsigned long flags; 4940d160211SJeremy Fitzhardinge 49543526370SJulia Lawall frags += DIV_ROUND_UP(offset + len, PAGE_SIZE); 4960d160211SJeremy Fitzhardinge if (unlikely(frags > MAX_SKB_FRAGS + 1)) { 4970d160211SJeremy Fitzhardinge printk(KERN_ALERT "xennet: skb rides the rocket: %d frags\n", 4980d160211SJeremy Fitzhardinge frags); 4990d160211SJeremy Fitzhardinge dump_stack(); 5000d160211SJeremy Fitzhardinge goto drop; 5010d160211SJeremy Fitzhardinge } 5020d160211SJeremy Fitzhardinge 503cf66f9d4SKonrad Rzeszutek Wilk spin_lock_irqsave(&np->tx_lock, flags); 5040d160211SJeremy Fitzhardinge 5050d160211SJeremy Fitzhardinge if (unlikely(!netif_carrier_ok(dev) || 5060d160211SJeremy Fitzhardinge (frags > 1 && !xennet_can_sg(dev)) || 507fc741216SJesse Gross netif_needs_gso(skb, netif_skb_features(skb)))) { 508cf66f9d4SKonrad Rzeszutek Wilk spin_unlock_irqrestore(&np->tx_lock, flags); 5090d160211SJeremy Fitzhardinge goto drop; 5100d160211SJeremy Fitzhardinge } 5110d160211SJeremy Fitzhardinge 5120d160211SJeremy Fitzhardinge i = np->tx.req_prod_pvt; 5130d160211SJeremy Fitzhardinge 5140d160211SJeremy Fitzhardinge id = get_id_from_freelist(&np->tx_skb_freelist, np->tx_skbs); 5150d160211SJeremy Fitzhardinge np->tx_skbs[id].skb = skb; 5160d160211SJeremy Fitzhardinge 5170d160211SJeremy Fitzhardinge tx = RING_GET_REQUEST(&np->tx, i); 5180d160211SJeremy Fitzhardinge 5190d160211SJeremy Fitzhardinge tx->id = id; 5200d160211SJeremy Fitzhardinge ref = gnttab_claim_grant_reference(&np->gref_tx_head); 5210d160211SJeremy Fitzhardinge BUG_ON((signed short)ref < 0); 5220d160211SJeremy Fitzhardinge mfn = virt_to_mfn(data); 5230d160211SJeremy Fitzhardinge gnttab_grant_foreign_access_ref( 5240d160211SJeremy Fitzhardinge ref, np->xbdev->otherend_id, mfn, GNTMAP_readonly); 5250d160211SJeremy Fitzhardinge tx->gref = np->grant_tx_ref[id] = ref; 5260d160211SJeremy Fitzhardinge tx->offset = offset; 5270d160211SJeremy Fitzhardinge tx->size = len; 5280d160211SJeremy Fitzhardinge extra = NULL; 5290d160211SJeremy Fitzhardinge 5300d160211SJeremy Fitzhardinge tx->flags = 0; 5310d160211SJeremy Fitzhardinge if (skb->ip_summed == CHECKSUM_PARTIAL) 5320d160211SJeremy Fitzhardinge /* local packet? */ 533f942dc25SIan Campbell tx->flags |= XEN_NETTXF_csum_blank | XEN_NETTXF_data_validated; 5340d160211SJeremy Fitzhardinge else if (skb->ip_summed == CHECKSUM_UNNECESSARY) 5350d160211SJeremy Fitzhardinge /* remote but checksummed. */ 536f942dc25SIan Campbell tx->flags |= XEN_NETTXF_data_validated; 5370d160211SJeremy Fitzhardinge 5380d160211SJeremy Fitzhardinge if (skb_shinfo(skb)->gso_size) { 5390d160211SJeremy Fitzhardinge struct xen_netif_extra_info *gso; 5400d160211SJeremy Fitzhardinge 5410d160211SJeremy Fitzhardinge gso = (struct xen_netif_extra_info *) 5420d160211SJeremy Fitzhardinge RING_GET_REQUEST(&np->tx, ++i); 5430d160211SJeremy Fitzhardinge 5440d160211SJeremy Fitzhardinge if (extra) 5450d160211SJeremy Fitzhardinge extra->flags |= XEN_NETIF_EXTRA_FLAG_MORE; 5460d160211SJeremy Fitzhardinge else 547f942dc25SIan Campbell tx->flags |= XEN_NETTXF_extra_info; 5480d160211SJeremy Fitzhardinge 5490d160211SJeremy Fitzhardinge gso->u.gso.size = skb_shinfo(skb)->gso_size; 5500d160211SJeremy Fitzhardinge gso->u.gso.type = XEN_NETIF_GSO_TYPE_TCPV4; 5510d160211SJeremy Fitzhardinge gso->u.gso.pad = 0; 5520d160211SJeremy Fitzhardinge gso->u.gso.features = 0; 5530d160211SJeremy Fitzhardinge 5540d160211SJeremy Fitzhardinge gso->type = XEN_NETIF_EXTRA_TYPE_GSO; 5550d160211SJeremy Fitzhardinge gso->flags = 0; 5560d160211SJeremy Fitzhardinge extra = gso; 5570d160211SJeremy Fitzhardinge } 5580d160211SJeremy Fitzhardinge 5590d160211SJeremy Fitzhardinge np->tx.req_prod_pvt = i + 1; 5600d160211SJeremy Fitzhardinge 5610d160211SJeremy Fitzhardinge xennet_make_frags(skb, dev, tx); 5620d160211SJeremy Fitzhardinge tx->size = skb->len; 5630d160211SJeremy Fitzhardinge 5640d160211SJeremy Fitzhardinge RING_PUSH_REQUESTS_AND_CHECK_NOTIFY(&np->tx, notify); 5650d160211SJeremy Fitzhardinge if (notify) 5660d160211SJeremy Fitzhardinge notify_remote_via_irq(np->netdev->irq); 5670d160211SJeremy Fitzhardinge 568e00f85beSstephen hemminger u64_stats_update_begin(&stats->syncp); 569e00f85beSstephen hemminger stats->tx_bytes += skb->len; 570e00f85beSstephen hemminger stats->tx_packets++; 571e00f85beSstephen hemminger u64_stats_update_end(&stats->syncp); 57210a273a6SJeremy Fitzhardinge 57310a273a6SJeremy Fitzhardinge /* Note: It is not safe to access skb after xennet_tx_buf_gc()! */ 5740d160211SJeremy Fitzhardinge xennet_tx_buf_gc(dev); 5750d160211SJeremy Fitzhardinge 5760d160211SJeremy Fitzhardinge if (!netfront_tx_slot_available(np)) 5770d160211SJeremy Fitzhardinge netif_stop_queue(dev); 5780d160211SJeremy Fitzhardinge 579cf66f9d4SKonrad Rzeszutek Wilk spin_unlock_irqrestore(&np->tx_lock, flags); 5800d160211SJeremy Fitzhardinge 5816ed10654SPatrick McHardy return NETDEV_TX_OK; 5820d160211SJeremy Fitzhardinge 5830d160211SJeremy Fitzhardinge drop: 58409f75cd7SJeff Garzik dev->stats.tx_dropped++; 5850d160211SJeremy Fitzhardinge dev_kfree_skb(skb); 5866ed10654SPatrick McHardy return NETDEV_TX_OK; 5870d160211SJeremy Fitzhardinge } 5880d160211SJeremy Fitzhardinge 5890d160211SJeremy Fitzhardinge static int xennet_close(struct net_device *dev) 5900d160211SJeremy Fitzhardinge { 5910d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 5920d160211SJeremy Fitzhardinge netif_stop_queue(np->netdev); 593bea3348eSStephen Hemminger napi_disable(&np->napi); 5940d160211SJeremy Fitzhardinge return 0; 5950d160211SJeremy Fitzhardinge } 5960d160211SJeremy Fitzhardinge 5970d160211SJeremy Fitzhardinge static void xennet_move_rx_slot(struct netfront_info *np, struct sk_buff *skb, 5980d160211SJeremy Fitzhardinge grant_ref_t ref) 5990d160211SJeremy Fitzhardinge { 6000d160211SJeremy Fitzhardinge int new = xennet_rxidx(np->rx.req_prod_pvt); 6010d160211SJeremy Fitzhardinge 6020d160211SJeremy Fitzhardinge BUG_ON(np->rx_skbs[new]); 6030d160211SJeremy Fitzhardinge np->rx_skbs[new] = skb; 6040d160211SJeremy Fitzhardinge np->grant_rx_ref[new] = ref; 6050d160211SJeremy Fitzhardinge RING_GET_REQUEST(&np->rx, np->rx.req_prod_pvt)->id = new; 6060d160211SJeremy Fitzhardinge RING_GET_REQUEST(&np->rx, np->rx.req_prod_pvt)->gref = ref; 6070d160211SJeremy Fitzhardinge np->rx.req_prod_pvt++; 6080d160211SJeremy Fitzhardinge } 6090d160211SJeremy Fitzhardinge 6100d160211SJeremy Fitzhardinge static int xennet_get_extras(struct netfront_info *np, 6110d160211SJeremy Fitzhardinge struct xen_netif_extra_info *extras, 6120d160211SJeremy Fitzhardinge RING_IDX rp) 6130d160211SJeremy Fitzhardinge 6140d160211SJeremy Fitzhardinge { 6150d160211SJeremy Fitzhardinge struct xen_netif_extra_info *extra; 6160d160211SJeremy Fitzhardinge struct device *dev = &np->netdev->dev; 6170d160211SJeremy Fitzhardinge RING_IDX cons = np->rx.rsp_cons; 6180d160211SJeremy Fitzhardinge int err = 0; 6190d160211SJeremy Fitzhardinge 6200d160211SJeremy Fitzhardinge do { 6210d160211SJeremy Fitzhardinge struct sk_buff *skb; 6220d160211SJeremy Fitzhardinge grant_ref_t ref; 6230d160211SJeremy Fitzhardinge 6240d160211SJeremy Fitzhardinge if (unlikely(cons + 1 == rp)) { 6250d160211SJeremy Fitzhardinge if (net_ratelimit()) 6260d160211SJeremy Fitzhardinge dev_warn(dev, "Missing extra info\n"); 6270d160211SJeremy Fitzhardinge err = -EBADR; 6280d160211SJeremy Fitzhardinge break; 6290d160211SJeremy Fitzhardinge } 6300d160211SJeremy Fitzhardinge 6310d160211SJeremy Fitzhardinge extra = (struct xen_netif_extra_info *) 6320d160211SJeremy Fitzhardinge RING_GET_RESPONSE(&np->rx, ++cons); 6330d160211SJeremy Fitzhardinge 6340d160211SJeremy Fitzhardinge if (unlikely(!extra->type || 6350d160211SJeremy Fitzhardinge extra->type >= XEN_NETIF_EXTRA_TYPE_MAX)) { 6360d160211SJeremy Fitzhardinge if (net_ratelimit()) 6370d160211SJeremy Fitzhardinge dev_warn(dev, "Invalid extra type: %d\n", 6380d160211SJeremy Fitzhardinge extra->type); 6390d160211SJeremy Fitzhardinge err = -EINVAL; 6400d160211SJeremy Fitzhardinge } else { 6410d160211SJeremy Fitzhardinge memcpy(&extras[extra->type - 1], extra, 6420d160211SJeremy Fitzhardinge sizeof(*extra)); 6430d160211SJeremy Fitzhardinge } 6440d160211SJeremy Fitzhardinge 6450d160211SJeremy Fitzhardinge skb = xennet_get_rx_skb(np, cons); 6460d160211SJeremy Fitzhardinge ref = xennet_get_rx_ref(np, cons); 6470d160211SJeremy Fitzhardinge xennet_move_rx_slot(np, skb, ref); 6480d160211SJeremy Fitzhardinge } while (extra->flags & XEN_NETIF_EXTRA_FLAG_MORE); 6490d160211SJeremy Fitzhardinge 6500d160211SJeremy Fitzhardinge np->rx.rsp_cons = cons; 6510d160211SJeremy Fitzhardinge return err; 6520d160211SJeremy Fitzhardinge } 6530d160211SJeremy Fitzhardinge 6540d160211SJeremy Fitzhardinge static int xennet_get_responses(struct netfront_info *np, 6550d160211SJeremy Fitzhardinge struct netfront_rx_info *rinfo, RING_IDX rp, 6560d160211SJeremy Fitzhardinge struct sk_buff_head *list) 6570d160211SJeremy Fitzhardinge { 6580d160211SJeremy Fitzhardinge struct xen_netif_rx_response *rx = &rinfo->rx; 6590d160211SJeremy Fitzhardinge struct xen_netif_extra_info *extras = rinfo->extras; 6600d160211SJeremy Fitzhardinge struct device *dev = &np->netdev->dev; 6610d160211SJeremy Fitzhardinge RING_IDX cons = np->rx.rsp_cons; 6620d160211SJeremy Fitzhardinge struct sk_buff *skb = xennet_get_rx_skb(np, cons); 6630d160211SJeremy Fitzhardinge grant_ref_t ref = xennet_get_rx_ref(np, cons); 6640d160211SJeremy Fitzhardinge int max = MAX_SKB_FRAGS + (rx->status <= RX_COPY_THRESHOLD); 6650d160211SJeremy Fitzhardinge int frags = 1; 6660d160211SJeremy Fitzhardinge int err = 0; 6670d160211SJeremy Fitzhardinge unsigned long ret; 6680d160211SJeremy Fitzhardinge 669f942dc25SIan Campbell if (rx->flags & XEN_NETRXF_extra_info) { 6700d160211SJeremy Fitzhardinge err = xennet_get_extras(np, extras, rp); 6710d160211SJeremy Fitzhardinge cons = np->rx.rsp_cons; 6720d160211SJeremy Fitzhardinge } 6730d160211SJeremy Fitzhardinge 6740d160211SJeremy Fitzhardinge for (;;) { 6750d160211SJeremy Fitzhardinge if (unlikely(rx->status < 0 || 6760d160211SJeremy Fitzhardinge rx->offset + rx->status > PAGE_SIZE)) { 6770d160211SJeremy Fitzhardinge if (net_ratelimit()) 6780d160211SJeremy Fitzhardinge dev_warn(dev, "rx->offset: %x, size: %u\n", 6790d160211SJeremy Fitzhardinge rx->offset, rx->status); 6800d160211SJeremy Fitzhardinge xennet_move_rx_slot(np, skb, ref); 6810d160211SJeremy Fitzhardinge err = -EINVAL; 6820d160211SJeremy Fitzhardinge goto next; 6830d160211SJeremy Fitzhardinge } 6840d160211SJeremy Fitzhardinge 6850d160211SJeremy Fitzhardinge /* 6860d160211SJeremy Fitzhardinge * This definitely indicates a bug, either in this driver or in 6870d160211SJeremy Fitzhardinge * the backend driver. In future this should flag the bad 6880d160211SJeremy Fitzhardinge * situation to the system controller to reboot the backed. 6890d160211SJeremy Fitzhardinge */ 6900d160211SJeremy Fitzhardinge if (ref == GRANT_INVALID_REF) { 6910d160211SJeremy Fitzhardinge if (net_ratelimit()) 6920d160211SJeremy Fitzhardinge dev_warn(dev, "Bad rx response id %d.\n", 6930d160211SJeremy Fitzhardinge rx->id); 6940d160211SJeremy Fitzhardinge err = -EINVAL; 6950d160211SJeremy Fitzhardinge goto next; 6960d160211SJeremy Fitzhardinge } 6970d160211SJeremy Fitzhardinge 6980d160211SJeremy Fitzhardinge ret = gnttab_end_foreign_access_ref(ref, 0); 6990d160211SJeremy Fitzhardinge BUG_ON(!ret); 7000d160211SJeremy Fitzhardinge 7010d160211SJeremy Fitzhardinge gnttab_release_grant_reference(&np->gref_rx_head, ref); 7020d160211SJeremy Fitzhardinge 7030d160211SJeremy Fitzhardinge __skb_queue_tail(list, skb); 7040d160211SJeremy Fitzhardinge 7050d160211SJeremy Fitzhardinge next: 706f942dc25SIan Campbell if (!(rx->flags & XEN_NETRXF_more_data)) 7070d160211SJeremy Fitzhardinge break; 7080d160211SJeremy Fitzhardinge 7090d160211SJeremy Fitzhardinge if (cons + frags == rp) { 7100d160211SJeremy Fitzhardinge if (net_ratelimit()) 7110d160211SJeremy Fitzhardinge dev_warn(dev, "Need more frags\n"); 7120d160211SJeremy Fitzhardinge err = -ENOENT; 7130d160211SJeremy Fitzhardinge break; 7140d160211SJeremy Fitzhardinge } 7150d160211SJeremy Fitzhardinge 7160d160211SJeremy Fitzhardinge rx = RING_GET_RESPONSE(&np->rx, cons + frags); 7170d160211SJeremy Fitzhardinge skb = xennet_get_rx_skb(np, cons + frags); 7180d160211SJeremy Fitzhardinge ref = xennet_get_rx_ref(np, cons + frags); 7190d160211SJeremy Fitzhardinge frags++; 7200d160211SJeremy Fitzhardinge } 7210d160211SJeremy Fitzhardinge 7220d160211SJeremy Fitzhardinge if (unlikely(frags > max)) { 7230d160211SJeremy Fitzhardinge if (net_ratelimit()) 7240d160211SJeremy Fitzhardinge dev_warn(dev, "Too many frags\n"); 7250d160211SJeremy Fitzhardinge err = -E2BIG; 7260d160211SJeremy Fitzhardinge } 7270d160211SJeremy Fitzhardinge 7280d160211SJeremy Fitzhardinge if (unlikely(err)) 7290d160211SJeremy Fitzhardinge np->rx.rsp_cons = cons + frags; 7300d160211SJeremy Fitzhardinge 7310d160211SJeremy Fitzhardinge return err; 7320d160211SJeremy Fitzhardinge } 7330d160211SJeremy Fitzhardinge 7340d160211SJeremy Fitzhardinge static int xennet_set_skb_gso(struct sk_buff *skb, 7350d160211SJeremy Fitzhardinge struct xen_netif_extra_info *gso) 7360d160211SJeremy Fitzhardinge { 7370d160211SJeremy Fitzhardinge if (!gso->u.gso.size) { 7380d160211SJeremy Fitzhardinge if (net_ratelimit()) 7390d160211SJeremy Fitzhardinge printk(KERN_WARNING "GSO size must not be zero.\n"); 7400d160211SJeremy Fitzhardinge return -EINVAL; 7410d160211SJeremy Fitzhardinge } 7420d160211SJeremy Fitzhardinge 7430d160211SJeremy Fitzhardinge /* Currently only TCPv4 S.O. is supported. */ 7440d160211SJeremy Fitzhardinge if (gso->u.gso.type != XEN_NETIF_GSO_TYPE_TCPV4) { 7450d160211SJeremy Fitzhardinge if (net_ratelimit()) 7460d160211SJeremy Fitzhardinge printk(KERN_WARNING "Bad GSO type %d.\n", gso->u.gso.type); 7470d160211SJeremy Fitzhardinge return -EINVAL; 7480d160211SJeremy Fitzhardinge } 7490d160211SJeremy Fitzhardinge 7500d160211SJeremy Fitzhardinge skb_shinfo(skb)->gso_size = gso->u.gso.size; 7510d160211SJeremy Fitzhardinge skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4; 7520d160211SJeremy Fitzhardinge 7530d160211SJeremy Fitzhardinge /* Header must be checked, and gso_segs computed. */ 7540d160211SJeremy Fitzhardinge skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY; 7550d160211SJeremy Fitzhardinge skb_shinfo(skb)->gso_segs = 0; 7560d160211SJeremy Fitzhardinge 7570d160211SJeremy Fitzhardinge return 0; 7580d160211SJeremy Fitzhardinge } 7590d160211SJeremy Fitzhardinge 7600d160211SJeremy Fitzhardinge static RING_IDX xennet_fill_frags(struct netfront_info *np, 7610d160211SJeremy Fitzhardinge struct sk_buff *skb, 7620d160211SJeremy Fitzhardinge struct sk_buff_head *list) 7630d160211SJeremy Fitzhardinge { 7640d160211SJeremy Fitzhardinge struct skb_shared_info *shinfo = skb_shinfo(skb); 7650d160211SJeremy Fitzhardinge int nr_frags = shinfo->nr_frags; 7660d160211SJeremy Fitzhardinge RING_IDX cons = np->rx.rsp_cons; 7670d160211SJeremy Fitzhardinge struct sk_buff *nskb; 7680d160211SJeremy Fitzhardinge 7690d160211SJeremy Fitzhardinge while ((nskb = __skb_dequeue(list))) { 7700d160211SJeremy Fitzhardinge struct xen_netif_rx_response *rx = 7710d160211SJeremy Fitzhardinge RING_GET_RESPONSE(&np->rx, ++cons); 77201c68026SIan Campbell skb_frag_t *nfrag = &skb_shinfo(nskb)->frags[0]; 7730d160211SJeremy Fitzhardinge 77401c68026SIan Campbell __skb_fill_page_desc(skb, nr_frags, 77501c68026SIan Campbell skb_frag_page(nfrag), 77601c68026SIan Campbell rx->offset, rx->status); 7770d160211SJeremy Fitzhardinge 7780d160211SJeremy Fitzhardinge skb->data_len += rx->status; 7790d160211SJeremy Fitzhardinge 7800d160211SJeremy Fitzhardinge skb_shinfo(nskb)->nr_frags = 0; 7810d160211SJeremy Fitzhardinge kfree_skb(nskb); 7820d160211SJeremy Fitzhardinge 7830d160211SJeremy Fitzhardinge nr_frags++; 7840d160211SJeremy Fitzhardinge } 7850d160211SJeremy Fitzhardinge 7860d160211SJeremy Fitzhardinge shinfo->nr_frags = nr_frags; 7870d160211SJeremy Fitzhardinge return cons; 7880d160211SJeremy Fitzhardinge } 7890d160211SJeremy Fitzhardinge 790e0ce4af9SIan Campbell static int checksum_setup(struct net_device *dev, struct sk_buff *skb) 7910d160211SJeremy Fitzhardinge { 7920d160211SJeremy Fitzhardinge struct iphdr *iph; 7930d160211SJeremy Fitzhardinge unsigned char *th; 7940d160211SJeremy Fitzhardinge int err = -EPROTO; 795e0ce4af9SIan Campbell int recalculate_partial_csum = 0; 796e0ce4af9SIan Campbell 797e0ce4af9SIan Campbell /* 798e0ce4af9SIan Campbell * A GSO SKB must be CHECKSUM_PARTIAL. However some buggy 799e0ce4af9SIan Campbell * peers can fail to set NETRXF_csum_blank when sending a GSO 800e0ce4af9SIan Campbell * frame. In this case force the SKB to CHECKSUM_PARTIAL and 801e0ce4af9SIan Campbell * recalculate the partial checksum. 802e0ce4af9SIan Campbell */ 803e0ce4af9SIan Campbell if (skb->ip_summed != CHECKSUM_PARTIAL && skb_is_gso(skb)) { 804e0ce4af9SIan Campbell struct netfront_info *np = netdev_priv(dev); 805e0ce4af9SIan Campbell np->rx_gso_checksum_fixup++; 806e0ce4af9SIan Campbell skb->ip_summed = CHECKSUM_PARTIAL; 807e0ce4af9SIan Campbell recalculate_partial_csum = 1; 808e0ce4af9SIan Campbell } 809e0ce4af9SIan Campbell 810e0ce4af9SIan Campbell /* A non-CHECKSUM_PARTIAL SKB does not require setup. */ 811e0ce4af9SIan Campbell if (skb->ip_summed != CHECKSUM_PARTIAL) 812e0ce4af9SIan Campbell return 0; 8130d160211SJeremy Fitzhardinge 8140d160211SJeremy Fitzhardinge if (skb->protocol != htons(ETH_P_IP)) 8150d160211SJeremy Fitzhardinge goto out; 8160d160211SJeremy Fitzhardinge 8170d160211SJeremy Fitzhardinge iph = (void *)skb->data; 8180d160211SJeremy Fitzhardinge th = skb->data + 4 * iph->ihl; 8190d160211SJeremy Fitzhardinge if (th >= skb_tail_pointer(skb)) 8200d160211SJeremy Fitzhardinge goto out; 8210d160211SJeremy Fitzhardinge 8220d160211SJeremy Fitzhardinge skb->csum_start = th - skb->head; 8230d160211SJeremy Fitzhardinge switch (iph->protocol) { 8240d160211SJeremy Fitzhardinge case IPPROTO_TCP: 8250d160211SJeremy Fitzhardinge skb->csum_offset = offsetof(struct tcphdr, check); 826e0ce4af9SIan Campbell 827e0ce4af9SIan Campbell if (recalculate_partial_csum) { 828e0ce4af9SIan Campbell struct tcphdr *tcph = (struct tcphdr *)th; 829e0ce4af9SIan Campbell tcph->check = ~csum_tcpudp_magic(iph->saddr, iph->daddr, 830e0ce4af9SIan Campbell skb->len - iph->ihl*4, 831e0ce4af9SIan Campbell IPPROTO_TCP, 0); 832e0ce4af9SIan Campbell } 8330d160211SJeremy Fitzhardinge break; 8340d160211SJeremy Fitzhardinge case IPPROTO_UDP: 8350d160211SJeremy Fitzhardinge skb->csum_offset = offsetof(struct udphdr, check); 836e0ce4af9SIan Campbell 837e0ce4af9SIan Campbell if (recalculate_partial_csum) { 838e0ce4af9SIan Campbell struct udphdr *udph = (struct udphdr *)th; 839e0ce4af9SIan Campbell udph->check = ~csum_tcpudp_magic(iph->saddr, iph->daddr, 840e0ce4af9SIan Campbell skb->len - iph->ihl*4, 841e0ce4af9SIan Campbell IPPROTO_UDP, 0); 842e0ce4af9SIan Campbell } 8430d160211SJeremy Fitzhardinge break; 8440d160211SJeremy Fitzhardinge default: 8450d160211SJeremy Fitzhardinge if (net_ratelimit()) 8460d160211SJeremy Fitzhardinge printk(KERN_ERR "Attempting to checksum a non-" 8470d160211SJeremy Fitzhardinge "TCP/UDP packet, dropping a protocol" 8480d160211SJeremy Fitzhardinge " %d packet", iph->protocol); 8490d160211SJeremy Fitzhardinge goto out; 8500d160211SJeremy Fitzhardinge } 8510d160211SJeremy Fitzhardinge 8520d160211SJeremy Fitzhardinge if ((th + skb->csum_offset + 2) > skb_tail_pointer(skb)) 8530d160211SJeremy Fitzhardinge goto out; 8540d160211SJeremy Fitzhardinge 8550d160211SJeremy Fitzhardinge err = 0; 8560d160211SJeremy Fitzhardinge 8570d160211SJeremy Fitzhardinge out: 8580d160211SJeremy Fitzhardinge return err; 8590d160211SJeremy Fitzhardinge } 8600d160211SJeremy Fitzhardinge 8610d160211SJeremy Fitzhardinge static int handle_incoming_queue(struct net_device *dev, 8620d160211SJeremy Fitzhardinge struct sk_buff_head *rxq) 8630d160211SJeremy Fitzhardinge { 864e00f85beSstephen hemminger struct netfront_info *np = netdev_priv(dev); 865e00f85beSstephen hemminger struct netfront_stats *stats = this_cpu_ptr(np->stats); 8660d160211SJeremy Fitzhardinge int packets_dropped = 0; 8670d160211SJeremy Fitzhardinge struct sk_buff *skb; 8680d160211SJeremy Fitzhardinge 8690d160211SJeremy Fitzhardinge while ((skb = __skb_dequeue(rxq)) != NULL) { 8703683243bSIan Campbell int pull_to = NETFRONT_SKB_CB(skb)->pull_to; 8710d160211SJeremy Fitzhardinge 8723683243bSIan Campbell __pskb_pull_tail(skb, pull_to - skb_headlen(skb)); 8730d160211SJeremy Fitzhardinge 8740d160211SJeremy Fitzhardinge /* Ethernet work: Delayed to here as it peeks the header. */ 8750d160211SJeremy Fitzhardinge skb->protocol = eth_type_trans(skb, dev); 8760d160211SJeremy Fitzhardinge 877e0ce4af9SIan Campbell if (checksum_setup(dev, skb)) { 8780d160211SJeremy Fitzhardinge kfree_skb(skb); 8790d160211SJeremy Fitzhardinge packets_dropped++; 88009f75cd7SJeff Garzik dev->stats.rx_errors++; 8810d160211SJeremy Fitzhardinge continue; 8820d160211SJeremy Fitzhardinge } 8830d160211SJeremy Fitzhardinge 884e00f85beSstephen hemminger u64_stats_update_begin(&stats->syncp); 885e00f85beSstephen hemminger stats->rx_packets++; 886e00f85beSstephen hemminger stats->rx_bytes += skb->len; 887e00f85beSstephen hemminger u64_stats_update_end(&stats->syncp); 8880d160211SJeremy Fitzhardinge 8890d160211SJeremy Fitzhardinge /* Pass it up. */ 8900d160211SJeremy Fitzhardinge netif_receive_skb(skb); 8910d160211SJeremy Fitzhardinge } 8920d160211SJeremy Fitzhardinge 8930d160211SJeremy Fitzhardinge return packets_dropped; 8940d160211SJeremy Fitzhardinge } 8950d160211SJeremy Fitzhardinge 896bea3348eSStephen Hemminger static int xennet_poll(struct napi_struct *napi, int budget) 8970d160211SJeremy Fitzhardinge { 898bea3348eSStephen Hemminger struct netfront_info *np = container_of(napi, struct netfront_info, napi); 899bea3348eSStephen Hemminger struct net_device *dev = np->netdev; 9000d160211SJeremy Fitzhardinge struct sk_buff *skb; 9010d160211SJeremy Fitzhardinge struct netfront_rx_info rinfo; 9020d160211SJeremy Fitzhardinge struct xen_netif_rx_response *rx = &rinfo.rx; 9030d160211SJeremy Fitzhardinge struct xen_netif_extra_info *extras = rinfo.extras; 9040d160211SJeremy Fitzhardinge RING_IDX i, rp; 905bea3348eSStephen Hemminger int work_done; 9060d160211SJeremy Fitzhardinge struct sk_buff_head rxq; 9070d160211SJeremy Fitzhardinge struct sk_buff_head errq; 9080d160211SJeremy Fitzhardinge struct sk_buff_head tmpq; 9090d160211SJeremy Fitzhardinge unsigned long flags; 9100d160211SJeremy Fitzhardinge int err; 9110d160211SJeremy Fitzhardinge 9120d160211SJeremy Fitzhardinge spin_lock(&np->rx_lock); 9130d160211SJeremy Fitzhardinge 9140d160211SJeremy Fitzhardinge skb_queue_head_init(&rxq); 9150d160211SJeremy Fitzhardinge skb_queue_head_init(&errq); 9160d160211SJeremy Fitzhardinge skb_queue_head_init(&tmpq); 9170d160211SJeremy Fitzhardinge 9180d160211SJeremy Fitzhardinge rp = np->rx.sring->rsp_prod; 9190d160211SJeremy Fitzhardinge rmb(); /* Ensure we see queued responses up to 'rp'. */ 9200d160211SJeremy Fitzhardinge 9210d160211SJeremy Fitzhardinge i = np->rx.rsp_cons; 9220d160211SJeremy Fitzhardinge work_done = 0; 9230d160211SJeremy Fitzhardinge while ((i != rp) && (work_done < budget)) { 9240d160211SJeremy Fitzhardinge memcpy(rx, RING_GET_RESPONSE(&np->rx, i), sizeof(*rx)); 9250d160211SJeremy Fitzhardinge memset(extras, 0, sizeof(rinfo.extras)); 9260d160211SJeremy Fitzhardinge 9270d160211SJeremy Fitzhardinge err = xennet_get_responses(np, &rinfo, rp, &tmpq); 9280d160211SJeremy Fitzhardinge 9290d160211SJeremy Fitzhardinge if (unlikely(err)) { 9300d160211SJeremy Fitzhardinge err: 9310d160211SJeremy Fitzhardinge while ((skb = __skb_dequeue(&tmpq))) 9320d160211SJeremy Fitzhardinge __skb_queue_tail(&errq, skb); 93309f75cd7SJeff Garzik dev->stats.rx_errors++; 9340d160211SJeremy Fitzhardinge i = np->rx.rsp_cons; 9350d160211SJeremy Fitzhardinge continue; 9360d160211SJeremy Fitzhardinge } 9370d160211SJeremy Fitzhardinge 9380d160211SJeremy Fitzhardinge skb = __skb_dequeue(&tmpq); 9390d160211SJeremy Fitzhardinge 9400d160211SJeremy Fitzhardinge if (extras[XEN_NETIF_EXTRA_TYPE_GSO - 1].type) { 9410d160211SJeremy Fitzhardinge struct xen_netif_extra_info *gso; 9420d160211SJeremy Fitzhardinge gso = &extras[XEN_NETIF_EXTRA_TYPE_GSO - 1]; 9430d160211SJeremy Fitzhardinge 9440d160211SJeremy Fitzhardinge if (unlikely(xennet_set_skb_gso(skb, gso))) { 9450d160211SJeremy Fitzhardinge __skb_queue_head(&tmpq, skb); 9460d160211SJeremy Fitzhardinge np->rx.rsp_cons += skb_queue_len(&tmpq); 9470d160211SJeremy Fitzhardinge goto err; 9480d160211SJeremy Fitzhardinge } 9490d160211SJeremy Fitzhardinge } 9500d160211SJeremy Fitzhardinge 9513683243bSIan Campbell NETFRONT_SKB_CB(skb)->pull_to = rx->status; 9523683243bSIan Campbell if (NETFRONT_SKB_CB(skb)->pull_to > RX_COPY_THRESHOLD) 9533683243bSIan Campbell NETFRONT_SKB_CB(skb)->pull_to = RX_COPY_THRESHOLD; 9540d160211SJeremy Fitzhardinge 9553683243bSIan Campbell skb_shinfo(skb)->frags[0].page_offset = rx->offset; 9563683243bSIan Campbell skb_frag_size_set(&skb_shinfo(skb)->frags[0], rx->status); 9573683243bSIan Campbell skb->data_len = rx->status; 9580d160211SJeremy Fitzhardinge 9590d160211SJeremy Fitzhardinge i = xennet_fill_frags(np, skb, &tmpq); 9600d160211SJeremy Fitzhardinge 9610d160211SJeremy Fitzhardinge /* 9620d160211SJeremy Fitzhardinge * Truesize approximates the size of true data plus 9630d160211SJeremy Fitzhardinge * any supervisor overheads. Adding hypervisor 9640d160211SJeremy Fitzhardinge * overheads has been shown to significantly reduce 9650d160211SJeremy Fitzhardinge * achievable bandwidth with the default receive 9660d160211SJeremy Fitzhardinge * buffer size. It is therefore not wise to account 9670d160211SJeremy Fitzhardinge * for it here. 9680d160211SJeremy Fitzhardinge * 9690d160211SJeremy Fitzhardinge * After alloc_skb(RX_COPY_THRESHOLD), truesize is set 9700d160211SJeremy Fitzhardinge * to RX_COPY_THRESHOLD + the supervisor 9710d160211SJeremy Fitzhardinge * overheads. Here, we add the size of the data pulled 9720d160211SJeremy Fitzhardinge * in xennet_fill_frags(). 9730d160211SJeremy Fitzhardinge * 9740d160211SJeremy Fitzhardinge * We also adjust for any unused space in the main 9750d160211SJeremy Fitzhardinge * data area by subtracting (RX_COPY_THRESHOLD - 9760d160211SJeremy Fitzhardinge * len). This is especially important with drivers 9770d160211SJeremy Fitzhardinge * which split incoming packets into header and data, 9780d160211SJeremy Fitzhardinge * using only 66 bytes of the main data area (see the 9790d160211SJeremy Fitzhardinge * e1000 driver for example.) On such systems, 9800d160211SJeremy Fitzhardinge * without this last adjustement, our achievable 9810d160211SJeremy Fitzhardinge * receive throughout using the standard receive 9820d160211SJeremy Fitzhardinge * buffer size was cut by 25%(!!!). 9830d160211SJeremy Fitzhardinge */ 9843683243bSIan Campbell skb->truesize += skb->data_len - RX_COPY_THRESHOLD; 9850d160211SJeremy Fitzhardinge skb->len += skb->data_len; 9860d160211SJeremy Fitzhardinge 987f942dc25SIan Campbell if (rx->flags & XEN_NETRXF_csum_blank) 9880d160211SJeremy Fitzhardinge skb->ip_summed = CHECKSUM_PARTIAL; 989f942dc25SIan Campbell else if (rx->flags & XEN_NETRXF_data_validated) 9900d160211SJeremy Fitzhardinge skb->ip_summed = CHECKSUM_UNNECESSARY; 9910d160211SJeremy Fitzhardinge 9920d160211SJeremy Fitzhardinge __skb_queue_tail(&rxq, skb); 9930d160211SJeremy Fitzhardinge 9940d160211SJeremy Fitzhardinge np->rx.rsp_cons = ++i; 9950d160211SJeremy Fitzhardinge work_done++; 9960d160211SJeremy Fitzhardinge } 9970d160211SJeremy Fitzhardinge 99856cfe5d0SWang Chen __skb_queue_purge(&errq); 9990d160211SJeremy Fitzhardinge 10000d160211SJeremy Fitzhardinge work_done -= handle_incoming_queue(dev, &rxq); 10010d160211SJeremy Fitzhardinge 10020d160211SJeremy Fitzhardinge /* If we get a callback with very few responses, reduce fill target. */ 10030d160211SJeremy Fitzhardinge /* NB. Note exponential increase, linear decrease. */ 10040d160211SJeremy Fitzhardinge if (((np->rx.req_prod_pvt - np->rx.sring->rsp_prod) > 10050d160211SJeremy Fitzhardinge ((3*np->rx_target) / 4)) && 10060d160211SJeremy Fitzhardinge (--np->rx_target < np->rx_min_target)) 10070d160211SJeremy Fitzhardinge np->rx_target = np->rx_min_target; 10080d160211SJeremy Fitzhardinge 10090d160211SJeremy Fitzhardinge xennet_alloc_rx_buffers(dev); 10100d160211SJeremy Fitzhardinge 10110d160211SJeremy Fitzhardinge if (work_done < budget) { 1012bea3348eSStephen Hemminger int more_to_do = 0; 1013bea3348eSStephen Hemminger 10140d160211SJeremy Fitzhardinge local_irq_save(flags); 10150d160211SJeremy Fitzhardinge 10160d160211SJeremy Fitzhardinge RING_FINAL_CHECK_FOR_RESPONSES(&np->rx, more_to_do); 10170d160211SJeremy Fitzhardinge if (!more_to_do) 1018288379f0SBen Hutchings __napi_complete(napi); 10190d160211SJeremy Fitzhardinge 10200d160211SJeremy Fitzhardinge local_irq_restore(flags); 10210d160211SJeremy Fitzhardinge } 10220d160211SJeremy Fitzhardinge 10230d160211SJeremy Fitzhardinge spin_unlock(&np->rx_lock); 10240d160211SJeremy Fitzhardinge 1025bea3348eSStephen Hemminger return work_done; 10260d160211SJeremy Fitzhardinge } 10270d160211SJeremy Fitzhardinge 10280d160211SJeremy Fitzhardinge static int xennet_change_mtu(struct net_device *dev, int mtu) 10290d160211SJeremy Fitzhardinge { 10300d160211SJeremy Fitzhardinge int max = xennet_can_sg(dev) ? 65535 - ETH_HLEN : ETH_DATA_LEN; 10310d160211SJeremy Fitzhardinge 10320d160211SJeremy Fitzhardinge if (mtu > max) 10330d160211SJeremy Fitzhardinge return -EINVAL; 10340d160211SJeremy Fitzhardinge dev->mtu = mtu; 10350d160211SJeremy Fitzhardinge return 0; 10360d160211SJeremy Fitzhardinge } 10370d160211SJeremy Fitzhardinge 1038e00f85beSstephen hemminger static struct rtnl_link_stats64 *xennet_get_stats64(struct net_device *dev, 1039e00f85beSstephen hemminger struct rtnl_link_stats64 *tot) 1040e00f85beSstephen hemminger { 1041e00f85beSstephen hemminger struct netfront_info *np = netdev_priv(dev); 1042e00f85beSstephen hemminger int cpu; 1043e00f85beSstephen hemminger 1044e00f85beSstephen hemminger for_each_possible_cpu(cpu) { 1045e00f85beSstephen hemminger struct netfront_stats *stats = per_cpu_ptr(np->stats, cpu); 1046e00f85beSstephen hemminger u64 rx_packets, rx_bytes, tx_packets, tx_bytes; 1047e00f85beSstephen hemminger unsigned int start; 1048e00f85beSstephen hemminger 1049e00f85beSstephen hemminger do { 1050e00f85beSstephen hemminger start = u64_stats_fetch_begin_bh(&stats->syncp); 1051e00f85beSstephen hemminger 1052e00f85beSstephen hemminger rx_packets = stats->rx_packets; 1053e00f85beSstephen hemminger tx_packets = stats->tx_packets; 1054e00f85beSstephen hemminger rx_bytes = stats->rx_bytes; 1055e00f85beSstephen hemminger tx_bytes = stats->tx_bytes; 1056e00f85beSstephen hemminger } while (u64_stats_fetch_retry_bh(&stats->syncp, start)); 1057e00f85beSstephen hemminger 1058e00f85beSstephen hemminger tot->rx_packets += rx_packets; 1059e00f85beSstephen hemminger tot->tx_packets += tx_packets; 1060e00f85beSstephen hemminger tot->rx_bytes += rx_bytes; 1061e00f85beSstephen hemminger tot->tx_bytes += tx_bytes; 1062e00f85beSstephen hemminger } 1063e00f85beSstephen hemminger 1064e00f85beSstephen hemminger tot->rx_errors = dev->stats.rx_errors; 1065e00f85beSstephen hemminger tot->tx_dropped = dev->stats.tx_dropped; 1066e00f85beSstephen hemminger 1067e00f85beSstephen hemminger return tot; 1068e00f85beSstephen hemminger } 1069e00f85beSstephen hemminger 10700d160211SJeremy Fitzhardinge static void xennet_release_tx_bufs(struct netfront_info *np) 10710d160211SJeremy Fitzhardinge { 10720d160211SJeremy Fitzhardinge struct sk_buff *skb; 10730d160211SJeremy Fitzhardinge int i; 10740d160211SJeremy Fitzhardinge 10750d160211SJeremy Fitzhardinge for (i = 0; i < NET_TX_RING_SIZE; i++) { 10760d160211SJeremy Fitzhardinge /* Skip over entries which are actually freelist references */ 10771ffb40b8SIsaku Yamahata if (skb_entry_is_link(&np->tx_skbs[i])) 10780d160211SJeremy Fitzhardinge continue; 10790d160211SJeremy Fitzhardinge 10800d160211SJeremy Fitzhardinge skb = np->tx_skbs[i].skb; 10810d160211SJeremy Fitzhardinge gnttab_end_foreign_access_ref(np->grant_tx_ref[i], 10820d160211SJeremy Fitzhardinge GNTMAP_readonly); 10830d160211SJeremy Fitzhardinge gnttab_release_grant_reference(&np->gref_tx_head, 10840d160211SJeremy Fitzhardinge np->grant_tx_ref[i]); 10850d160211SJeremy Fitzhardinge np->grant_tx_ref[i] = GRANT_INVALID_REF; 10860d160211SJeremy Fitzhardinge add_id_to_freelist(&np->tx_skb_freelist, np->tx_skbs, i); 10870d160211SJeremy Fitzhardinge dev_kfree_skb_irq(skb); 10880d160211SJeremy Fitzhardinge } 10890d160211SJeremy Fitzhardinge } 10900d160211SJeremy Fitzhardinge 10910d160211SJeremy Fitzhardinge static void xennet_release_rx_bufs(struct netfront_info *np) 10920d160211SJeremy Fitzhardinge { 10930d160211SJeremy Fitzhardinge struct mmu_update *mmu = np->rx_mmu; 10940d160211SJeremy Fitzhardinge struct multicall_entry *mcl = np->rx_mcl; 10950d160211SJeremy Fitzhardinge struct sk_buff_head free_list; 10960d160211SJeremy Fitzhardinge struct sk_buff *skb; 10970d160211SJeremy Fitzhardinge unsigned long mfn; 10980d160211SJeremy Fitzhardinge int xfer = 0, noxfer = 0, unused = 0; 10990d160211SJeremy Fitzhardinge int id, ref; 11000d160211SJeremy Fitzhardinge 11010d160211SJeremy Fitzhardinge dev_warn(&np->netdev->dev, "%s: fix me for copying receiver.\n", 11020d160211SJeremy Fitzhardinge __func__); 11030d160211SJeremy Fitzhardinge return; 11040d160211SJeremy Fitzhardinge 11050d160211SJeremy Fitzhardinge skb_queue_head_init(&free_list); 11060d160211SJeremy Fitzhardinge 11070d160211SJeremy Fitzhardinge spin_lock_bh(&np->rx_lock); 11080d160211SJeremy Fitzhardinge 11090d160211SJeremy Fitzhardinge for (id = 0; id < NET_RX_RING_SIZE; id++) { 11100d160211SJeremy Fitzhardinge ref = np->grant_rx_ref[id]; 11110d160211SJeremy Fitzhardinge if (ref == GRANT_INVALID_REF) { 11120d160211SJeremy Fitzhardinge unused++; 11130d160211SJeremy Fitzhardinge continue; 11140d160211SJeremy Fitzhardinge } 11150d160211SJeremy Fitzhardinge 11160d160211SJeremy Fitzhardinge skb = np->rx_skbs[id]; 11170d160211SJeremy Fitzhardinge mfn = gnttab_end_foreign_transfer_ref(ref); 11180d160211SJeremy Fitzhardinge gnttab_release_grant_reference(&np->gref_rx_head, ref); 11190d160211SJeremy Fitzhardinge np->grant_rx_ref[id] = GRANT_INVALID_REF; 11200d160211SJeremy Fitzhardinge 11210d160211SJeremy Fitzhardinge if (0 == mfn) { 11220d160211SJeremy Fitzhardinge skb_shinfo(skb)->nr_frags = 0; 11230d160211SJeremy Fitzhardinge dev_kfree_skb(skb); 11240d160211SJeremy Fitzhardinge noxfer++; 11250d160211SJeremy Fitzhardinge continue; 11260d160211SJeremy Fitzhardinge } 11270d160211SJeremy Fitzhardinge 11280d160211SJeremy Fitzhardinge if (!xen_feature(XENFEAT_auto_translated_physmap)) { 11290d160211SJeremy Fitzhardinge /* Remap the page. */ 113001c68026SIan Campbell const struct page *page = 113101c68026SIan Campbell skb_frag_page(&skb_shinfo(skb)->frags[0]); 11320d160211SJeremy Fitzhardinge unsigned long pfn = page_to_pfn(page); 11330d160211SJeremy Fitzhardinge void *vaddr = page_address(page); 11340d160211SJeremy Fitzhardinge 11350d160211SJeremy Fitzhardinge MULTI_update_va_mapping(mcl, (unsigned long)vaddr, 11360d160211SJeremy Fitzhardinge mfn_pte(mfn, PAGE_KERNEL), 11370d160211SJeremy Fitzhardinge 0); 11380d160211SJeremy Fitzhardinge mcl++; 11390d160211SJeremy Fitzhardinge mmu->ptr = ((u64)mfn << PAGE_SHIFT) 11400d160211SJeremy Fitzhardinge | MMU_MACHPHYS_UPDATE; 11410d160211SJeremy Fitzhardinge mmu->val = pfn; 11420d160211SJeremy Fitzhardinge mmu++; 11430d160211SJeremy Fitzhardinge 11440d160211SJeremy Fitzhardinge set_phys_to_machine(pfn, mfn); 11450d160211SJeremy Fitzhardinge } 11460d160211SJeremy Fitzhardinge __skb_queue_tail(&free_list, skb); 11470d160211SJeremy Fitzhardinge xfer++; 11480d160211SJeremy Fitzhardinge } 11490d160211SJeremy Fitzhardinge 11500d160211SJeremy Fitzhardinge dev_info(&np->netdev->dev, "%s: %d xfer, %d noxfer, %d unused\n", 11510d160211SJeremy Fitzhardinge __func__, xfer, noxfer, unused); 11520d160211SJeremy Fitzhardinge 11530d160211SJeremy Fitzhardinge if (xfer) { 11540d160211SJeremy Fitzhardinge if (!xen_feature(XENFEAT_auto_translated_physmap)) { 11550d160211SJeremy Fitzhardinge /* Do all the remapping work and M2P updates. */ 11560d160211SJeremy Fitzhardinge MULTI_mmu_update(mcl, np->rx_mmu, mmu - np->rx_mmu, 115779ea13ceSAl Viro NULL, DOMID_SELF); 11580d160211SJeremy Fitzhardinge mcl++; 11590d160211SJeremy Fitzhardinge HYPERVISOR_multicall(np->rx_mcl, mcl - np->rx_mcl); 11600d160211SJeremy Fitzhardinge } 11610d160211SJeremy Fitzhardinge } 11620d160211SJeremy Fitzhardinge 116356cfe5d0SWang Chen __skb_queue_purge(&free_list); 11640d160211SJeremy Fitzhardinge 11650d160211SJeremy Fitzhardinge spin_unlock_bh(&np->rx_lock); 11660d160211SJeremy Fitzhardinge } 11670d160211SJeremy Fitzhardinge 11680d160211SJeremy Fitzhardinge static void xennet_uninit(struct net_device *dev) 11690d160211SJeremy Fitzhardinge { 11700d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 11710d160211SJeremy Fitzhardinge xennet_release_tx_bufs(np); 11720d160211SJeremy Fitzhardinge xennet_release_rx_bufs(np); 11730d160211SJeremy Fitzhardinge gnttab_free_grant_references(np->gref_tx_head); 11740d160211SJeremy Fitzhardinge gnttab_free_grant_references(np->gref_rx_head); 11750d160211SJeremy Fitzhardinge } 11760d160211SJeremy Fitzhardinge 1177c8f44affSMichał Mirosław static netdev_features_t xennet_fix_features(struct net_device *dev, 1178c8f44affSMichał Mirosław netdev_features_t features) 11798f7b01a1SEric Dumazet { 11808f7b01a1SEric Dumazet struct netfront_info *np = netdev_priv(dev); 11818f7b01a1SEric Dumazet int val; 11828f7b01a1SEric Dumazet 11838f7b01a1SEric Dumazet if (features & NETIF_F_SG) { 11848f7b01a1SEric Dumazet if (xenbus_scanf(XBT_NIL, np->xbdev->otherend, "feature-sg", 11858f7b01a1SEric Dumazet "%d", &val) < 0) 11868f7b01a1SEric Dumazet val = 0; 11878f7b01a1SEric Dumazet 11888f7b01a1SEric Dumazet if (!val) 11898f7b01a1SEric Dumazet features &= ~NETIF_F_SG; 11908f7b01a1SEric Dumazet } 11918f7b01a1SEric Dumazet 11928f7b01a1SEric Dumazet if (features & NETIF_F_TSO) { 11938f7b01a1SEric Dumazet if (xenbus_scanf(XBT_NIL, np->xbdev->otherend, 11948f7b01a1SEric Dumazet "feature-gso-tcpv4", "%d", &val) < 0) 11958f7b01a1SEric Dumazet val = 0; 11968f7b01a1SEric Dumazet 11978f7b01a1SEric Dumazet if (!val) 11988f7b01a1SEric Dumazet features &= ~NETIF_F_TSO; 11998f7b01a1SEric Dumazet } 12008f7b01a1SEric Dumazet 12018f7b01a1SEric Dumazet return features; 12028f7b01a1SEric Dumazet } 12038f7b01a1SEric Dumazet 1204c8f44affSMichał Mirosław static int xennet_set_features(struct net_device *dev, 1205c8f44affSMichał Mirosław netdev_features_t features) 12068f7b01a1SEric Dumazet { 12078f7b01a1SEric Dumazet if (!(features & NETIF_F_SG) && dev->mtu > ETH_DATA_LEN) { 12088f7b01a1SEric Dumazet netdev_info(dev, "Reducing MTU because no SG offload"); 12098f7b01a1SEric Dumazet dev->mtu = ETH_DATA_LEN; 12108f7b01a1SEric Dumazet } 12118f7b01a1SEric Dumazet 12128f7b01a1SEric Dumazet return 0; 12138f7b01a1SEric Dumazet } 12148f7b01a1SEric Dumazet 1215cf66f9d4SKonrad Rzeszutek Wilk static irqreturn_t xennet_interrupt(int irq, void *dev_id) 1216cf66f9d4SKonrad Rzeszutek Wilk { 1217cf66f9d4SKonrad Rzeszutek Wilk struct net_device *dev = dev_id; 1218cf66f9d4SKonrad Rzeszutek Wilk struct netfront_info *np = netdev_priv(dev); 1219cf66f9d4SKonrad Rzeszutek Wilk unsigned long flags; 1220cf66f9d4SKonrad Rzeszutek Wilk 1221cf66f9d4SKonrad Rzeszutek Wilk spin_lock_irqsave(&np->tx_lock, flags); 1222cf66f9d4SKonrad Rzeszutek Wilk 1223cf66f9d4SKonrad Rzeszutek Wilk if (likely(netif_carrier_ok(dev))) { 1224cf66f9d4SKonrad Rzeszutek Wilk xennet_tx_buf_gc(dev); 1225cf66f9d4SKonrad Rzeszutek Wilk /* Under tx_lock: protects access to rx shared-ring indexes. */ 1226cf66f9d4SKonrad Rzeszutek Wilk if (RING_HAS_UNCONSUMED_RESPONSES(&np->rx)) 1227cf66f9d4SKonrad Rzeszutek Wilk napi_schedule(&np->napi); 1228cf66f9d4SKonrad Rzeszutek Wilk } 1229cf66f9d4SKonrad Rzeszutek Wilk 1230cf66f9d4SKonrad Rzeszutek Wilk spin_unlock_irqrestore(&np->tx_lock, flags); 1231cf66f9d4SKonrad Rzeszutek Wilk 1232cf66f9d4SKonrad Rzeszutek Wilk return IRQ_HANDLED; 1233cf66f9d4SKonrad Rzeszutek Wilk } 1234cf66f9d4SKonrad Rzeszutek Wilk 1235cf66f9d4SKonrad Rzeszutek Wilk #ifdef CONFIG_NET_POLL_CONTROLLER 1236cf66f9d4SKonrad Rzeszutek Wilk static void xennet_poll_controller(struct net_device *dev) 1237cf66f9d4SKonrad Rzeszutek Wilk { 1238cf66f9d4SKonrad Rzeszutek Wilk xennet_interrupt(0, dev); 1239cf66f9d4SKonrad Rzeszutek Wilk } 1240cf66f9d4SKonrad Rzeszutek Wilk #endif 1241cf66f9d4SKonrad Rzeszutek Wilk 12420a0b9d2eSStephen Hemminger static const struct net_device_ops xennet_netdev_ops = { 12430a0b9d2eSStephen Hemminger .ndo_open = xennet_open, 12440a0b9d2eSStephen Hemminger .ndo_uninit = xennet_uninit, 12450a0b9d2eSStephen Hemminger .ndo_stop = xennet_close, 12460a0b9d2eSStephen Hemminger .ndo_start_xmit = xennet_start_xmit, 12470a0b9d2eSStephen Hemminger .ndo_change_mtu = xennet_change_mtu, 1248e00f85beSstephen hemminger .ndo_get_stats64 = xennet_get_stats64, 12490a0b9d2eSStephen Hemminger .ndo_set_mac_address = eth_mac_addr, 12500a0b9d2eSStephen Hemminger .ndo_validate_addr = eth_validate_addr, 1251fb507934SMichał Mirosław .ndo_fix_features = xennet_fix_features, 1252fb507934SMichał Mirosław .ndo_set_features = xennet_set_features, 1253cf66f9d4SKonrad Rzeszutek Wilk #ifdef CONFIG_NET_POLL_CONTROLLER 1254cf66f9d4SKonrad Rzeszutek Wilk .ndo_poll_controller = xennet_poll_controller, 1255cf66f9d4SKonrad Rzeszutek Wilk #endif 12560a0b9d2eSStephen Hemminger }; 12570a0b9d2eSStephen Hemminger 12580d160211SJeremy Fitzhardinge static struct net_device * __devinit xennet_create_dev(struct xenbus_device *dev) 12590d160211SJeremy Fitzhardinge { 12600d160211SJeremy Fitzhardinge int i, err; 12610d160211SJeremy Fitzhardinge struct net_device *netdev; 12620d160211SJeremy Fitzhardinge struct netfront_info *np; 12630d160211SJeremy Fitzhardinge 12640d160211SJeremy Fitzhardinge netdev = alloc_etherdev(sizeof(struct netfront_info)); 126541de8d4cSJoe Perches if (!netdev) 12660d160211SJeremy Fitzhardinge return ERR_PTR(-ENOMEM); 12670d160211SJeremy Fitzhardinge 12680d160211SJeremy Fitzhardinge np = netdev_priv(netdev); 12690d160211SJeremy Fitzhardinge np->xbdev = dev; 12700d160211SJeremy Fitzhardinge 12710d160211SJeremy Fitzhardinge spin_lock_init(&np->tx_lock); 12720d160211SJeremy Fitzhardinge spin_lock_init(&np->rx_lock); 12730d160211SJeremy Fitzhardinge 12740d160211SJeremy Fitzhardinge skb_queue_head_init(&np->rx_batch); 12750d160211SJeremy Fitzhardinge np->rx_target = RX_DFL_MIN_TARGET; 12760d160211SJeremy Fitzhardinge np->rx_min_target = RX_DFL_MIN_TARGET; 12770d160211SJeremy Fitzhardinge np->rx_max_target = RX_MAX_TARGET; 12780d160211SJeremy Fitzhardinge 12790d160211SJeremy Fitzhardinge init_timer(&np->rx_refill_timer); 12800d160211SJeremy Fitzhardinge np->rx_refill_timer.data = (unsigned long)netdev; 12810d160211SJeremy Fitzhardinge np->rx_refill_timer.function = rx_refill_timeout; 12820d160211SJeremy Fitzhardinge 1283e00f85beSstephen hemminger err = -ENOMEM; 1284e00f85beSstephen hemminger np->stats = alloc_percpu(struct netfront_stats); 1285e00f85beSstephen hemminger if (np->stats == NULL) 1286e00f85beSstephen hemminger goto exit; 1287e00f85beSstephen hemminger 12880d160211SJeremy Fitzhardinge /* Initialise tx_skbs as a free chain containing every entry. */ 12890d160211SJeremy Fitzhardinge np->tx_skb_freelist = 0; 12900d160211SJeremy Fitzhardinge for (i = 0; i < NET_TX_RING_SIZE; i++) { 12911ffb40b8SIsaku Yamahata skb_entry_set_link(&np->tx_skbs[i], i+1); 12920d160211SJeremy Fitzhardinge np->grant_tx_ref[i] = GRANT_INVALID_REF; 12930d160211SJeremy Fitzhardinge } 12940d160211SJeremy Fitzhardinge 12950d160211SJeremy Fitzhardinge /* Clear out rx_skbs */ 12960d160211SJeremy Fitzhardinge for (i = 0; i < NET_RX_RING_SIZE; i++) { 12970d160211SJeremy Fitzhardinge np->rx_skbs[i] = NULL; 12980d160211SJeremy Fitzhardinge np->grant_rx_ref[i] = GRANT_INVALID_REF; 12990d160211SJeremy Fitzhardinge } 13000d160211SJeremy Fitzhardinge 13010d160211SJeremy Fitzhardinge /* A grant for every tx ring slot */ 13020d160211SJeremy Fitzhardinge if (gnttab_alloc_grant_references(TX_MAX_TARGET, 13030d160211SJeremy Fitzhardinge &np->gref_tx_head) < 0) { 13040d160211SJeremy Fitzhardinge printk(KERN_ALERT "#### netfront can't alloc tx grant refs\n"); 13050d160211SJeremy Fitzhardinge err = -ENOMEM; 1306e00f85beSstephen hemminger goto exit_free_stats; 13070d160211SJeremy Fitzhardinge } 13080d160211SJeremy Fitzhardinge /* A grant for every rx ring slot */ 13090d160211SJeremy Fitzhardinge if (gnttab_alloc_grant_references(RX_MAX_TARGET, 13100d160211SJeremy Fitzhardinge &np->gref_rx_head) < 0) { 13110d160211SJeremy Fitzhardinge printk(KERN_ALERT "#### netfront can't alloc rx grant refs\n"); 13120d160211SJeremy Fitzhardinge err = -ENOMEM; 13130d160211SJeremy Fitzhardinge goto exit_free_tx; 13140d160211SJeremy Fitzhardinge } 13150d160211SJeremy Fitzhardinge 13160a0b9d2eSStephen Hemminger netdev->netdev_ops = &xennet_netdev_ops; 13170a0b9d2eSStephen Hemminger 1318bea3348eSStephen Hemminger netif_napi_add(netdev, &np->napi, xennet_poll, 64); 1319fb507934SMichał Mirosław netdev->features = NETIF_F_IP_CSUM | NETIF_F_RXCSUM | 1320fb507934SMichał Mirosław NETIF_F_GSO_ROBUST; 1321fb507934SMichał Mirosław netdev->hw_features = NETIF_F_IP_CSUM | NETIF_F_SG | NETIF_F_TSO; 13220d160211SJeremy Fitzhardinge 1323fc3e5941SIan Campbell /* 1324fc3e5941SIan Campbell * Assume that all hw features are available for now. This set 1325fc3e5941SIan Campbell * will be adjusted by the call to netdev_update_features() in 1326fc3e5941SIan Campbell * xennet_connect() which is the earliest point where we can 1327fc3e5941SIan Campbell * negotiate with the backend regarding supported features. 1328fc3e5941SIan Campbell */ 1329fc3e5941SIan Campbell netdev->features |= netdev->hw_features; 1330fc3e5941SIan Campbell 13310d160211SJeremy Fitzhardinge SET_ETHTOOL_OPS(netdev, &xennet_ethtool_ops); 13320d160211SJeremy Fitzhardinge SET_NETDEV_DEV(netdev, &dev->dev); 13330d160211SJeremy Fitzhardinge 13340d160211SJeremy Fitzhardinge np->netdev = netdev; 13350d160211SJeremy Fitzhardinge 13360d160211SJeremy Fitzhardinge netif_carrier_off(netdev); 13370d160211SJeremy Fitzhardinge 13380d160211SJeremy Fitzhardinge return netdev; 13390d160211SJeremy Fitzhardinge 13400d160211SJeremy Fitzhardinge exit_free_tx: 13410d160211SJeremy Fitzhardinge gnttab_free_grant_references(np->gref_tx_head); 1342e00f85beSstephen hemminger exit_free_stats: 1343e00f85beSstephen hemminger free_percpu(np->stats); 13440d160211SJeremy Fitzhardinge exit: 13450d160211SJeremy Fitzhardinge free_netdev(netdev); 13460d160211SJeremy Fitzhardinge return ERR_PTR(err); 13470d160211SJeremy Fitzhardinge } 13480d160211SJeremy Fitzhardinge 13490d160211SJeremy Fitzhardinge /** 13500d160211SJeremy Fitzhardinge * Entry point to this code when a new device is created. Allocate the basic 13510d160211SJeremy Fitzhardinge * structures and the ring buffers for communication with the backend, and 13520d160211SJeremy Fitzhardinge * inform the backend of the appropriate details for those. 13530d160211SJeremy Fitzhardinge */ 13540d160211SJeremy Fitzhardinge static int __devinit netfront_probe(struct xenbus_device *dev, 13550d160211SJeremy Fitzhardinge const struct xenbus_device_id *id) 13560d160211SJeremy Fitzhardinge { 13570d160211SJeremy Fitzhardinge int err; 13580d160211SJeremy Fitzhardinge struct net_device *netdev; 13590d160211SJeremy Fitzhardinge struct netfront_info *info; 13600d160211SJeremy Fitzhardinge 13610d160211SJeremy Fitzhardinge netdev = xennet_create_dev(dev); 13620d160211SJeremy Fitzhardinge if (IS_ERR(netdev)) { 13630d160211SJeremy Fitzhardinge err = PTR_ERR(netdev); 13640d160211SJeremy Fitzhardinge xenbus_dev_fatal(dev, err, "creating netdev"); 13650d160211SJeremy Fitzhardinge return err; 13660d160211SJeremy Fitzhardinge } 13670d160211SJeremy Fitzhardinge 13680d160211SJeremy Fitzhardinge info = netdev_priv(netdev); 13691b713e00SGreg Kroah-Hartman dev_set_drvdata(&dev->dev, info); 13700d160211SJeremy Fitzhardinge 13710d160211SJeremy Fitzhardinge err = register_netdev(info->netdev); 13720d160211SJeremy Fitzhardinge if (err) { 13730d160211SJeremy Fitzhardinge printk(KERN_WARNING "%s: register_netdev err=%d\n", 13740d160211SJeremy Fitzhardinge __func__, err); 13750d160211SJeremy Fitzhardinge goto fail; 13760d160211SJeremy Fitzhardinge } 13770d160211SJeremy Fitzhardinge 13780d160211SJeremy Fitzhardinge err = xennet_sysfs_addif(info->netdev); 13790d160211SJeremy Fitzhardinge if (err) { 13800d160211SJeremy Fitzhardinge unregister_netdev(info->netdev); 13810d160211SJeremy Fitzhardinge printk(KERN_WARNING "%s: add sysfs failed err=%d\n", 13820d160211SJeremy Fitzhardinge __func__, err); 13830d160211SJeremy Fitzhardinge goto fail; 13840d160211SJeremy Fitzhardinge } 13850d160211SJeremy Fitzhardinge 13860d160211SJeremy Fitzhardinge return 0; 13870d160211SJeremy Fitzhardinge 13880d160211SJeremy Fitzhardinge fail: 13890d160211SJeremy Fitzhardinge free_netdev(netdev); 13901b713e00SGreg Kroah-Hartman dev_set_drvdata(&dev->dev, NULL); 13910d160211SJeremy Fitzhardinge return err; 13920d160211SJeremy Fitzhardinge } 13930d160211SJeremy Fitzhardinge 13940d160211SJeremy Fitzhardinge static void xennet_end_access(int ref, void *page) 13950d160211SJeremy Fitzhardinge { 13960d160211SJeremy Fitzhardinge /* This frees the page as a side-effect */ 13970d160211SJeremy Fitzhardinge if (ref != GRANT_INVALID_REF) 13980d160211SJeremy Fitzhardinge gnttab_end_foreign_access(ref, 0, (unsigned long)page); 13990d160211SJeremy Fitzhardinge } 14000d160211SJeremy Fitzhardinge 14010d160211SJeremy Fitzhardinge static void xennet_disconnect_backend(struct netfront_info *info) 14020d160211SJeremy Fitzhardinge { 14030d160211SJeremy Fitzhardinge /* Stop old i/f to prevent errors whilst we rebuild the state. */ 14040d160211SJeremy Fitzhardinge spin_lock_bh(&info->rx_lock); 14050d160211SJeremy Fitzhardinge spin_lock_irq(&info->tx_lock); 14060d160211SJeremy Fitzhardinge netif_carrier_off(info->netdev); 14070d160211SJeremy Fitzhardinge spin_unlock_irq(&info->tx_lock); 14080d160211SJeremy Fitzhardinge spin_unlock_bh(&info->rx_lock); 14090d160211SJeremy Fitzhardinge 14100d160211SJeremy Fitzhardinge if (info->netdev->irq) 14110d160211SJeremy Fitzhardinge unbind_from_irqhandler(info->netdev->irq, info->netdev); 14120d160211SJeremy Fitzhardinge info->evtchn = info->netdev->irq = 0; 14130d160211SJeremy Fitzhardinge 14140d160211SJeremy Fitzhardinge /* End access and free the pages */ 14150d160211SJeremy Fitzhardinge xennet_end_access(info->tx_ring_ref, info->tx.sring); 14160d160211SJeremy Fitzhardinge xennet_end_access(info->rx_ring_ref, info->rx.sring); 14170d160211SJeremy Fitzhardinge 14180d160211SJeremy Fitzhardinge info->tx_ring_ref = GRANT_INVALID_REF; 14190d160211SJeremy Fitzhardinge info->rx_ring_ref = GRANT_INVALID_REF; 14200d160211SJeremy Fitzhardinge info->tx.sring = NULL; 14210d160211SJeremy Fitzhardinge info->rx.sring = NULL; 14220d160211SJeremy Fitzhardinge } 14230d160211SJeremy Fitzhardinge 14240d160211SJeremy Fitzhardinge /** 14250d160211SJeremy Fitzhardinge * We are reconnecting to the backend, due to a suspend/resume, or a backend 14260d160211SJeremy Fitzhardinge * driver restart. We tear down our netif structure and recreate it, but 14270d160211SJeremy Fitzhardinge * leave the device-layer structures intact so that this is transparent to the 14280d160211SJeremy Fitzhardinge * rest of the kernel. 14290d160211SJeremy Fitzhardinge */ 14300d160211SJeremy Fitzhardinge static int netfront_resume(struct xenbus_device *dev) 14310d160211SJeremy Fitzhardinge { 14321b713e00SGreg Kroah-Hartman struct netfront_info *info = dev_get_drvdata(&dev->dev); 14330d160211SJeremy Fitzhardinge 14340d160211SJeremy Fitzhardinge dev_dbg(&dev->dev, "%s\n", dev->nodename); 14350d160211SJeremy Fitzhardinge 14360d160211SJeremy Fitzhardinge xennet_disconnect_backend(info); 14370d160211SJeremy Fitzhardinge return 0; 14380d160211SJeremy Fitzhardinge } 14390d160211SJeremy Fitzhardinge 14400d160211SJeremy Fitzhardinge static int xen_net_read_mac(struct xenbus_device *dev, u8 mac[]) 14410d160211SJeremy Fitzhardinge { 14420d160211SJeremy Fitzhardinge char *s, *e, *macstr; 14430d160211SJeremy Fitzhardinge int i; 14440d160211SJeremy Fitzhardinge 14450d160211SJeremy Fitzhardinge macstr = s = xenbus_read(XBT_NIL, dev->nodename, "mac", NULL); 14460d160211SJeremy Fitzhardinge if (IS_ERR(macstr)) 14470d160211SJeremy Fitzhardinge return PTR_ERR(macstr); 14480d160211SJeremy Fitzhardinge 14490d160211SJeremy Fitzhardinge for (i = 0; i < ETH_ALEN; i++) { 14500d160211SJeremy Fitzhardinge mac[i] = simple_strtoul(s, &e, 16); 14510d160211SJeremy Fitzhardinge if ((s == e) || (*e != ((i == ETH_ALEN-1) ? '\0' : ':'))) { 14520d160211SJeremy Fitzhardinge kfree(macstr); 14530d160211SJeremy Fitzhardinge return -ENOENT; 14540d160211SJeremy Fitzhardinge } 14550d160211SJeremy Fitzhardinge s = e+1; 14560d160211SJeremy Fitzhardinge } 14570d160211SJeremy Fitzhardinge 14580d160211SJeremy Fitzhardinge kfree(macstr); 14590d160211SJeremy Fitzhardinge return 0; 14600d160211SJeremy Fitzhardinge } 14610d160211SJeremy Fitzhardinge 14620d160211SJeremy Fitzhardinge static int setup_netfront(struct xenbus_device *dev, struct netfront_info *info) 14630d160211SJeremy Fitzhardinge { 14640d160211SJeremy Fitzhardinge struct xen_netif_tx_sring *txs; 14650d160211SJeremy Fitzhardinge struct xen_netif_rx_sring *rxs; 14660d160211SJeremy Fitzhardinge int err; 14670d160211SJeremy Fitzhardinge struct net_device *netdev = info->netdev; 14680d160211SJeremy Fitzhardinge 14690d160211SJeremy Fitzhardinge info->tx_ring_ref = GRANT_INVALID_REF; 14700d160211SJeremy Fitzhardinge info->rx_ring_ref = GRANT_INVALID_REF; 14710d160211SJeremy Fitzhardinge info->rx.sring = NULL; 14720d160211SJeremy Fitzhardinge info->tx.sring = NULL; 14730d160211SJeremy Fitzhardinge netdev->irq = 0; 14740d160211SJeremy Fitzhardinge 14750d160211SJeremy Fitzhardinge err = xen_net_read_mac(dev, netdev->dev_addr); 14760d160211SJeremy Fitzhardinge if (err) { 14770d160211SJeremy Fitzhardinge xenbus_dev_fatal(dev, err, "parsing %s/mac", dev->nodename); 14780d160211SJeremy Fitzhardinge goto fail; 14790d160211SJeremy Fitzhardinge } 14800d160211SJeremy Fitzhardinge 1481a144ff09SIan Campbell txs = (struct xen_netif_tx_sring *)get_zeroed_page(GFP_NOIO | __GFP_HIGH); 14820d160211SJeremy Fitzhardinge if (!txs) { 14830d160211SJeremy Fitzhardinge err = -ENOMEM; 14840d160211SJeremy Fitzhardinge xenbus_dev_fatal(dev, err, "allocating tx ring page"); 14850d160211SJeremy Fitzhardinge goto fail; 14860d160211SJeremy Fitzhardinge } 14870d160211SJeremy Fitzhardinge SHARED_RING_INIT(txs); 14880d160211SJeremy Fitzhardinge FRONT_RING_INIT(&info->tx, txs, PAGE_SIZE); 14890d160211SJeremy Fitzhardinge 14900d160211SJeremy Fitzhardinge err = xenbus_grant_ring(dev, virt_to_mfn(txs)); 14910d160211SJeremy Fitzhardinge if (err < 0) { 14920d160211SJeremy Fitzhardinge free_page((unsigned long)txs); 14930d160211SJeremy Fitzhardinge goto fail; 14940d160211SJeremy Fitzhardinge } 14950d160211SJeremy Fitzhardinge 14960d160211SJeremy Fitzhardinge info->tx_ring_ref = err; 1497a144ff09SIan Campbell rxs = (struct xen_netif_rx_sring *)get_zeroed_page(GFP_NOIO | __GFP_HIGH); 14980d160211SJeremy Fitzhardinge if (!rxs) { 14990d160211SJeremy Fitzhardinge err = -ENOMEM; 15000d160211SJeremy Fitzhardinge xenbus_dev_fatal(dev, err, "allocating rx ring page"); 15010d160211SJeremy Fitzhardinge goto fail; 15020d160211SJeremy Fitzhardinge } 15030d160211SJeremy Fitzhardinge SHARED_RING_INIT(rxs); 15040d160211SJeremy Fitzhardinge FRONT_RING_INIT(&info->rx, rxs, PAGE_SIZE); 15050d160211SJeremy Fitzhardinge 15060d160211SJeremy Fitzhardinge err = xenbus_grant_ring(dev, virt_to_mfn(rxs)); 15070d160211SJeremy Fitzhardinge if (err < 0) { 15080d160211SJeremy Fitzhardinge free_page((unsigned long)rxs); 15090d160211SJeremy Fitzhardinge goto fail; 15100d160211SJeremy Fitzhardinge } 15110d160211SJeremy Fitzhardinge info->rx_ring_ref = err; 15120d160211SJeremy Fitzhardinge 15130d160211SJeremy Fitzhardinge err = xenbus_alloc_evtchn(dev, &info->evtchn); 15140d160211SJeremy Fitzhardinge if (err) 15150d160211SJeremy Fitzhardinge goto fail; 15160d160211SJeremy Fitzhardinge 15170d160211SJeremy Fitzhardinge err = bind_evtchn_to_irqhandler(info->evtchn, xennet_interrupt, 1518ab392d2dSJavier Martinez Canillas 0, netdev->name, netdev); 15190d160211SJeremy Fitzhardinge if (err < 0) 15200d160211SJeremy Fitzhardinge goto fail; 15210d160211SJeremy Fitzhardinge netdev->irq = err; 15220d160211SJeremy Fitzhardinge return 0; 15230d160211SJeremy Fitzhardinge 15240d160211SJeremy Fitzhardinge fail: 15250d160211SJeremy Fitzhardinge return err; 15260d160211SJeremy Fitzhardinge } 15270d160211SJeremy Fitzhardinge 15280d160211SJeremy Fitzhardinge /* Common code used when first setting up, and when resuming. */ 1529f502bf2bSIan Campbell static int talk_to_netback(struct xenbus_device *dev, 15300d160211SJeremy Fitzhardinge struct netfront_info *info) 15310d160211SJeremy Fitzhardinge { 15320d160211SJeremy Fitzhardinge const char *message; 15330d160211SJeremy Fitzhardinge struct xenbus_transaction xbt; 15340d160211SJeremy Fitzhardinge int err; 15350d160211SJeremy Fitzhardinge 15360d160211SJeremy Fitzhardinge /* Create shared ring, alloc event channel. */ 15370d160211SJeremy Fitzhardinge err = setup_netfront(dev, info); 15380d160211SJeremy Fitzhardinge if (err) 15390d160211SJeremy Fitzhardinge goto out; 15400d160211SJeremy Fitzhardinge 15410d160211SJeremy Fitzhardinge again: 15420d160211SJeremy Fitzhardinge err = xenbus_transaction_start(&xbt); 15430d160211SJeremy Fitzhardinge if (err) { 15440d160211SJeremy Fitzhardinge xenbus_dev_fatal(dev, err, "starting transaction"); 15450d160211SJeremy Fitzhardinge goto destroy_ring; 15460d160211SJeremy Fitzhardinge } 15470d160211SJeremy Fitzhardinge 15480d160211SJeremy Fitzhardinge err = xenbus_printf(xbt, dev->nodename, "tx-ring-ref", "%u", 15490d160211SJeremy Fitzhardinge info->tx_ring_ref); 15500d160211SJeremy Fitzhardinge if (err) { 15510d160211SJeremy Fitzhardinge message = "writing tx ring-ref"; 15520d160211SJeremy Fitzhardinge goto abort_transaction; 15530d160211SJeremy Fitzhardinge } 15540d160211SJeremy Fitzhardinge err = xenbus_printf(xbt, dev->nodename, "rx-ring-ref", "%u", 15550d160211SJeremy Fitzhardinge info->rx_ring_ref); 15560d160211SJeremy Fitzhardinge if (err) { 15570d160211SJeremy Fitzhardinge message = "writing rx ring-ref"; 15580d160211SJeremy Fitzhardinge goto abort_transaction; 15590d160211SJeremy Fitzhardinge } 15600d160211SJeremy Fitzhardinge err = xenbus_printf(xbt, dev->nodename, 15610d160211SJeremy Fitzhardinge "event-channel", "%u", info->evtchn); 15620d160211SJeremy Fitzhardinge if (err) { 15630d160211SJeremy Fitzhardinge message = "writing event-channel"; 15640d160211SJeremy Fitzhardinge goto abort_transaction; 15650d160211SJeremy Fitzhardinge } 15660d160211SJeremy Fitzhardinge 15670d160211SJeremy Fitzhardinge err = xenbus_printf(xbt, dev->nodename, "request-rx-copy", "%u", 15680d160211SJeremy Fitzhardinge 1); 15690d160211SJeremy Fitzhardinge if (err) { 15700d160211SJeremy Fitzhardinge message = "writing request-rx-copy"; 15710d160211SJeremy Fitzhardinge goto abort_transaction; 15720d160211SJeremy Fitzhardinge } 15730d160211SJeremy Fitzhardinge 15740d160211SJeremy Fitzhardinge err = xenbus_printf(xbt, dev->nodename, "feature-rx-notify", "%d", 1); 15750d160211SJeremy Fitzhardinge if (err) { 15760d160211SJeremy Fitzhardinge message = "writing feature-rx-notify"; 15770d160211SJeremy Fitzhardinge goto abort_transaction; 15780d160211SJeremy Fitzhardinge } 15790d160211SJeremy Fitzhardinge 15800d160211SJeremy Fitzhardinge err = xenbus_printf(xbt, dev->nodename, "feature-sg", "%d", 1); 15810d160211SJeremy Fitzhardinge if (err) { 15820d160211SJeremy Fitzhardinge message = "writing feature-sg"; 15830d160211SJeremy Fitzhardinge goto abort_transaction; 15840d160211SJeremy Fitzhardinge } 15850d160211SJeremy Fitzhardinge 15860d160211SJeremy Fitzhardinge err = xenbus_printf(xbt, dev->nodename, "feature-gso-tcpv4", "%d", 1); 15870d160211SJeremy Fitzhardinge if (err) { 15880d160211SJeremy Fitzhardinge message = "writing feature-gso-tcpv4"; 15890d160211SJeremy Fitzhardinge goto abort_transaction; 15900d160211SJeremy Fitzhardinge } 15910d160211SJeremy Fitzhardinge 15920d160211SJeremy Fitzhardinge err = xenbus_transaction_end(xbt, 0); 15930d160211SJeremy Fitzhardinge if (err) { 15940d160211SJeremy Fitzhardinge if (err == -EAGAIN) 15950d160211SJeremy Fitzhardinge goto again; 15960d160211SJeremy Fitzhardinge xenbus_dev_fatal(dev, err, "completing transaction"); 15970d160211SJeremy Fitzhardinge goto destroy_ring; 15980d160211SJeremy Fitzhardinge } 15990d160211SJeremy Fitzhardinge 16000d160211SJeremy Fitzhardinge return 0; 16010d160211SJeremy Fitzhardinge 16020d160211SJeremy Fitzhardinge abort_transaction: 16030d160211SJeremy Fitzhardinge xenbus_transaction_end(xbt, 1); 16040d160211SJeremy Fitzhardinge xenbus_dev_fatal(dev, err, "%s", message); 16050d160211SJeremy Fitzhardinge destroy_ring: 16060d160211SJeremy Fitzhardinge xennet_disconnect_backend(info); 16070d160211SJeremy Fitzhardinge out: 16080d160211SJeremy Fitzhardinge return err; 16090d160211SJeremy Fitzhardinge } 16100d160211SJeremy Fitzhardinge 16110d160211SJeremy Fitzhardinge static int xennet_connect(struct net_device *dev) 16120d160211SJeremy Fitzhardinge { 16130d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(dev); 16140d160211SJeremy Fitzhardinge int i, requeue_idx, err; 16150d160211SJeremy Fitzhardinge struct sk_buff *skb; 16160d160211SJeremy Fitzhardinge grant_ref_t ref; 16170d160211SJeremy Fitzhardinge struct xen_netif_rx_request *req; 16180d160211SJeremy Fitzhardinge unsigned int feature_rx_copy; 16190d160211SJeremy Fitzhardinge 16200d160211SJeremy Fitzhardinge err = xenbus_scanf(XBT_NIL, np->xbdev->otherend, 16210d160211SJeremy Fitzhardinge "feature-rx-copy", "%u", &feature_rx_copy); 16220d160211SJeremy Fitzhardinge if (err != 1) 16230d160211SJeremy Fitzhardinge feature_rx_copy = 0; 16240d160211SJeremy Fitzhardinge 16250d160211SJeremy Fitzhardinge if (!feature_rx_copy) { 16260d160211SJeremy Fitzhardinge dev_info(&dev->dev, 1627898eb71cSJoe Perches "backend does not support copying receive path\n"); 16280d160211SJeremy Fitzhardinge return -ENODEV; 16290d160211SJeremy Fitzhardinge } 16300d160211SJeremy Fitzhardinge 1631f502bf2bSIan Campbell err = talk_to_netback(np->xbdev, np); 16320d160211SJeremy Fitzhardinge if (err) 16330d160211SJeremy Fitzhardinge return err; 16340d160211SJeremy Fitzhardinge 16351ba37c51SIan Campbell rtnl_lock(); 1636fb507934SMichał Mirosław netdev_update_features(dev); 16371ba37c51SIan Campbell rtnl_unlock(); 16380d160211SJeremy Fitzhardinge 16390d160211SJeremy Fitzhardinge spin_lock_bh(&np->rx_lock); 16400d160211SJeremy Fitzhardinge spin_lock_irq(&np->tx_lock); 16410d160211SJeremy Fitzhardinge 16420d160211SJeremy Fitzhardinge /* Step 1: Discard all pending TX packet fragments. */ 16430d160211SJeremy Fitzhardinge xennet_release_tx_bufs(np); 16440d160211SJeremy Fitzhardinge 16450d160211SJeremy Fitzhardinge /* Step 2: Rebuild the RX buffer freelist and the RX ring itself. */ 16460d160211SJeremy Fitzhardinge for (requeue_idx = 0, i = 0; i < NET_RX_RING_SIZE; i++) { 164701c68026SIan Campbell skb_frag_t *frag; 164801c68026SIan Campbell const struct page *page; 16490d160211SJeremy Fitzhardinge if (!np->rx_skbs[i]) 16500d160211SJeremy Fitzhardinge continue; 16510d160211SJeremy Fitzhardinge 16520d160211SJeremy Fitzhardinge skb = np->rx_skbs[requeue_idx] = xennet_get_rx_skb(np, i); 16530d160211SJeremy Fitzhardinge ref = np->grant_rx_ref[requeue_idx] = xennet_get_rx_ref(np, i); 16540d160211SJeremy Fitzhardinge req = RING_GET_REQUEST(&np->rx, requeue_idx); 16550d160211SJeremy Fitzhardinge 165601c68026SIan Campbell frag = &skb_shinfo(skb)->frags[0]; 165701c68026SIan Campbell page = skb_frag_page(frag); 16580d160211SJeremy Fitzhardinge gnttab_grant_foreign_access_ref( 16590d160211SJeremy Fitzhardinge ref, np->xbdev->otherend_id, 166001c68026SIan Campbell pfn_to_mfn(page_to_pfn(page)), 16610d160211SJeremy Fitzhardinge 0); 16620d160211SJeremy Fitzhardinge req->gref = ref; 16630d160211SJeremy Fitzhardinge req->id = requeue_idx; 16640d160211SJeremy Fitzhardinge 16650d160211SJeremy Fitzhardinge requeue_idx++; 16660d160211SJeremy Fitzhardinge } 16670d160211SJeremy Fitzhardinge 16680d160211SJeremy Fitzhardinge np->rx.req_prod_pvt = requeue_idx; 16690d160211SJeremy Fitzhardinge 16700d160211SJeremy Fitzhardinge /* 16710d160211SJeremy Fitzhardinge * Step 3: All public and private state should now be sane. Get 16720d160211SJeremy Fitzhardinge * ready to start sending and receiving packets and give the driver 16730d160211SJeremy Fitzhardinge * domain a kick because we've probably just requeued some 16740d160211SJeremy Fitzhardinge * packets. 16750d160211SJeremy Fitzhardinge */ 16760d160211SJeremy Fitzhardinge netif_carrier_on(np->netdev); 16770d160211SJeremy Fitzhardinge notify_remote_via_irq(np->netdev->irq); 16780d160211SJeremy Fitzhardinge xennet_tx_buf_gc(dev); 16790d160211SJeremy Fitzhardinge xennet_alloc_rx_buffers(dev); 16800d160211SJeremy Fitzhardinge 16810d160211SJeremy Fitzhardinge spin_unlock_irq(&np->tx_lock); 16820d160211SJeremy Fitzhardinge spin_unlock_bh(&np->rx_lock); 16830d160211SJeremy Fitzhardinge 16840d160211SJeremy Fitzhardinge return 0; 16850d160211SJeremy Fitzhardinge } 16860d160211SJeremy Fitzhardinge 16870d160211SJeremy Fitzhardinge /** 16880d160211SJeremy Fitzhardinge * Callback received when the backend's state changes. 16890d160211SJeremy Fitzhardinge */ 1690f502bf2bSIan Campbell static void netback_changed(struct xenbus_device *dev, 16910d160211SJeremy Fitzhardinge enum xenbus_state backend_state) 16920d160211SJeremy Fitzhardinge { 16931b713e00SGreg Kroah-Hartman struct netfront_info *np = dev_get_drvdata(&dev->dev); 16940d160211SJeremy Fitzhardinge struct net_device *netdev = np->netdev; 16950d160211SJeremy Fitzhardinge 16960d160211SJeremy Fitzhardinge dev_dbg(&dev->dev, "%s\n", xenbus_strstate(backend_state)); 16970d160211SJeremy Fitzhardinge 16980d160211SJeremy Fitzhardinge switch (backend_state) { 16990d160211SJeremy Fitzhardinge case XenbusStateInitialising: 17000d160211SJeremy Fitzhardinge case XenbusStateInitialised: 1701b78c9512SNoboru Iwamatsu case XenbusStateReconfiguring: 1702b78c9512SNoboru Iwamatsu case XenbusStateReconfigured: 17030d160211SJeremy Fitzhardinge case XenbusStateUnknown: 17040d160211SJeremy Fitzhardinge case XenbusStateClosed: 17050d160211SJeremy Fitzhardinge break; 17060d160211SJeremy Fitzhardinge 17070d160211SJeremy Fitzhardinge case XenbusStateInitWait: 17080d160211SJeremy Fitzhardinge if (dev->state != XenbusStateInitialising) 17090d160211SJeremy Fitzhardinge break; 17100d160211SJeremy Fitzhardinge if (xennet_connect(netdev) != 0) 17110d160211SJeremy Fitzhardinge break; 17120d160211SJeremy Fitzhardinge xenbus_switch_state(dev, XenbusStateConnected); 171308e34eb1SLaszlo Ersek break; 171408e34eb1SLaszlo Ersek 171508e34eb1SLaszlo Ersek case XenbusStateConnected: 171659297067SIan Campbell netif_notify_peers(netdev); 17170d160211SJeremy Fitzhardinge break; 17180d160211SJeremy Fitzhardinge 17190d160211SJeremy Fitzhardinge case XenbusStateClosing: 17200d160211SJeremy Fitzhardinge xenbus_frontend_closed(dev); 17210d160211SJeremy Fitzhardinge break; 17220d160211SJeremy Fitzhardinge } 17230d160211SJeremy Fitzhardinge } 17240d160211SJeremy Fitzhardinge 1725e0ce4af9SIan Campbell static const struct xennet_stat { 1726e0ce4af9SIan Campbell char name[ETH_GSTRING_LEN]; 1727e0ce4af9SIan Campbell u16 offset; 1728e0ce4af9SIan Campbell } xennet_stats[] = { 1729e0ce4af9SIan Campbell { 1730e0ce4af9SIan Campbell "rx_gso_checksum_fixup", 1731e0ce4af9SIan Campbell offsetof(struct netfront_info, rx_gso_checksum_fixup) 1732e0ce4af9SIan Campbell }, 1733e0ce4af9SIan Campbell }; 1734e0ce4af9SIan Campbell 1735e0ce4af9SIan Campbell static int xennet_get_sset_count(struct net_device *dev, int string_set) 1736e0ce4af9SIan Campbell { 1737e0ce4af9SIan Campbell switch (string_set) { 1738e0ce4af9SIan Campbell case ETH_SS_STATS: 1739e0ce4af9SIan Campbell return ARRAY_SIZE(xennet_stats); 1740e0ce4af9SIan Campbell default: 1741e0ce4af9SIan Campbell return -EINVAL; 1742e0ce4af9SIan Campbell } 1743e0ce4af9SIan Campbell } 1744e0ce4af9SIan Campbell 1745e0ce4af9SIan Campbell static void xennet_get_ethtool_stats(struct net_device *dev, 1746e0ce4af9SIan Campbell struct ethtool_stats *stats, u64 * data) 1747e0ce4af9SIan Campbell { 1748e0ce4af9SIan Campbell void *np = netdev_priv(dev); 1749e0ce4af9SIan Campbell int i; 1750e0ce4af9SIan Campbell 1751e0ce4af9SIan Campbell for (i = 0; i < ARRAY_SIZE(xennet_stats); i++) 175248f26d51SEric Dumazet data[i] = *(unsigned long *)(np + xennet_stats[i].offset); 1753e0ce4af9SIan Campbell } 1754e0ce4af9SIan Campbell 1755e0ce4af9SIan Campbell static void xennet_get_strings(struct net_device *dev, u32 stringset, u8 * data) 1756e0ce4af9SIan Campbell { 1757e0ce4af9SIan Campbell int i; 1758e0ce4af9SIan Campbell 1759e0ce4af9SIan Campbell switch (stringset) { 1760e0ce4af9SIan Campbell case ETH_SS_STATS: 1761e0ce4af9SIan Campbell for (i = 0; i < ARRAY_SIZE(xennet_stats); i++) 1762e0ce4af9SIan Campbell memcpy(data + i * ETH_GSTRING_LEN, 1763e0ce4af9SIan Campbell xennet_stats[i].name, ETH_GSTRING_LEN); 1764e0ce4af9SIan Campbell break; 1765e0ce4af9SIan Campbell } 1766e0ce4af9SIan Campbell } 1767e0ce4af9SIan Campbell 17680fc0b732SStephen Hemminger static const struct ethtool_ops xennet_ethtool_ops = 17690d160211SJeremy Fitzhardinge { 17700d160211SJeremy Fitzhardinge .get_link = ethtool_op_get_link, 1771e0ce4af9SIan Campbell 1772e0ce4af9SIan Campbell .get_sset_count = xennet_get_sset_count, 1773e0ce4af9SIan Campbell .get_ethtool_stats = xennet_get_ethtool_stats, 1774e0ce4af9SIan Campbell .get_strings = xennet_get_strings, 17750d160211SJeremy Fitzhardinge }; 17760d160211SJeremy Fitzhardinge 17770d160211SJeremy Fitzhardinge #ifdef CONFIG_SYSFS 17780d160211SJeremy Fitzhardinge static ssize_t show_rxbuf_min(struct device *dev, 17790d160211SJeremy Fitzhardinge struct device_attribute *attr, char *buf) 17800d160211SJeremy Fitzhardinge { 17810d160211SJeremy Fitzhardinge struct net_device *netdev = to_net_dev(dev); 17820d160211SJeremy Fitzhardinge struct netfront_info *info = netdev_priv(netdev); 17830d160211SJeremy Fitzhardinge 17840d160211SJeremy Fitzhardinge return sprintf(buf, "%u\n", info->rx_min_target); 17850d160211SJeremy Fitzhardinge } 17860d160211SJeremy Fitzhardinge 17870d160211SJeremy Fitzhardinge static ssize_t store_rxbuf_min(struct device *dev, 17880d160211SJeremy Fitzhardinge struct device_attribute *attr, 17890d160211SJeremy Fitzhardinge const char *buf, size_t len) 17900d160211SJeremy Fitzhardinge { 17910d160211SJeremy Fitzhardinge struct net_device *netdev = to_net_dev(dev); 17920d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(netdev); 17930d160211SJeremy Fitzhardinge char *endp; 17940d160211SJeremy Fitzhardinge unsigned long target; 17950d160211SJeremy Fitzhardinge 17960d160211SJeremy Fitzhardinge if (!capable(CAP_NET_ADMIN)) 17970d160211SJeremy Fitzhardinge return -EPERM; 17980d160211SJeremy Fitzhardinge 17990d160211SJeremy Fitzhardinge target = simple_strtoul(buf, &endp, 0); 18000d160211SJeremy Fitzhardinge if (endp == buf) 18010d160211SJeremy Fitzhardinge return -EBADMSG; 18020d160211SJeremy Fitzhardinge 18030d160211SJeremy Fitzhardinge if (target < RX_MIN_TARGET) 18040d160211SJeremy Fitzhardinge target = RX_MIN_TARGET; 18050d160211SJeremy Fitzhardinge if (target > RX_MAX_TARGET) 18060d160211SJeremy Fitzhardinge target = RX_MAX_TARGET; 18070d160211SJeremy Fitzhardinge 18080d160211SJeremy Fitzhardinge spin_lock_bh(&np->rx_lock); 18090d160211SJeremy Fitzhardinge if (target > np->rx_max_target) 18100d160211SJeremy Fitzhardinge np->rx_max_target = target; 18110d160211SJeremy Fitzhardinge np->rx_min_target = target; 18120d160211SJeremy Fitzhardinge if (target > np->rx_target) 18130d160211SJeremy Fitzhardinge np->rx_target = target; 18140d160211SJeremy Fitzhardinge 18150d160211SJeremy Fitzhardinge xennet_alloc_rx_buffers(netdev); 18160d160211SJeremy Fitzhardinge 18170d160211SJeremy Fitzhardinge spin_unlock_bh(&np->rx_lock); 18180d160211SJeremy Fitzhardinge return len; 18190d160211SJeremy Fitzhardinge } 18200d160211SJeremy Fitzhardinge 18210d160211SJeremy Fitzhardinge static ssize_t show_rxbuf_max(struct device *dev, 18220d160211SJeremy Fitzhardinge struct device_attribute *attr, char *buf) 18230d160211SJeremy Fitzhardinge { 18240d160211SJeremy Fitzhardinge struct net_device *netdev = to_net_dev(dev); 18250d160211SJeremy Fitzhardinge struct netfront_info *info = netdev_priv(netdev); 18260d160211SJeremy Fitzhardinge 18270d160211SJeremy Fitzhardinge return sprintf(buf, "%u\n", info->rx_max_target); 18280d160211SJeremy Fitzhardinge } 18290d160211SJeremy Fitzhardinge 18300d160211SJeremy Fitzhardinge static ssize_t store_rxbuf_max(struct device *dev, 18310d160211SJeremy Fitzhardinge struct device_attribute *attr, 18320d160211SJeremy Fitzhardinge const char *buf, size_t len) 18330d160211SJeremy Fitzhardinge { 18340d160211SJeremy Fitzhardinge struct net_device *netdev = to_net_dev(dev); 18350d160211SJeremy Fitzhardinge struct netfront_info *np = netdev_priv(netdev); 18360d160211SJeremy Fitzhardinge char *endp; 18370d160211SJeremy Fitzhardinge unsigned long target; 18380d160211SJeremy Fitzhardinge 18390d160211SJeremy Fitzhardinge if (!capable(CAP_NET_ADMIN)) 18400d160211SJeremy Fitzhardinge return -EPERM; 18410d160211SJeremy Fitzhardinge 18420d160211SJeremy Fitzhardinge target = simple_strtoul(buf, &endp, 0); 18430d160211SJeremy Fitzhardinge if (endp == buf) 18440d160211SJeremy Fitzhardinge return -EBADMSG; 18450d160211SJeremy Fitzhardinge 18460d160211SJeremy Fitzhardinge if (target < RX_MIN_TARGET) 18470d160211SJeremy Fitzhardinge target = RX_MIN_TARGET; 18480d160211SJeremy Fitzhardinge if (target > RX_MAX_TARGET) 18490d160211SJeremy Fitzhardinge target = RX_MAX_TARGET; 18500d160211SJeremy Fitzhardinge 18510d160211SJeremy Fitzhardinge spin_lock_bh(&np->rx_lock); 18520d160211SJeremy Fitzhardinge if (target < np->rx_min_target) 18530d160211SJeremy Fitzhardinge np->rx_min_target = target; 18540d160211SJeremy Fitzhardinge np->rx_max_target = target; 18550d160211SJeremy Fitzhardinge if (target < np->rx_target) 18560d160211SJeremy Fitzhardinge np->rx_target = target; 18570d160211SJeremy Fitzhardinge 18580d160211SJeremy Fitzhardinge xennet_alloc_rx_buffers(netdev); 18590d160211SJeremy Fitzhardinge 18600d160211SJeremy Fitzhardinge spin_unlock_bh(&np->rx_lock); 18610d160211SJeremy Fitzhardinge return len; 18620d160211SJeremy Fitzhardinge } 18630d160211SJeremy Fitzhardinge 18640d160211SJeremy Fitzhardinge static ssize_t show_rxbuf_cur(struct device *dev, 18650d160211SJeremy Fitzhardinge struct device_attribute *attr, char *buf) 18660d160211SJeremy Fitzhardinge { 18670d160211SJeremy Fitzhardinge struct net_device *netdev = to_net_dev(dev); 18680d160211SJeremy Fitzhardinge struct netfront_info *info = netdev_priv(netdev); 18690d160211SJeremy Fitzhardinge 18700d160211SJeremy Fitzhardinge return sprintf(buf, "%u\n", info->rx_target); 18710d160211SJeremy Fitzhardinge } 18720d160211SJeremy Fitzhardinge 18730d160211SJeremy Fitzhardinge static struct device_attribute xennet_attrs[] = { 18740d160211SJeremy Fitzhardinge __ATTR(rxbuf_min, S_IRUGO|S_IWUSR, show_rxbuf_min, store_rxbuf_min), 18750d160211SJeremy Fitzhardinge __ATTR(rxbuf_max, S_IRUGO|S_IWUSR, show_rxbuf_max, store_rxbuf_max), 18760d160211SJeremy Fitzhardinge __ATTR(rxbuf_cur, S_IRUGO, show_rxbuf_cur, NULL), 18770d160211SJeremy Fitzhardinge }; 18780d160211SJeremy Fitzhardinge 18790d160211SJeremy Fitzhardinge static int xennet_sysfs_addif(struct net_device *netdev) 18800d160211SJeremy Fitzhardinge { 18810d160211SJeremy Fitzhardinge int i; 18820d160211SJeremy Fitzhardinge int err; 18830d160211SJeremy Fitzhardinge 18840d160211SJeremy Fitzhardinge for (i = 0; i < ARRAY_SIZE(xennet_attrs); i++) { 18850d160211SJeremy Fitzhardinge err = device_create_file(&netdev->dev, 18860d160211SJeremy Fitzhardinge &xennet_attrs[i]); 18870d160211SJeremy Fitzhardinge if (err) 18880d160211SJeremy Fitzhardinge goto fail; 18890d160211SJeremy Fitzhardinge } 18900d160211SJeremy Fitzhardinge return 0; 18910d160211SJeremy Fitzhardinge 18920d160211SJeremy Fitzhardinge fail: 18930d160211SJeremy Fitzhardinge while (--i >= 0) 18940d160211SJeremy Fitzhardinge device_remove_file(&netdev->dev, &xennet_attrs[i]); 18950d160211SJeremy Fitzhardinge return err; 18960d160211SJeremy Fitzhardinge } 18970d160211SJeremy Fitzhardinge 18980d160211SJeremy Fitzhardinge static void xennet_sysfs_delif(struct net_device *netdev) 18990d160211SJeremy Fitzhardinge { 19000d160211SJeremy Fitzhardinge int i; 19010d160211SJeremy Fitzhardinge 19020d160211SJeremy Fitzhardinge for (i = 0; i < ARRAY_SIZE(xennet_attrs); i++) 19030d160211SJeremy Fitzhardinge device_remove_file(&netdev->dev, &xennet_attrs[i]); 19040d160211SJeremy Fitzhardinge } 19050d160211SJeremy Fitzhardinge 19060d160211SJeremy Fitzhardinge #endif /* CONFIG_SYSFS */ 19070d160211SJeremy Fitzhardinge 190873db144bSJan Beulich static const struct xenbus_device_id netfront_ids[] = { 19090d160211SJeremy Fitzhardinge { "vif" }, 19100d160211SJeremy Fitzhardinge { "" } 19110d160211SJeremy Fitzhardinge }; 19120d160211SJeremy Fitzhardinge 19130d160211SJeremy Fitzhardinge 19140d160211SJeremy Fitzhardinge static int __devexit xennet_remove(struct xenbus_device *dev) 19150d160211SJeremy Fitzhardinge { 19161b713e00SGreg Kroah-Hartman struct netfront_info *info = dev_get_drvdata(&dev->dev); 19170d160211SJeremy Fitzhardinge 19180d160211SJeremy Fitzhardinge dev_dbg(&dev->dev, "%s\n", dev->nodename); 19190d160211SJeremy Fitzhardinge 19200d160211SJeremy Fitzhardinge xennet_disconnect_backend(info); 19210d160211SJeremy Fitzhardinge 19220d160211SJeremy Fitzhardinge xennet_sysfs_delif(info->netdev); 19230d160211SJeremy Fitzhardinge 19246bc96d04SIan Campbell unregister_netdev(info->netdev); 19256bc96d04SIan Campbell 19266bc96d04SIan Campbell del_timer_sync(&info->rx_refill_timer); 19276bc96d04SIan Campbell 1928e00f85beSstephen hemminger free_percpu(info->stats); 1929e00f85beSstephen hemminger 19300d160211SJeremy Fitzhardinge free_netdev(info->netdev); 19310d160211SJeremy Fitzhardinge 19320d160211SJeremy Fitzhardinge return 0; 19330d160211SJeremy Fitzhardinge } 19340d160211SJeremy Fitzhardinge 193573db144bSJan Beulich static DEFINE_XENBUS_DRIVER(netfront, , 19360d160211SJeremy Fitzhardinge .probe = netfront_probe, 19370d160211SJeremy Fitzhardinge .remove = __devexit_p(xennet_remove), 19380d160211SJeremy Fitzhardinge .resume = netfront_resume, 1939f502bf2bSIan Campbell .otherend_changed = netback_changed, 194073db144bSJan Beulich ); 19410d160211SJeremy Fitzhardinge 19420d160211SJeremy Fitzhardinge static int __init netif_init(void) 19430d160211SJeremy Fitzhardinge { 19446e833587SJeremy Fitzhardinge if (!xen_domain()) 19450d160211SJeremy Fitzhardinge return -ENODEV; 19460d160211SJeremy Fitzhardinge 1947e95ae5a4SIgor Mammedov if (xen_hvm_domain() && !xen_platform_pci_unplug) 1948b9136d20SIgor Mammedov return -ENODEV; 1949b9136d20SIgor Mammedov 19500d160211SJeremy Fitzhardinge printk(KERN_INFO "Initialising Xen virtual ethernet driver.\n"); 19510d160211SJeremy Fitzhardinge 1952ffb78a26SAl Viro return xenbus_register_frontend(&netfront_driver); 19530d160211SJeremy Fitzhardinge } 19540d160211SJeremy Fitzhardinge module_init(netif_init); 19550d160211SJeremy Fitzhardinge 19560d160211SJeremy Fitzhardinge 19570d160211SJeremy Fitzhardinge static void __exit netif_exit(void) 19580d160211SJeremy Fitzhardinge { 1959ffb78a26SAl Viro xenbus_unregister_driver(&netfront_driver); 19600d160211SJeremy Fitzhardinge } 19610d160211SJeremy Fitzhardinge module_exit(netif_exit); 19620d160211SJeremy Fitzhardinge 19630d160211SJeremy Fitzhardinge MODULE_DESCRIPTION("Xen virtual network device frontend"); 19640d160211SJeremy Fitzhardinge MODULE_LICENSE("GPL"); 1965d2f0c52bSMark McLoughlin MODULE_ALIAS("xen:vif"); 19664f93f09bSMark McLoughlin MODULE_ALIAS("xennet"); 1967