xref: /openbmc/linux/drivers/net/virtio_net.c (revision 0a888fd1)
1296f96fcSRusty Russell /* A simple network driver using virtio.
2296f96fcSRusty Russell  *
3296f96fcSRusty Russell  * Copyright 2007 Rusty Russell <rusty@rustcorp.com.au> IBM Corporation
4296f96fcSRusty Russell  *
5296f96fcSRusty Russell  * This program is free software; you can redistribute it and/or modify
6296f96fcSRusty Russell  * it under the terms of the GNU General Public License as published by
7296f96fcSRusty Russell  * the Free Software Foundation; either version 2 of the License, or
8296f96fcSRusty Russell  * (at your option) any later version.
9296f96fcSRusty Russell  *
10296f96fcSRusty Russell  * This program is distributed in the hope that it will be useful,
11296f96fcSRusty Russell  * but WITHOUT ANY WARRANTY; without even the implied warranty of
12296f96fcSRusty Russell  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13296f96fcSRusty Russell  * GNU General Public License for more details.
14296f96fcSRusty Russell  *
15296f96fcSRusty Russell  * You should have received a copy of the GNU General Public License
16296f96fcSRusty Russell  * along with this program; if not, write to the Free Software
17296f96fcSRusty Russell  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
18296f96fcSRusty Russell  */
19296f96fcSRusty Russell //#define DEBUG
20296f96fcSRusty Russell #include <linux/netdevice.h>
21296f96fcSRusty Russell #include <linux/etherdevice.h>
22a9ea3fc6SHerbert Xu #include <linux/ethtool.h>
23296f96fcSRusty Russell #include <linux/module.h>
24296f96fcSRusty Russell #include <linux/virtio.h>
25296f96fcSRusty Russell #include <linux/virtio_net.h>
26296f96fcSRusty Russell #include <linux/scatterlist.h>
27296f96fcSRusty Russell 
286c0cd7c0SDor Laor static int napi_weight = 128;
296c0cd7c0SDor Laor module_param(napi_weight, int, 0444);
306c0cd7c0SDor Laor 
3134a48579SRusty Russell static int csum = 1, gso = 1;
3234a48579SRusty Russell module_param(csum, bool, 0444);
3334a48579SRusty Russell module_param(gso, bool, 0444);
3434a48579SRusty Russell 
/* Size of the linear receive buffer: Ethernet header plus payload.
 * FIXME: MTU in config. */
#define MAX_PACKET_LEN (ETH_HLEN + ETH_DATA_LEN)
37296f96fcSRusty Russell 
38296f96fcSRusty Russell struct virtnet_info
39296f96fcSRusty Russell {
40296f96fcSRusty Russell 	struct virtio_device *vdev;
41296f96fcSRusty Russell 	struct virtqueue *rvq, *svq;
42296f96fcSRusty Russell 	struct net_device *dev;
43296f96fcSRusty Russell 	struct napi_struct napi;
44296f96fcSRusty Russell 
4599ffc696SRusty Russell 	/* The skb we couldn't send because buffers were full. */
4699ffc696SRusty Russell 	struct sk_buff *last_xmit_skb;
4799ffc696SRusty Russell 
48363f1514SRusty Russell 	/* If we need to free in a timer, this is it. */
4914c998f0SMark McLoughlin 	struct timer_list xmit_free_timer;
5014c998f0SMark McLoughlin 
51296f96fcSRusty Russell 	/* Number of input buffers, and max we've ever had. */
52296f96fcSRusty Russell 	unsigned int num, max;
53296f96fcSRusty Russell 
5411a3a154SRusty Russell 	/* For cleaning up after transmission. */
5511a3a154SRusty Russell 	struct tasklet_struct tasklet;
56363f1514SRusty Russell 	bool free_in_tasklet;
5711a3a154SRusty Russell 
5897402b96SHerbert Xu 	/* I like... big packets and I cannot lie! */
5997402b96SHerbert Xu 	bool big_packets;
6097402b96SHerbert Xu 
61296f96fcSRusty Russell 	/* Receive & send queues. */
62296f96fcSRusty Russell 	struct sk_buff_head recv;
63296f96fcSRusty Russell 	struct sk_buff_head send;
64fb6813f4SRusty Russell 
65fb6813f4SRusty Russell 	/* Chain pages by the private ptr. */
66fb6813f4SRusty Russell 	struct page *pages;
67296f96fcSRusty Russell };
68296f96fcSRusty Russell 
69296f96fcSRusty Russell static inline struct virtio_net_hdr *skb_vnet_hdr(struct sk_buff *skb)
70296f96fcSRusty Russell {
71296f96fcSRusty Russell 	return (struct virtio_net_hdr *)skb->cb;
72296f96fcSRusty Russell }
73296f96fcSRusty Russell 
74296f96fcSRusty Russell static inline void vnet_hdr_to_sg(struct scatterlist *sg, struct sk_buff *skb)
75296f96fcSRusty Russell {
76296f96fcSRusty Russell 	sg_init_one(sg, skb_vnet_hdr(skb), sizeof(struct virtio_net_hdr));
77296f96fcSRusty Russell }
78296f96fcSRusty Russell 
79fb6813f4SRusty Russell static void give_a_page(struct virtnet_info *vi, struct page *page)
80fb6813f4SRusty Russell {
81fb6813f4SRusty Russell 	page->private = (unsigned long)vi->pages;
82fb6813f4SRusty Russell 	vi->pages = page;
83fb6813f4SRusty Russell }
84fb6813f4SRusty Russell 
850a888fd1SMark McLoughlin static void trim_pages(struct virtnet_info *vi, struct sk_buff *skb)
860a888fd1SMark McLoughlin {
870a888fd1SMark McLoughlin 	unsigned int i;
880a888fd1SMark McLoughlin 
890a888fd1SMark McLoughlin 	for (i = 0; i < skb_shinfo(skb)->nr_frags; i++)
900a888fd1SMark McLoughlin 		give_a_page(vi, skb_shinfo(skb)->frags[i].page);
910a888fd1SMark McLoughlin 	skb_shinfo(skb)->nr_frags = 0;
920a888fd1SMark McLoughlin 	skb->data_len = 0;
930a888fd1SMark McLoughlin }
940a888fd1SMark McLoughlin 
95fb6813f4SRusty Russell static struct page *get_a_page(struct virtnet_info *vi, gfp_t gfp_mask)
96fb6813f4SRusty Russell {
97fb6813f4SRusty Russell 	struct page *p = vi->pages;
98fb6813f4SRusty Russell 
99fb6813f4SRusty Russell 	if (p)
100fb6813f4SRusty Russell 		vi->pages = (struct page *)p->private;
101fb6813f4SRusty Russell 	else
102fb6813f4SRusty Russell 		p = alloc_page(gfp_mask);
103fb6813f4SRusty Russell 	return p;
104fb6813f4SRusty Russell }
105fb6813f4SRusty Russell 
1062cb9c6baSRusty Russell static void skb_xmit_done(struct virtqueue *svq)
107296f96fcSRusty Russell {
1082cb9c6baSRusty Russell 	struct virtnet_info *vi = svq->vdev->priv;
109296f96fcSRusty Russell 
1102cb9c6baSRusty Russell 	/* Suppress further interrupts. */
1112cb9c6baSRusty Russell 	svq->vq_ops->disable_cb(svq);
11211a3a154SRusty Russell 
113363f1514SRusty Russell 	/* We were probably waiting for more output buffers. */
114296f96fcSRusty Russell 	netif_wake_queue(vi->dev);
11511a3a154SRusty Russell 
11611a3a154SRusty Russell 	/* Make sure we re-xmit last_xmit_skb: if there are no more packets
11711a3a154SRusty Russell 	 * queued, start_xmit won't be called. */
11811a3a154SRusty Russell 	tasklet_schedule(&vi->tasklet);
119296f96fcSRusty Russell }
120296f96fcSRusty Russell 
121296f96fcSRusty Russell static void receive_skb(struct net_device *dev, struct sk_buff *skb,
122296f96fcSRusty Russell 			unsigned len)
123296f96fcSRusty Russell {
124296f96fcSRusty Russell 	struct virtio_net_hdr *hdr = skb_vnet_hdr(skb);
12597402b96SHerbert Xu 	int err;
126296f96fcSRusty Russell 
127296f96fcSRusty Russell 	if (unlikely(len < sizeof(struct virtio_net_hdr) + ETH_HLEN)) {
128296f96fcSRusty Russell 		pr_debug("%s: short packet %i\n", dev->name, len);
129296f96fcSRusty Russell 		dev->stats.rx_length_errors++;
130296f96fcSRusty Russell 		goto drop;
131296f96fcSRusty Russell 	}
132296f96fcSRusty Russell 	len -= sizeof(struct virtio_net_hdr);
133296f96fcSRusty Russell 
1340a888fd1SMark McLoughlin 	if (len <= MAX_PACKET_LEN)
1350a888fd1SMark McLoughlin 		trim_pages(netdev_priv(dev), skb);
136fb6813f4SRusty Russell 
13797402b96SHerbert Xu 	err = pskb_trim(skb, len);
13897402b96SHerbert Xu 	if (err) {
13997402b96SHerbert Xu 		pr_debug("%s: pskb_trim failed %i %d\n", dev->name, len, err);
14097402b96SHerbert Xu 		dev->stats.rx_dropped++;
14197402b96SHerbert Xu 		goto drop;
14297402b96SHerbert Xu 	}
14397402b96SHerbert Xu 	skb->truesize += skb->data_len;
144296f96fcSRusty Russell 	dev->stats.rx_bytes += skb->len;
145296f96fcSRusty Russell 	dev->stats.rx_packets++;
146296f96fcSRusty Russell 
147296f96fcSRusty Russell 	if (hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) {
148296f96fcSRusty Russell 		pr_debug("Needs csum!\n");
149f35d9d8aSRusty Russell 		if (!skb_partial_csum_set(skb,hdr->csum_start,hdr->csum_offset))
150296f96fcSRusty Russell 			goto frame_err;
151296f96fcSRusty Russell 	}
152296f96fcSRusty Russell 
15323cde76dSMark McLoughlin 	skb->protocol = eth_type_trans(skb, dev);
15423cde76dSMark McLoughlin 	pr_debug("Receiving skb proto 0x%04x len %i type %i\n",
15523cde76dSMark McLoughlin 		 ntohs(skb->protocol), skb->len, skb->pkt_type);
15623cde76dSMark McLoughlin 
157296f96fcSRusty Russell 	if (hdr->gso_type != VIRTIO_NET_HDR_GSO_NONE) {
158296f96fcSRusty Russell 		pr_debug("GSO!\n");
15934a48579SRusty Russell 		switch (hdr->gso_type & ~VIRTIO_NET_HDR_GSO_ECN) {
160296f96fcSRusty Russell 		case VIRTIO_NET_HDR_GSO_TCPV4:
161296f96fcSRusty Russell 			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
162296f96fcSRusty Russell 			break;
163296f96fcSRusty Russell 		case VIRTIO_NET_HDR_GSO_UDP:
164296f96fcSRusty Russell 			skb_shinfo(skb)->gso_type = SKB_GSO_UDP;
165296f96fcSRusty Russell 			break;
166296f96fcSRusty Russell 		case VIRTIO_NET_HDR_GSO_TCPV6:
167296f96fcSRusty Russell 			skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
168296f96fcSRusty Russell 			break;
169296f96fcSRusty Russell 		default:
170296f96fcSRusty Russell 			if (net_ratelimit())
171296f96fcSRusty Russell 				printk(KERN_WARNING "%s: bad gso type %u.\n",
172296f96fcSRusty Russell 				       dev->name, hdr->gso_type);
173296f96fcSRusty Russell 			goto frame_err;
174296f96fcSRusty Russell 		}
175296f96fcSRusty Russell 
17634a48579SRusty Russell 		if (hdr->gso_type & VIRTIO_NET_HDR_GSO_ECN)
17734a48579SRusty Russell 			skb_shinfo(skb)->gso_type |= SKB_GSO_TCP_ECN;
17834a48579SRusty Russell 
179296f96fcSRusty Russell 		skb_shinfo(skb)->gso_size = hdr->gso_size;
180296f96fcSRusty Russell 		if (skb_shinfo(skb)->gso_size == 0) {
181296f96fcSRusty Russell 			if (net_ratelimit())
182296f96fcSRusty Russell 				printk(KERN_WARNING "%s: zero gso size.\n",
183296f96fcSRusty Russell 				       dev->name);
184296f96fcSRusty Russell 			goto frame_err;
185296f96fcSRusty Russell 		}
186296f96fcSRusty Russell 
187296f96fcSRusty Russell 		/* Header must be checked, and gso_segs computed. */
188296f96fcSRusty Russell 		skb_shinfo(skb)->gso_type |= SKB_GSO_DODGY;
189296f96fcSRusty Russell 		skb_shinfo(skb)->gso_segs = 0;
190296f96fcSRusty Russell 	}
191296f96fcSRusty Russell 
192296f96fcSRusty Russell 	netif_receive_skb(skb);
193296f96fcSRusty Russell 	return;
194296f96fcSRusty Russell 
195296f96fcSRusty Russell frame_err:
196296f96fcSRusty Russell 	dev->stats.rx_frame_errors++;
197296f96fcSRusty Russell drop:
198296f96fcSRusty Russell 	dev_kfree_skb(skb);
199296f96fcSRusty Russell }
200296f96fcSRusty Russell 
201296f96fcSRusty Russell static void try_fill_recv(struct virtnet_info *vi)
202296f96fcSRusty Russell {
203296f96fcSRusty Russell 	struct sk_buff *skb;
20405271685SRusty Russell 	struct scatterlist sg[2+MAX_SKB_FRAGS];
20597402b96SHerbert Xu 	int num, err, i;
206296f96fcSRusty Russell 
20705271685SRusty Russell 	sg_init_table(sg, 2+MAX_SKB_FRAGS);
208296f96fcSRusty Russell 	for (;;) {
209296f96fcSRusty Russell 		skb = netdev_alloc_skb(vi->dev, MAX_PACKET_LEN);
210296f96fcSRusty Russell 		if (unlikely(!skb))
211296f96fcSRusty Russell 			break;
212296f96fcSRusty Russell 
213296f96fcSRusty Russell 		skb_put(skb, MAX_PACKET_LEN);
214296f96fcSRusty Russell 		vnet_hdr_to_sg(sg, skb);
21597402b96SHerbert Xu 
21697402b96SHerbert Xu 		if (vi->big_packets) {
21797402b96SHerbert Xu 			for (i = 0; i < MAX_SKB_FRAGS; i++) {
21897402b96SHerbert Xu 				skb_frag_t *f = &skb_shinfo(skb)->frags[i];
219fb6813f4SRusty Russell 				f->page = get_a_page(vi, GFP_ATOMIC);
22097402b96SHerbert Xu 				if (!f->page)
22197402b96SHerbert Xu 					break;
22297402b96SHerbert Xu 
22397402b96SHerbert Xu 				f->page_offset = 0;
22497402b96SHerbert Xu 				f->size = PAGE_SIZE;
22597402b96SHerbert Xu 
22697402b96SHerbert Xu 				skb->data_len += PAGE_SIZE;
22797402b96SHerbert Xu 				skb->len += PAGE_SIZE;
22897402b96SHerbert Xu 
22997402b96SHerbert Xu 				skb_shinfo(skb)->nr_frags++;
23097402b96SHerbert Xu 			}
23197402b96SHerbert Xu 		}
23297402b96SHerbert Xu 
233296f96fcSRusty Russell 		num = skb_to_sgvec(skb, sg+1, 0, skb->len) + 1;
234296f96fcSRusty Russell 		skb_queue_head(&vi->recv, skb);
235296f96fcSRusty Russell 
236296f96fcSRusty Russell 		err = vi->rvq->vq_ops->add_buf(vi->rvq, sg, 0, num, skb);
237296f96fcSRusty Russell 		if (err) {
238296f96fcSRusty Russell 			skb_unlink(skb, &vi->recv);
2390a888fd1SMark McLoughlin 			trim_pages(vi, skb);
240296f96fcSRusty Russell 			kfree_skb(skb);
241296f96fcSRusty Russell 			break;
242296f96fcSRusty Russell 		}
243296f96fcSRusty Russell 		vi->num++;
244296f96fcSRusty Russell 	}
245296f96fcSRusty Russell 	if (unlikely(vi->num > vi->max))
246296f96fcSRusty Russell 		vi->max = vi->num;
247296f96fcSRusty Russell 	vi->rvq->vq_ops->kick(vi->rvq);
248296f96fcSRusty Russell }
249296f96fcSRusty Russell 
25018445c4dSRusty Russell static void skb_recv_done(struct virtqueue *rvq)
251296f96fcSRusty Russell {
252296f96fcSRusty Russell 	struct virtnet_info *vi = rvq->vdev->priv;
25318445c4dSRusty Russell 	/* Schedule NAPI, Suppress further interrupts if successful. */
25418445c4dSRusty Russell 	if (netif_rx_schedule_prep(vi->dev, &vi->napi)) {
25518445c4dSRusty Russell 		rvq->vq_ops->disable_cb(rvq);
25618445c4dSRusty Russell 		__netif_rx_schedule(vi->dev, &vi->napi);
25718445c4dSRusty Russell 	}
258296f96fcSRusty Russell }
259296f96fcSRusty Russell 
260296f96fcSRusty Russell static int virtnet_poll(struct napi_struct *napi, int budget)
261296f96fcSRusty Russell {
262296f96fcSRusty Russell 	struct virtnet_info *vi = container_of(napi, struct virtnet_info, napi);
263296f96fcSRusty Russell 	struct sk_buff *skb = NULL;
264296f96fcSRusty Russell 	unsigned int len, received = 0;
265296f96fcSRusty Russell 
266296f96fcSRusty Russell again:
267296f96fcSRusty Russell 	while (received < budget &&
268296f96fcSRusty Russell 	       (skb = vi->rvq->vq_ops->get_buf(vi->rvq, &len)) != NULL) {
269296f96fcSRusty Russell 		__skb_unlink(skb, &vi->recv);
270296f96fcSRusty Russell 		receive_skb(vi->dev, skb, len);
271296f96fcSRusty Russell 		vi->num--;
272296f96fcSRusty Russell 		received++;
273296f96fcSRusty Russell 	}
274296f96fcSRusty Russell 
275296f96fcSRusty Russell 	/* FIXME: If we oom and completely run out of inbufs, we need
276296f96fcSRusty Russell 	 * to start a timer trying to fill more. */
277296f96fcSRusty Russell 	if (vi->num < vi->max / 2)
278296f96fcSRusty Russell 		try_fill_recv(vi);
279296f96fcSRusty Russell 
2808329d98eSRusty Russell 	/* Out of packets? */
2818329d98eSRusty Russell 	if (received < budget) {
282296f96fcSRusty Russell 		netif_rx_complete(vi->dev, napi);
28318445c4dSRusty Russell 		if (unlikely(!vi->rvq->vq_ops->enable_cb(vi->rvq))
2844265f161SChristian Borntraeger 		    && napi_schedule_prep(napi)) {
2854265f161SChristian Borntraeger 			vi->rvq->vq_ops->disable_cb(vi->rvq);
2864265f161SChristian Borntraeger 			__netif_rx_schedule(vi->dev, napi);
287296f96fcSRusty Russell 			goto again;
288296f96fcSRusty Russell 		}
2894265f161SChristian Borntraeger 	}
290296f96fcSRusty Russell 
291296f96fcSRusty Russell 	return received;
292296f96fcSRusty Russell }
293296f96fcSRusty Russell 
294296f96fcSRusty Russell static void free_old_xmit_skbs(struct virtnet_info *vi)
295296f96fcSRusty Russell {
296296f96fcSRusty Russell 	struct sk_buff *skb;
297296f96fcSRusty Russell 	unsigned int len;
298296f96fcSRusty Russell 
299296f96fcSRusty Russell 	while ((skb = vi->svq->vq_ops->get_buf(vi->svq, &len)) != NULL) {
300296f96fcSRusty Russell 		pr_debug("Sent skb %p\n", skb);
301296f96fcSRusty Russell 		__skb_unlink(skb, &vi->send);
302655aa31fSRusty Russell 		vi->dev->stats.tx_bytes += skb->len;
303296f96fcSRusty Russell 		vi->dev->stats.tx_packets++;
304296f96fcSRusty Russell 		kfree_skb(skb);
305296f96fcSRusty Russell 	}
306296f96fcSRusty Russell }
307296f96fcSRusty Russell 
308363f1514SRusty Russell /* If the virtio transport doesn't always notify us when all in-flight packets
309363f1514SRusty Russell  * are consumed, we fall back to using this function on a timer to free them. */
31014c998f0SMark McLoughlin static void xmit_free(unsigned long data)
31114c998f0SMark McLoughlin {
31214c998f0SMark McLoughlin 	struct virtnet_info *vi = (void *)data;
31314c998f0SMark McLoughlin 
31414c998f0SMark McLoughlin 	netif_tx_lock(vi->dev);
31514c998f0SMark McLoughlin 
31614c998f0SMark McLoughlin 	free_old_xmit_skbs(vi);
31714c998f0SMark McLoughlin 
31814c998f0SMark McLoughlin 	if (!skb_queue_empty(&vi->send))
31914c998f0SMark McLoughlin 		mod_timer(&vi->xmit_free_timer, jiffies + (HZ/10));
32014c998f0SMark McLoughlin 
32114c998f0SMark McLoughlin 	netif_tx_unlock(vi->dev);
32214c998f0SMark McLoughlin }
32314c998f0SMark McLoughlin 
32499ffc696SRusty Russell static int xmit_skb(struct virtnet_info *vi, struct sk_buff *skb)
325296f96fcSRusty Russell {
32614c998f0SMark McLoughlin 	int num, err;
32705271685SRusty Russell 	struct scatterlist sg[2+MAX_SKB_FRAGS];
328296f96fcSRusty Russell 	struct virtio_net_hdr *hdr;
329296f96fcSRusty Russell 	const unsigned char *dest = ((struct ethhdr *)skb->data)->h_dest;
330296f96fcSRusty Russell 
33105271685SRusty Russell 	sg_init_table(sg, 2+MAX_SKB_FRAGS);
3324d125de3SRusty Russell 
333e174961cSJohannes Berg 	pr_debug("%s: xmit %p %pM\n", vi->dev->name, skb, dest);
334296f96fcSRusty Russell 
335296f96fcSRusty Russell 	/* Encode metadata header at front. */
336296f96fcSRusty Russell 	hdr = skb_vnet_hdr(skb);
337296f96fcSRusty Russell 	if (skb->ip_summed == CHECKSUM_PARTIAL) {
338296f96fcSRusty Russell 		hdr->flags = VIRTIO_NET_HDR_F_NEEDS_CSUM;
339296f96fcSRusty Russell 		hdr->csum_start = skb->csum_start - skb_headroom(skb);
340296f96fcSRusty Russell 		hdr->csum_offset = skb->csum_offset;
341296f96fcSRusty Russell 	} else {
342296f96fcSRusty Russell 		hdr->flags = 0;
343296f96fcSRusty Russell 		hdr->csum_offset = hdr->csum_start = 0;
344296f96fcSRusty Russell 	}
345296f96fcSRusty Russell 
346296f96fcSRusty Russell 	if (skb_is_gso(skb)) {
34750c8ea80SRusty Russell 		hdr->hdr_len = skb_transport_header(skb) - skb->data;
348296f96fcSRusty Russell 		hdr->gso_size = skb_shinfo(skb)->gso_size;
34934a48579SRusty Russell 		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV4)
350296f96fcSRusty Russell 			hdr->gso_type = VIRTIO_NET_HDR_GSO_TCPV4;
351296f96fcSRusty Russell 		else if (skb_shinfo(skb)->gso_type & SKB_GSO_TCPV6)
352296f96fcSRusty Russell 			hdr->gso_type = VIRTIO_NET_HDR_GSO_TCPV6;
353296f96fcSRusty Russell 		else if (skb_shinfo(skb)->gso_type & SKB_GSO_UDP)
354296f96fcSRusty Russell 			hdr->gso_type = VIRTIO_NET_HDR_GSO_UDP;
355296f96fcSRusty Russell 		else
356296f96fcSRusty Russell 			BUG();
35734a48579SRusty Russell 		if (skb_shinfo(skb)->gso_type & SKB_GSO_TCP_ECN)
35834a48579SRusty Russell 			hdr->gso_type |= VIRTIO_NET_HDR_GSO_ECN;
359296f96fcSRusty Russell 	} else {
360296f96fcSRusty Russell 		hdr->gso_type = VIRTIO_NET_HDR_GSO_NONE;
36150c8ea80SRusty Russell 		hdr->gso_size = hdr->hdr_len = 0;
362296f96fcSRusty Russell 	}
363296f96fcSRusty Russell 
364296f96fcSRusty Russell 	vnet_hdr_to_sg(sg, skb);
365296f96fcSRusty Russell 	num = skb_to_sgvec(skb, sg+1, 0, skb->len) + 1;
36699ffc696SRusty Russell 
36714c998f0SMark McLoughlin 	err = vi->svq->vq_ops->add_buf(vi->svq, sg, num, 0, skb);
368363f1514SRusty Russell 	if (!err && !vi->free_in_tasklet)
36914c998f0SMark McLoughlin 		mod_timer(&vi->xmit_free_timer, jiffies + (HZ/10));
37014c998f0SMark McLoughlin 
37114c998f0SMark McLoughlin 	return err;
37299ffc696SRusty Russell }
37399ffc696SRusty Russell 
37411a3a154SRusty Russell static void xmit_tasklet(unsigned long data)
37511a3a154SRusty Russell {
37611a3a154SRusty Russell 	struct virtnet_info *vi = (void *)data;
37711a3a154SRusty Russell 
37811a3a154SRusty Russell 	netif_tx_lock_bh(vi->dev);
37911a3a154SRusty Russell 	if (vi->last_xmit_skb && xmit_skb(vi, vi->last_xmit_skb) == 0) {
38011a3a154SRusty Russell 		vi->svq->vq_ops->kick(vi->svq);
38111a3a154SRusty Russell 		vi->last_xmit_skb = NULL;
38211a3a154SRusty Russell 	}
383363f1514SRusty Russell 	if (vi->free_in_tasklet)
384363f1514SRusty Russell 		free_old_xmit_skbs(vi);
38511a3a154SRusty Russell 	netif_tx_unlock_bh(vi->dev);
38611a3a154SRusty Russell }
38711a3a154SRusty Russell 
38899ffc696SRusty Russell static int start_xmit(struct sk_buff *skb, struct net_device *dev)
38999ffc696SRusty Russell {
39099ffc696SRusty Russell 	struct virtnet_info *vi = netdev_priv(dev);
3912cb9c6baSRusty Russell 
3922cb9c6baSRusty Russell again:
3932cb9c6baSRusty Russell 	/* Free up any pending old buffers before queueing new ones. */
3942cb9c6baSRusty Russell 	free_old_xmit_skbs(vi);
39599ffc696SRusty Russell 
39699ffc696SRusty Russell 	/* If we has a buffer left over from last time, send it now. */
3979953ca6cSMark McLoughlin 	if (unlikely(vi->last_xmit_skb) &&
3989953ca6cSMark McLoughlin 	    xmit_skb(vi, vi->last_xmit_skb) != 0)
39999ffc696SRusty Russell 		goto stop_queue;
4009953ca6cSMark McLoughlin 
40199ffc696SRusty Russell 	vi->last_xmit_skb = NULL;
40299ffc696SRusty Russell 
40399ffc696SRusty Russell 	/* Put new one in send queue and do transmit */
4047eb2e251SRusty Russell 	if (likely(skb)) {
40599ffc696SRusty Russell 		__skb_queue_head(&vi->send, skb);
40699ffc696SRusty Russell 		if (xmit_skb(vi, skb) != 0) {
40799ffc696SRusty Russell 			vi->last_xmit_skb = skb;
4087eb2e251SRusty Russell 			skb = NULL;
40999ffc696SRusty Russell 			goto stop_queue;
41099ffc696SRusty Russell 		}
4117eb2e251SRusty Russell 	}
41299ffc696SRusty Russell done:
41399ffc696SRusty Russell 	vi->svq->vq_ops->kick(vi->svq);
41499ffc696SRusty Russell 	return NETDEV_TX_OK;
41599ffc696SRusty Russell 
41699ffc696SRusty Russell stop_queue:
417296f96fcSRusty Russell 	pr_debug("%s: virtio not prepared to send\n", dev->name);
418296f96fcSRusty Russell 	netif_stop_queue(dev);
4192cb9c6baSRusty Russell 
4204265f161SChristian Borntraeger 	/* Activate callback for using skbs: if this returns false it
4212cb9c6baSRusty Russell 	 * means some were used in the meantime. */
4222cb9c6baSRusty Russell 	if (unlikely(!vi->svq->vq_ops->enable_cb(vi->svq))) {
4234265f161SChristian Borntraeger 		vi->svq->vq_ops->disable_cb(vi->svq);
4242cb9c6baSRusty Russell 		netif_start_queue(dev);
4252cb9c6baSRusty Russell 		goto again;
4262cb9c6baSRusty Russell 	}
4279953ca6cSMark McLoughlin 	if (skb) {
4289953ca6cSMark McLoughlin 		/* Drop this skb: we only queue one. */
4299953ca6cSMark McLoughlin 		vi->dev->stats.tx_dropped++;
4309953ca6cSMark McLoughlin 		kfree_skb(skb);
4319953ca6cSMark McLoughlin 	}
43299ffc696SRusty Russell 	goto done;
433296f96fcSRusty Russell }
434296f96fcSRusty Russell 
#ifdef CONFIG_NET_POLL_CONTROLLER
/* poll_controller hook: simply schedule the NAPI poll. */
static void virtnet_netpoll(struct net_device *dev)
{
	struct virtnet_info *priv = netdev_priv(dev);
	struct napi_struct *napi = &priv->napi;

	napi_schedule(napi);
}
#endif
443da74e89dSAmit Shah 
444296f96fcSRusty Russell static int virtnet_open(struct net_device *dev)
445296f96fcSRusty Russell {
446296f96fcSRusty Russell 	struct virtnet_info *vi = netdev_priv(dev);
447296f96fcSRusty Russell 
448296f96fcSRusty Russell 	napi_enable(&vi->napi);
449a48bd8f6SRusty Russell 
450a48bd8f6SRusty Russell 	/* If all buffers were filled by other side before we napi_enabled, we
451a48bd8f6SRusty Russell 	 * won't get another interrupt, so process any outstanding packets
452370076d9SChristian Borntraeger 	 * now.  virtnet_poll wants re-enable the queue, so we disable here.
453370076d9SChristian Borntraeger 	 * We synchronize against interrupts via NAPI_STATE_SCHED */
454370076d9SChristian Borntraeger 	if (netif_rx_schedule_prep(dev, &vi->napi)) {
455a48bd8f6SRusty Russell 		vi->rvq->vq_ops->disable_cb(vi->rvq);
456370076d9SChristian Borntraeger 		__netif_rx_schedule(dev, &vi->napi);
457370076d9SChristian Borntraeger 	}
458296f96fcSRusty Russell 	return 0;
459296f96fcSRusty Russell }
460296f96fcSRusty Russell 
461296f96fcSRusty Russell static int virtnet_close(struct net_device *dev)
462296f96fcSRusty Russell {
463296f96fcSRusty Russell 	struct virtnet_info *vi = netdev_priv(dev);
464296f96fcSRusty Russell 
465296f96fcSRusty Russell 	napi_disable(&vi->napi);
466296f96fcSRusty Russell 
467296f96fcSRusty Russell 	return 0;
468296f96fcSRusty Russell }
469296f96fcSRusty Russell 
470a9ea3fc6SHerbert Xu static int virtnet_set_tx_csum(struct net_device *dev, u32 data)
471a9ea3fc6SHerbert Xu {
472a9ea3fc6SHerbert Xu 	struct virtnet_info *vi = netdev_priv(dev);
473a9ea3fc6SHerbert Xu 	struct virtio_device *vdev = vi->vdev;
474a9ea3fc6SHerbert Xu 
475a9ea3fc6SHerbert Xu 	if (data && !virtio_has_feature(vdev, VIRTIO_NET_F_CSUM))
476a9ea3fc6SHerbert Xu 		return -ENOSYS;
477a9ea3fc6SHerbert Xu 
478a9ea3fc6SHerbert Xu 	return ethtool_op_set_tx_hw_csum(dev, data);
479a9ea3fc6SHerbert Xu }
480a9ea3fc6SHerbert Xu 
481a9ea3fc6SHerbert Xu static struct ethtool_ops virtnet_ethtool_ops = {
482a9ea3fc6SHerbert Xu 	.set_tx_csum = virtnet_set_tx_csum,
483a9ea3fc6SHerbert Xu 	.set_sg = ethtool_op_set_sg,
484a9ea3fc6SHerbert Xu };
485a9ea3fc6SHerbert Xu 
486296f96fcSRusty Russell static int virtnet_probe(struct virtio_device *vdev)
487296f96fcSRusty Russell {
488296f96fcSRusty Russell 	int err;
489296f96fcSRusty Russell 	struct net_device *dev;
490296f96fcSRusty Russell 	struct virtnet_info *vi;
491296f96fcSRusty Russell 
492296f96fcSRusty Russell 	/* Allocate ourselves a network device with room for our info */
493296f96fcSRusty Russell 	dev = alloc_etherdev(sizeof(struct virtnet_info));
494296f96fcSRusty Russell 	if (!dev)
495296f96fcSRusty Russell 		return -ENOMEM;
496296f96fcSRusty Russell 
497296f96fcSRusty Russell 	/* Set up network device as normal. */
498296f96fcSRusty Russell 	dev->open = virtnet_open;
499296f96fcSRusty Russell 	dev->stop = virtnet_close;
500296f96fcSRusty Russell 	dev->hard_start_xmit = start_xmit;
501296f96fcSRusty Russell 	dev->features = NETIF_F_HIGHDMA;
502da74e89dSAmit Shah #ifdef CONFIG_NET_POLL_CONTROLLER
503da74e89dSAmit Shah 	dev->poll_controller = virtnet_netpoll;
504da74e89dSAmit Shah #endif
505a9ea3fc6SHerbert Xu 	SET_ETHTOOL_OPS(dev, &virtnet_ethtool_ops);
506296f96fcSRusty Russell 	SET_NETDEV_DEV(dev, &vdev->dev);
507296f96fcSRusty Russell 
508296f96fcSRusty Russell 	/* Do we support "hardware" checksums? */
509c45a6816SRusty Russell 	if (csum && virtio_has_feature(vdev, VIRTIO_NET_F_CSUM)) {
510296f96fcSRusty Russell 		/* This opens up the world of extra features. */
511296f96fcSRusty Russell 		dev->features |= NETIF_F_HW_CSUM|NETIF_F_SG|NETIF_F_FRAGLIST;
512c45a6816SRusty Russell 		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_GSO)) {
51334a48579SRusty Russell 			dev->features |= NETIF_F_TSO | NETIF_F_UFO
51434a48579SRusty Russell 				| NETIF_F_TSO_ECN | NETIF_F_TSO6;
51534a48579SRusty Russell 		}
5165539ae96SRusty Russell 		/* Individual feature bits: what can host handle? */
517c45a6816SRusty Russell 		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO4))
5185539ae96SRusty Russell 			dev->features |= NETIF_F_TSO;
519c45a6816SRusty Russell 		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_HOST_TSO6))
5205539ae96SRusty Russell 			dev->features |= NETIF_F_TSO6;
521c45a6816SRusty Russell 		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_HOST_ECN))
5225539ae96SRusty Russell 			dev->features |= NETIF_F_TSO_ECN;
523c45a6816SRusty Russell 		if (gso && virtio_has_feature(vdev, VIRTIO_NET_F_HOST_UFO))
5245539ae96SRusty Russell 			dev->features |= NETIF_F_UFO;
525296f96fcSRusty Russell 	}
526296f96fcSRusty Russell 
527296f96fcSRusty Russell 	/* Configuration may specify what MAC to use.  Otherwise random. */
528c45a6816SRusty Russell 	if (virtio_has_feature(vdev, VIRTIO_NET_F_MAC)) {
529a586d4f6SRusty Russell 		vdev->config->get(vdev,
530a586d4f6SRusty Russell 				  offsetof(struct virtio_net_config, mac),
531a586d4f6SRusty Russell 				  dev->dev_addr, dev->addr_len);
532296f96fcSRusty Russell 	} else
533296f96fcSRusty Russell 		random_ether_addr(dev->dev_addr);
534296f96fcSRusty Russell 
535296f96fcSRusty Russell 	/* Set up our device-specific information */
536296f96fcSRusty Russell 	vi = netdev_priv(dev);
5376c0cd7c0SDor Laor 	netif_napi_add(dev, &vi->napi, virtnet_poll, napi_weight);
538296f96fcSRusty Russell 	vi->dev = dev;
539296f96fcSRusty Russell 	vi->vdev = vdev;
540d9d5dcc8SChristian Borntraeger 	vdev->priv = vi;
541fb6813f4SRusty Russell 	vi->pages = NULL;
542296f96fcSRusty Russell 
543363f1514SRusty Russell 	/* If they give us a callback when all buffers are done, we don't need
544363f1514SRusty Russell 	 * the timer. */
545363f1514SRusty Russell 	vi->free_in_tasklet = virtio_has_feature(vdev,VIRTIO_F_NOTIFY_ON_EMPTY);
546363f1514SRusty Russell 
54797402b96SHerbert Xu 	/* If we can receive ANY GSO packets, we must allocate large ones. */
54897402b96SHerbert Xu 	if (virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO4)
54997402b96SHerbert Xu 	    || virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_TSO6)
55097402b96SHerbert Xu 	    || virtio_has_feature(vdev, VIRTIO_NET_F_GUEST_ECN))
55197402b96SHerbert Xu 		vi->big_packets = true;
55297402b96SHerbert Xu 
553296f96fcSRusty Russell 	/* We expect two virtqueues, receive then send. */
554a586d4f6SRusty Russell 	vi->rvq = vdev->config->find_vq(vdev, 0, skb_recv_done);
555296f96fcSRusty Russell 	if (IS_ERR(vi->rvq)) {
556296f96fcSRusty Russell 		err = PTR_ERR(vi->rvq);
557296f96fcSRusty Russell 		goto free;
558296f96fcSRusty Russell 	}
559296f96fcSRusty Russell 
560a586d4f6SRusty Russell 	vi->svq = vdev->config->find_vq(vdev, 1, skb_xmit_done);
561296f96fcSRusty Russell 	if (IS_ERR(vi->svq)) {
562296f96fcSRusty Russell 		err = PTR_ERR(vi->svq);
563296f96fcSRusty Russell 		goto free_recv;
564296f96fcSRusty Russell 	}
565296f96fcSRusty Russell 
566296f96fcSRusty Russell 	/* Initialize our empty receive and send queues. */
567296f96fcSRusty Russell 	skb_queue_head_init(&vi->recv);
568296f96fcSRusty Russell 	skb_queue_head_init(&vi->send);
569296f96fcSRusty Russell 
57011a3a154SRusty Russell 	tasklet_init(&vi->tasklet, xmit_tasklet, (unsigned long)vi);
57111a3a154SRusty Russell 
572363f1514SRusty Russell 	if (!vi->free_in_tasklet)
57314c998f0SMark McLoughlin 		setup_timer(&vi->xmit_free_timer, xmit_free, (unsigned long)vi);
57414c998f0SMark McLoughlin 
575296f96fcSRusty Russell 	err = register_netdev(dev);
576296f96fcSRusty Russell 	if (err) {
577296f96fcSRusty Russell 		pr_debug("virtio_net: registering device failed\n");
578296f96fcSRusty Russell 		goto free_send;
579296f96fcSRusty Russell 	}
580b3369c1fSRusty Russell 
581b3369c1fSRusty Russell 	/* Last of all, set up some receive buffers. */
582b3369c1fSRusty Russell 	try_fill_recv(vi);
583b3369c1fSRusty Russell 
584b3369c1fSRusty Russell 	/* If we didn't even get one input buffer, we're useless. */
585b3369c1fSRusty Russell 	if (vi->num == 0) {
586b3369c1fSRusty Russell 		err = -ENOMEM;
587b3369c1fSRusty Russell 		goto unregister;
588b3369c1fSRusty Russell 	}
589b3369c1fSRusty Russell 
590296f96fcSRusty Russell 	pr_debug("virtnet: registered device %s\n", dev->name);
591296f96fcSRusty Russell 	return 0;
592296f96fcSRusty Russell 
593b3369c1fSRusty Russell unregister:
594b3369c1fSRusty Russell 	unregister_netdev(dev);
595296f96fcSRusty Russell free_send:
596296f96fcSRusty Russell 	vdev->config->del_vq(vi->svq);
597296f96fcSRusty Russell free_recv:
598296f96fcSRusty Russell 	vdev->config->del_vq(vi->rvq);
599296f96fcSRusty Russell free:
600296f96fcSRusty Russell 	free_netdev(dev);
601296f96fcSRusty Russell 	return err;
602296f96fcSRusty Russell }
603296f96fcSRusty Russell 
604296f96fcSRusty Russell static void virtnet_remove(struct virtio_device *vdev)
605296f96fcSRusty Russell {
60674b2553fSRusty Russell 	struct virtnet_info *vi = vdev->priv;
607b3369c1fSRusty Russell 	struct sk_buff *skb;
608b3369c1fSRusty Russell 
6096e5aa7efSRusty Russell 	/* Stop all the virtqueues. */
6106e5aa7efSRusty Russell 	vdev->config->reset(vdev);
6116e5aa7efSRusty Russell 
612363f1514SRusty Russell 	if (!vi->free_in_tasklet)
61314c998f0SMark McLoughlin 		del_timer_sync(&vi->xmit_free_timer);
61414c998f0SMark McLoughlin 
615b3369c1fSRusty Russell 	/* Free our skbs in send and recv queues, if any. */
616b3369c1fSRusty Russell 	while ((skb = __skb_dequeue(&vi->recv)) != NULL) {
617b3369c1fSRusty Russell 		kfree_skb(skb);
618b3369c1fSRusty Russell 		vi->num--;
619b3369c1fSRusty Russell 	}
620288369ccSWang Chen 	__skb_queue_purge(&vi->send);
621b3369c1fSRusty Russell 
622b3369c1fSRusty Russell 	BUG_ON(vi->num != 0);
62374b2553fSRusty Russell 
62474b2553fSRusty Russell 	vdev->config->del_vq(vi->svq);
62574b2553fSRusty Russell 	vdev->config->del_vq(vi->rvq);
62674b2553fSRusty Russell 	unregister_netdev(vi->dev);
627fb6813f4SRusty Russell 
628fb6813f4SRusty Russell 	while (vi->pages)
629fb6813f4SRusty Russell 		__free_pages(get_a_page(vi, GFP_KERNEL), 0);
630fb6813f4SRusty Russell 
63174b2553fSRusty Russell 	free_netdev(vi->dev);
632296f96fcSRusty Russell }
633296f96fcSRusty Russell 
634296f96fcSRusty Russell static struct virtio_device_id id_table[] = {
635296f96fcSRusty Russell 	{ VIRTIO_ID_NET, VIRTIO_DEV_ANY_ID },
636296f96fcSRusty Russell 	{ 0 },
637296f96fcSRusty Russell };
638296f96fcSRusty Russell 
639c45a6816SRusty Russell static unsigned int features[] = {
6405e4fe5c4SMark McLoughlin 	VIRTIO_NET_F_CSUM, VIRTIO_NET_F_GUEST_CSUM,
6415e4fe5c4SMark McLoughlin 	VIRTIO_NET_F_GSO, VIRTIO_NET_F_MAC,
642c45a6816SRusty Russell 	VIRTIO_NET_F_HOST_TSO4, VIRTIO_NET_F_HOST_UFO, VIRTIO_NET_F_HOST_TSO6,
64397402b96SHerbert Xu 	VIRTIO_NET_F_HOST_ECN, VIRTIO_NET_F_GUEST_TSO4, VIRTIO_NET_F_GUEST_TSO6,
64497402b96SHerbert Xu 	VIRTIO_NET_F_GUEST_ECN, /* We don't yet handle UFO input. */
64597402b96SHerbert Xu 	VIRTIO_F_NOTIFY_ON_EMPTY,
646c45a6816SRusty Russell };
647c45a6816SRusty Russell 
648296f96fcSRusty Russell static struct virtio_driver virtio_net = {
649c45a6816SRusty Russell 	.feature_table = features,
650c45a6816SRusty Russell 	.feature_table_size = ARRAY_SIZE(features),
651296f96fcSRusty Russell 	.driver.name =	KBUILD_MODNAME,
652296f96fcSRusty Russell 	.driver.owner =	THIS_MODULE,
653296f96fcSRusty Russell 	.id_table =	id_table,
654296f96fcSRusty Russell 	.probe =	virtnet_probe,
655296f96fcSRusty Russell 	.remove =	__devexit_p(virtnet_remove),
656296f96fcSRusty Russell };
657296f96fcSRusty Russell 
658296f96fcSRusty Russell static int __init init(void)
659296f96fcSRusty Russell {
660296f96fcSRusty Russell 	return register_virtio_driver(&virtio_net);
661296f96fcSRusty Russell }
662296f96fcSRusty Russell 
663296f96fcSRusty Russell static void __exit fini(void)
664296f96fcSRusty Russell {
665296f96fcSRusty Russell 	unregister_virtio_driver(&virtio_net);
666296f96fcSRusty Russell }
667296f96fcSRusty Russell module_init(init);
668296f96fcSRusty Russell module_exit(fini);
669296f96fcSRusty Russell 
670296f96fcSRusty Russell MODULE_DEVICE_TABLE(virtio, id_table);
671296f96fcSRusty Russell MODULE_DESCRIPTION("Virtio network driver");
672296f96fcSRusty Russell MODULE_LICENSE("GPL");
673