/*
 * Copyright (c) 2007-2012 Nicira, Inc.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of version 2 of the GNU General Public
 * License as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
 * 02110-1301, USA
 */
18ccb1352eSJesse Gross 
19ccb1352eSJesse Gross #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
20ccb1352eSJesse Gross 
21ccb1352eSJesse Gross #include <linux/if_arp.h>
22ccb1352eSJesse Gross #include <linux/if_bridge.h>
23ccb1352eSJesse Gross #include <linux/if_vlan.h>
24ccb1352eSJesse Gross #include <linux/kernel.h>
25ccb1352eSJesse Gross #include <linux/llc.h>
26ccb1352eSJesse Gross #include <linux/rtnetlink.h>
27ccb1352eSJesse Gross #include <linux/skbuff.h>
282537b4ddSJiri Pirko #include <linux/openvswitch.h>
29dcc38c03SThomas Graf #include <linux/export.h>
30ccb1352eSJesse Gross 
31614732eaSThomas Graf #include <net/ip_tunnels.h>
32614732eaSThomas Graf #include <net/rtnetlink.h>
33ccb1352eSJesse Gross 
34ccb1352eSJesse Gross #include "datapath.h"
35614732eaSThomas Graf #include "vport.h"
36ccb1352eSJesse Gross #include "vport-internal_dev.h"
37ccb1352eSJesse Gross #include "vport-netdev.h"
38ccb1352eSJesse Gross 
3962b9c8d0SThomas Graf static struct vport_ops ovs_netdev_vport_ops;
4062b9c8d0SThomas Graf 
41ccb1352eSJesse Gross /* Must be called with rcu_read_lock. */
42ccb1352eSJesse Gross static void netdev_port_receive(struct vport *vport, struct sk_buff *skb)
43ccb1352eSJesse Gross {
44d9d59089SJesse Gross 	if (unlikely(!vport))
45d9d59089SJesse Gross 		goto error;
46d9d59089SJesse Gross 
47d9d59089SJesse Gross 	if (unlikely(skb_warn_if_lro(skb)))
48d9d59089SJesse Gross 		goto error;
49ccb1352eSJesse Gross 
50ccb1352eSJesse Gross 	/* Make our own copy of the packet.  Otherwise we will mangle the
51ccb1352eSJesse Gross 	 * packet for anyone who came before us (e.g. tcpdump via AF_PACKET).
52d176ca2aSCong Wang 	 */
53ccb1352eSJesse Gross 	skb = skb_share_check(skb, GFP_ATOMIC);
54ccb1352eSJesse Gross 	if (unlikely(!skb))
55ccb1352eSJesse Gross 		return;
56ccb1352eSJesse Gross 
57ccb1352eSJesse Gross 	skb_push(skb, ETH_HLEN);
58b34df5e8SPravin B Shelar 	ovs_skb_postpush_rcsum(skb, skb->data, ETH_HLEN);
59b34df5e8SPravin B Shelar 
6061adedf3SJiri Benc 	ovs_vport_receive(vport, skb, skb_tunnel_info(skb));
61d9d59089SJesse Gross 	return;
62d9d59089SJesse Gross 
63d9d59089SJesse Gross error:
64d9d59089SJesse Gross 	kfree_skb(skb);
65ccb1352eSJesse Gross }
66ccb1352eSJesse Gross 
67ccb1352eSJesse Gross /* Called with rcu_read_lock and bottom-halves disabled. */
68ccb1352eSJesse Gross static rx_handler_result_t netdev_frame_hook(struct sk_buff **pskb)
69ccb1352eSJesse Gross {
70ccb1352eSJesse Gross 	struct sk_buff *skb = *pskb;
71ccb1352eSJesse Gross 	struct vport *vport;
72ccb1352eSJesse Gross 
73ccb1352eSJesse Gross 	if (unlikely(skb->pkt_type == PACKET_LOOPBACK))
74ccb1352eSJesse Gross 		return RX_HANDLER_PASS;
75ccb1352eSJesse Gross 
76ccb1352eSJesse Gross 	vport = ovs_netdev_get_vport(skb->dev);
77ccb1352eSJesse Gross 
78ccb1352eSJesse Gross 	netdev_port_receive(vport, skb);
79ccb1352eSJesse Gross 
80ccb1352eSJesse Gross 	return RX_HANDLER_CONSUMED;
81ccb1352eSJesse Gross }
82ccb1352eSJesse Gross 
8312eb18f7SThomas Graf static struct net_device *get_dpdev(const struct datapath *dp)
842537b4ddSJiri Pirko {
852537b4ddSJiri Pirko 	struct vport *local;
862537b4ddSJiri Pirko 
872537b4ddSJiri Pirko 	local = ovs_vport_ovsl(dp, OVSP_LOCAL);
882537b4ddSJiri Pirko 	BUG_ON(!local);
89be4ace6eSThomas Graf 	return local->dev;
902537b4ddSJiri Pirko }
912537b4ddSJiri Pirko 
92dcc38c03SThomas Graf struct vport *ovs_netdev_link(struct vport *vport, const char *name)
93ccb1352eSJesse Gross {
94ccb1352eSJesse Gross 	int err;
95ccb1352eSJesse Gross 
96be4ace6eSThomas Graf 	vport->dev = dev_get_by_name(ovs_dp_get_net(vport->dp), name);
97be4ace6eSThomas Graf 	if (!vport->dev) {
98ccb1352eSJesse Gross 		err = -ENODEV;
99ccb1352eSJesse Gross 		goto error_free_vport;
100ccb1352eSJesse Gross 	}
101ccb1352eSJesse Gross 
102be4ace6eSThomas Graf 	if (vport->dev->flags & IFF_LOOPBACK ||
103be4ace6eSThomas Graf 	    vport->dev->type != ARPHRD_ETHER ||
104be4ace6eSThomas Graf 	    ovs_is_internal_dev(vport->dev)) {
105ccb1352eSJesse Gross 		err = -EINVAL;
106ccb1352eSJesse Gross 		goto error_put;
107ccb1352eSJesse Gross 	}
108ccb1352eSJesse Gross 
1098e4e1713SPravin B Shelar 	rtnl_lock();
110be4ace6eSThomas Graf 	err = netdev_master_upper_dev_link(vport->dev,
1112537b4ddSJiri Pirko 					   get_dpdev(vport->dp));
1122537b4ddSJiri Pirko 	if (err)
1132537b4ddSJiri Pirko 		goto error_unlock;
1142537b4ddSJiri Pirko 
115be4ace6eSThomas Graf 	err = netdev_rx_handler_register(vport->dev, netdev_frame_hook,
116ccb1352eSJesse Gross 					 vport);
117ccb1352eSJesse Gross 	if (err)
1182537b4ddSJiri Pirko 		goto error_master_upper_dev_unlink;
119ccb1352eSJesse Gross 
120be4ace6eSThomas Graf 	dev_disable_lro(vport->dev);
121be4ace6eSThomas Graf 	dev_set_promiscuity(vport->dev, 1);
122be4ace6eSThomas Graf 	vport->dev->priv_flags |= IFF_OVS_DATAPATH;
1238e4e1713SPravin B Shelar 	rtnl_unlock();
124ccb1352eSJesse Gross 
125ccb1352eSJesse Gross 	return vport;
126ccb1352eSJesse Gross 
1272537b4ddSJiri Pirko error_master_upper_dev_unlink:
128be4ace6eSThomas Graf 	netdev_upper_dev_unlink(vport->dev, get_dpdev(vport->dp));
1298e4e1713SPravin B Shelar error_unlock:
1308e4e1713SPravin B Shelar 	rtnl_unlock();
131ccb1352eSJesse Gross error_put:
132be4ace6eSThomas Graf 	dev_put(vport->dev);
133ccb1352eSJesse Gross error_free_vport:
134ccb1352eSJesse Gross 	ovs_vport_free(vport);
135ccb1352eSJesse Gross 	return ERR_PTR(err);
136ccb1352eSJesse Gross }
137dcc38c03SThomas Graf EXPORT_SYMBOL_GPL(ovs_netdev_link);
138ccb1352eSJesse Gross 
139be4ace6eSThomas Graf static struct vport *netdev_create(const struct vport_parms *parms)
140be4ace6eSThomas Graf {
141be4ace6eSThomas Graf 	struct vport *vport;
142be4ace6eSThomas Graf 
143be4ace6eSThomas Graf 	vport = ovs_vport_alloc(0, &ovs_netdev_vport_ops, parms);
144be4ace6eSThomas Graf 	if (IS_ERR(vport))
145be4ace6eSThomas Graf 		return vport;
146be4ace6eSThomas Graf 
147dcc38c03SThomas Graf 	return ovs_netdev_link(vport, parms->name);
148be4ace6eSThomas Graf }
149be4ace6eSThomas Graf 
150a9020fdeSPravin B Shelar static void vport_netdev_free(struct rcu_head *rcu)
15192eb1d47SJesse Gross {
152be4ace6eSThomas Graf 	struct vport *vport = container_of(rcu, struct vport, rcu);
15392eb1d47SJesse Gross 
154614732eaSThomas Graf 	if (vport->dev)
155be4ace6eSThomas Graf 		dev_put(vport->dev);
156be4ace6eSThomas Graf 	ovs_vport_free(vport);
15792eb1d47SJesse Gross }
15892eb1d47SJesse Gross 
159b07c2651SAlexei Starovoitov void ovs_netdev_detach_dev(struct vport *vport)
160b07c2651SAlexei Starovoitov {
161b07c2651SAlexei Starovoitov 	ASSERT_RTNL();
162be4ace6eSThomas Graf 	vport->dev->priv_flags &= ~IFF_OVS_DATAPATH;
163be4ace6eSThomas Graf 	netdev_rx_handler_unregister(vport->dev);
164be4ace6eSThomas Graf 	netdev_upper_dev_unlink(vport->dev,
165be4ace6eSThomas Graf 				netdev_master_upper_dev_get(vport->dev));
166be4ace6eSThomas Graf 	dev_set_promiscuity(vport->dev, -1);
167b07c2651SAlexei Starovoitov }
168dcc38c03SThomas Graf EXPORT_SYMBOL_GPL(ovs_netdev_detach_dev);
169b07c2651SAlexei Starovoitov 
170ccb1352eSJesse Gross static void netdev_destroy(struct vport *vport)
171ccb1352eSJesse Gross {
1728e4e1713SPravin B Shelar 	rtnl_lock();
173be4ace6eSThomas Graf 	if (vport->dev->priv_flags & IFF_OVS_DATAPATH)
174b07c2651SAlexei Starovoitov 		ovs_netdev_detach_dev(vport);
1758e4e1713SPravin B Shelar 	rtnl_unlock();
176ccb1352eSJesse Gross 
177a9020fdeSPravin B Shelar 	call_rcu(&vport->rcu, vport_netdev_free);
178ccb1352eSJesse Gross }
179ccb1352eSJesse Gross 
180a9020fdeSPravin B Shelar void ovs_netdev_tunnel_destroy(struct vport *vport)
181a9020fdeSPravin B Shelar {
182a9020fdeSPravin B Shelar 	rtnl_lock();
183a9020fdeSPravin B Shelar 	if (vport->dev->priv_flags & IFF_OVS_DATAPATH)
184a9020fdeSPravin B Shelar 		ovs_netdev_detach_dev(vport);
185a9020fdeSPravin B Shelar 
186a9020fdeSPravin B Shelar 	/* Early release so we can unregister the device */
187a9020fdeSPravin B Shelar 	dev_put(vport->dev);
188a9020fdeSPravin B Shelar 	rtnl_delete_link(vport->dev);
189a9020fdeSPravin B Shelar 	vport->dev = NULL;
190a9020fdeSPravin B Shelar 	rtnl_unlock();
191a9020fdeSPravin B Shelar 
192a9020fdeSPravin B Shelar 	call_rcu(&vport->rcu, vport_netdev_free);
193a9020fdeSPravin B Shelar }
194a9020fdeSPravin B Shelar EXPORT_SYMBOL_GPL(ovs_netdev_tunnel_destroy);
195a9020fdeSPravin B Shelar 
19695c96174SEric Dumazet static unsigned int packet_length(const struct sk_buff *skb)
197ccb1352eSJesse Gross {
19895c96174SEric Dumazet 	unsigned int length = skb->len - ETH_HLEN;
199ccb1352eSJesse Gross 
200ccb1352eSJesse Gross 	if (skb->protocol == htons(ETH_P_8021Q))
201ccb1352eSJesse Gross 		length -= VLAN_HLEN;
202ccb1352eSJesse Gross 
203ccb1352eSJesse Gross 	return length;
204ccb1352eSJesse Gross }
205ccb1352eSJesse Gross 
206dcc38c03SThomas Graf int ovs_netdev_send(struct vport *vport, struct sk_buff *skb)
207ccb1352eSJesse Gross {
208be4ace6eSThomas Graf 	int mtu = vport->dev->mtu;
209ccb1352eSJesse Gross 	int len;
210ccb1352eSJesse Gross 
211ccb1352eSJesse Gross 	if (unlikely(packet_length(skb) > mtu && !skb_is_gso(skb))) {
212e87cc472SJoe Perches 		net_warn_ratelimited("%s: dropped over-mtu packet: %d > %d\n",
213be4ace6eSThomas Graf 				     vport->dev->name,
214e87cc472SJoe Perches 				     packet_length(skb), mtu);
21591b7514cSPravin B Shelar 		goto drop;
216ccb1352eSJesse Gross 	}
217ccb1352eSJesse Gross 
218be4ace6eSThomas Graf 	skb->dev = vport->dev;
219ccb1352eSJesse Gross 	len = skb->len;
220ccb1352eSJesse Gross 	dev_queue_xmit(skb);
221ccb1352eSJesse Gross 
222ccb1352eSJesse Gross 	return len;
223ccb1352eSJesse Gross 
22491b7514cSPravin B Shelar drop:
225ccb1352eSJesse Gross 	kfree_skb(skb);
226ccb1352eSJesse Gross 	return 0;
227ccb1352eSJesse Gross }
228dcc38c03SThomas Graf EXPORT_SYMBOL_GPL(ovs_netdev_send);
229ccb1352eSJesse Gross 
230ccb1352eSJesse Gross /* Returns null if this device is not attached to a datapath. */
231ccb1352eSJesse Gross struct vport *ovs_netdev_get_vport(struct net_device *dev)
232ccb1352eSJesse Gross {
233ccb1352eSJesse Gross 	if (likely(dev->priv_flags & IFF_OVS_DATAPATH))
234ccb1352eSJesse Gross 		return (struct vport *)
235ccb1352eSJesse Gross 			rcu_dereference_rtnl(dev->rx_handler_data);
236ccb1352eSJesse Gross 	else
237ccb1352eSJesse Gross 		return NULL;
238ccb1352eSJesse Gross }
239ccb1352eSJesse Gross 
24062b9c8d0SThomas Graf static struct vport_ops ovs_netdev_vport_ops = {
241ccb1352eSJesse Gross 	.type		= OVS_VPORT_TYPE_NETDEV,
242ccb1352eSJesse Gross 	.create		= netdev_create,
243ccb1352eSJesse Gross 	.destroy	= netdev_destroy,
244dcc38c03SThomas Graf 	.send		= ovs_netdev_send,
245ccb1352eSJesse Gross };
24662b9c8d0SThomas Graf 
24762b9c8d0SThomas Graf int __init ovs_netdev_init(void)
24862b9c8d0SThomas Graf {
249dcc38c03SThomas Graf 	return ovs_vport_ops_register(&ovs_netdev_vport_ops);
25062b9c8d0SThomas Graf }
25162b9c8d0SThomas Graf 
25262b9c8d0SThomas Graf void ovs_netdev_exit(void)
25362b9c8d0SThomas Graf {
25462b9c8d0SThomas Graf 	ovs_vport_ops_unregister(&ovs_netdev_vport_ops);
25562b9c8d0SThomas Graf }
256