xref: /openbmc/linux/net/ipv4/ip_tunnel.c (revision 4baf4a2919b2a13a7f67d63f34b03f823ea7c0e8)
1c9422999SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only
2c5441932SPravin B Shelar /*
3c5441932SPravin B Shelar  * Copyright (c) 2013 Nicira, Inc.
4c5441932SPravin B Shelar  */
5c5441932SPravin B Shelar 
6c5441932SPravin B Shelar #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
7c5441932SPravin B Shelar 
8c5441932SPravin B Shelar #include <linux/capability.h>
9c5441932SPravin B Shelar #include <linux/module.h>
10c5441932SPravin B Shelar #include <linux/types.h>
11c5441932SPravin B Shelar #include <linux/kernel.h>
12c5441932SPravin B Shelar #include <linux/slab.h>
13c5441932SPravin B Shelar #include <linux/uaccess.h>
14c5441932SPravin B Shelar #include <linux/skbuff.h>
15c5441932SPravin B Shelar #include <linux/netdevice.h>
16c5441932SPravin B Shelar #include <linux/in.h>
17c5441932SPravin B Shelar #include <linux/tcp.h>
18c5441932SPravin B Shelar #include <linux/udp.h>
19c5441932SPravin B Shelar #include <linux/if_arp.h>
20c5441932SPravin B Shelar #include <linux/init.h>
21c5441932SPravin B Shelar #include <linux/in6.h>
22c5441932SPravin B Shelar #include <linux/inetdevice.h>
23c5441932SPravin B Shelar #include <linux/igmp.h>
24c5441932SPravin B Shelar #include <linux/netfilter_ipv4.h>
25c5441932SPravin B Shelar #include <linux/etherdevice.h>
26c5441932SPravin B Shelar #include <linux/if_ether.h>
27c5441932SPravin B Shelar #include <linux/if_vlan.h>
28c5441932SPravin B Shelar #include <linux/rculist.h>
2927d79f3bSSachin Kamat #include <linux/err.h>
30c5441932SPravin B Shelar 
31c5441932SPravin B Shelar #include <net/sock.h>
32c5441932SPravin B Shelar #include <net/ip.h>
33c5441932SPravin B Shelar #include <net/icmp.h>
34c5441932SPravin B Shelar #include <net/protocol.h>
35c5441932SPravin B Shelar #include <net/ip_tunnels.h>
36c5441932SPravin B Shelar #include <net/arp.h>
37c5441932SPravin B Shelar #include <net/checksum.h>
38c5441932SPravin B Shelar #include <net/dsfield.h>
39c5441932SPravin B Shelar #include <net/inet_ecn.h>
40c5441932SPravin B Shelar #include <net/xfrm.h>
41c5441932SPravin B Shelar #include <net/net_namespace.h>
42c5441932SPravin B Shelar #include <net/netns/generic.h>
43c5441932SPravin B Shelar #include <net/rtnetlink.h>
4456328486STom Herbert #include <net/udp.h>
45cfc7381bSAlexei Starovoitov #include <net/dst_metadata.h>
463b1a7fb7SIdo Schimmel #include <net/inet_dscp.h>
4763487babSTom Herbert 
48c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
49c5441932SPravin B Shelar #include <net/ipv6.h>
50c5441932SPravin B Shelar #include <net/ip6_fib.h>
51c5441932SPravin B Shelar #include <net/ip6_route.h>
52c5441932SPravin B Shelar #endif
53c5441932SPravin B Shelar 
/* Map a (key, remote address) pair to a bucket index by XOR-ing the two
 * values and hashing the result down to IP_TNL_HASH_BITS bits.
 */
static unsigned int ip_tunnel_hash(__be32 key, __be32 remote)
{
	u32 mixed = (__force u32)key ^ (__force u32)remote;

	return hash_32(mixed, IP_TNL_HASH_BITS);
}
59c5441932SPravin B Shelar 
ip_tunnel_key_match(const struct ip_tunnel_parm * p,__be16 flags,__be32 key)60c5441932SPravin B Shelar static bool ip_tunnel_key_match(const struct ip_tunnel_parm *p,
61c5441932SPravin B Shelar 				__be16 flags, __be32 key)
62c5441932SPravin B Shelar {
63c5441932SPravin B Shelar 	if (p->i_flags & TUNNEL_KEY) {
64c5441932SPravin B Shelar 		if (flags & TUNNEL_KEY)
65c5441932SPravin B Shelar 			return key == p->i_key;
66c5441932SPravin B Shelar 		else
67c5441932SPravin B Shelar 			/* key expected, none present */
68c5441932SPravin B Shelar 			return false;
69c5441932SPravin B Shelar 	} else
70c5441932SPravin B Shelar 		return !(flags & TUNNEL_KEY);
71c5441932SPravin B Shelar }
72c5441932SPravin B Shelar 
/* Fallback tunnel: no source, no destination, no key, no options

   Tunnel hash table:
   We require an exact key match, i.e. if a key is present in the packet
   it will match only a tunnel with the same key; if it is not present,
   it will match only a keyless tunnel.

   All keyless packets that do not match a configured keyless tunnel
   will match the fallback tunnel.
   Given src, dst and key, find the appropriate tunnel for input.
*/
/* Find the tunnel that should receive a packet.
 *
 * @itn:    per-netns tunnel table to search
 * @link:   link index to prefer
 * @flags:  tunnel flags seen on the packet
 * @remote: address compared against each tunnel's configured daddr
 * @local:  address compared against each tunnel's configured saddr
 * @key:    key carried by the packet
 *
 * Four passes are made, from the most to the least specific address match.
 * Within any pass a tunnel whose link equals @link is returned at once;
 * otherwise a tunnel is remembered as a candidate.  If no pass returns,
 * the candidate is used, then the collect_md tunnel, then the fallback
 * device, the last two only if they are IFF_UP.  Returns NULL if nothing
 * matches.
 */
struct ip_tunnel *ip_tunnel_lookup(struct ip_tunnel_net *itn,
				   int link, __be16 flags,
				   __be32 remote, __be32 local,
				   __be32 key)
{
	struct ip_tunnel *best = NULL;
	struct hlist_head *bucket;
	struct net_device *fb_dev;
	struct ip_tunnel *t;

	/* Passes 1 and 2 walk the bucket selected by (key, remote). */
	bucket = &itn->tunnels[ip_tunnel_hash(key, remote)];

	/* Pass 1: both configured addresses equal the packet's. */
	hlist_for_each_entry_rcu(t, bucket, hash_node) {
		if (local == t->parms.iph.saddr &&
		    remote == t->parms.iph.daddr &&
		    (t->dev->flags & IFF_UP) &&
		    ip_tunnel_key_match(&t->parms, flags, key)) {
			if (READ_ONCE(t->parms.link) == link)
				return t;
			/* This pass overwrites the candidate unconditionally. */
			best = t;
		}
	}

	/* Pass 2: remote matches and the tunnel has no configured saddr. */
	hlist_for_each_entry_rcu(t, bucket, hash_node) {
		if (remote == t->parms.iph.daddr &&
		    t->parms.iph.saddr == 0 &&
		    (t->dev->flags & IFF_UP) &&
		    ip_tunnel_key_match(&t->parms, flags, key)) {
			if (READ_ONCE(t->parms.link) == link)
				return t;
			if (!best)
				best = t;
		}
	}

	/* Passes 3 and 4 walk the bucket selected by (key, 0). */
	bucket = &itn->tunnels[ip_tunnel_hash(key, 0)];

	/* Pass 3: local matches saddr with no daddr configured, or local is
	 * a multicast address equal to the tunnel's daddr.
	 */
	hlist_for_each_entry_rcu(t, bucket, hash_node) {
		bool addr_ok;

		addr_ok = (local == t->parms.iph.saddr &&
			   t->parms.iph.daddr == 0) ||
			  (local == t->parms.iph.daddr &&
			   ipv4_is_multicast(local));

		if (addr_ok &&
		    (t->dev->flags & IFF_UP) &&
		    ip_tunnel_key_match(&t->parms, flags, key)) {
			if (READ_ONCE(t->parms.link) == link)
				return t;
			if (!best)
				best = t;
		}
	}

	/* Pass 4: tunnels with neither address configured; the key must be
	 * equal unless the packet carries TUNNEL_NO_KEY.
	 */
	hlist_for_each_entry_rcu(t, bucket, hash_node) {
		if (((flags & TUNNEL_NO_KEY) || t->parms.i_key == key) &&
		    t->parms.iph.saddr == 0 &&
		    t->parms.iph.daddr == 0 &&
		    (t->dev->flags & IFF_UP)) {
			if (READ_ONCE(t->parms.link) == link)
				return t;
			if (!best)
				best = t;
		}
	}

	if (best)
		return best;

	t = rcu_dereference(itn->collect_md_tun);
	if (t && (t->dev->flags & IFF_UP))
		return t;

	fb_dev = READ_ONCE(itn->fb_tunnel_dev);
	if (fb_dev && (fb_dev->flags & IFF_UP))
		return netdev_priv(fb_dev);

	return NULL;
}
EXPORT_SYMBOL_GPL(ip_tunnel_lookup);
173c5441932SPravin B Shelar 
ip_bucket(struct ip_tunnel_net * itn,struct ip_tunnel_parm * parms)174c5441932SPravin B Shelar static struct hlist_head *ip_bucket(struct ip_tunnel_net *itn,
175c5441932SPravin B Shelar 				    struct ip_tunnel_parm *parms)
176c5441932SPravin B Shelar {
177c5441932SPravin B Shelar 	unsigned int h;
178c5441932SPravin B Shelar 	__be32 remote;
1796d608f06SSteffen Klassert 	__be32 i_key = parms->i_key;
180c5441932SPravin B Shelar 
181c5441932SPravin B Shelar 	if (parms->iph.daddr && !ipv4_is_multicast(parms->iph.daddr))
182c5441932SPravin B Shelar 		remote = parms->iph.daddr;
183c5441932SPravin B Shelar 	else
184c5441932SPravin B Shelar 		remote = 0;
185c5441932SPravin B Shelar 
1866d608f06SSteffen Klassert 	if (!(parms->i_flags & TUNNEL_KEY) && (parms->i_flags & VTI_ISVTI))
1876d608f06SSteffen Klassert 		i_key = 0;
1886d608f06SSteffen Klassert 
1896d608f06SSteffen Klassert 	h = ip_tunnel_hash(i_key, remote);
190c5441932SPravin B Shelar 	return &itn->tunnels[h];
191c5441932SPravin B Shelar }
192c5441932SPravin B Shelar 
ip_tunnel_add(struct ip_tunnel_net * itn,struct ip_tunnel * t)193c5441932SPravin B Shelar static void ip_tunnel_add(struct ip_tunnel_net *itn, struct ip_tunnel *t)
194c5441932SPravin B Shelar {
195c5441932SPravin B Shelar 	struct hlist_head *head = ip_bucket(itn, &t->parms);
196c5441932SPravin B Shelar 
1972e15ea39SPravin B Shelar 	if (t->collect_md)
1982e15ea39SPravin B Shelar 		rcu_assign_pointer(itn->collect_md_tun, t);
199c5441932SPravin B Shelar 	hlist_add_head_rcu(&t->hash_node, head);
200c5441932SPravin B Shelar }
201c5441932SPravin B Shelar 
ip_tunnel_del(struct ip_tunnel_net * itn,struct ip_tunnel * t)2022e15ea39SPravin B Shelar static void ip_tunnel_del(struct ip_tunnel_net *itn, struct ip_tunnel *t)
203c5441932SPravin B Shelar {
2042e15ea39SPravin B Shelar 	if (t->collect_md)
2052e15ea39SPravin B Shelar 		rcu_assign_pointer(itn->collect_md_tun, NULL);
206c5441932SPravin B Shelar 	hlist_del_init_rcu(&t->hash_node);
207c5441932SPravin B Shelar }
208c5441932SPravin B Shelar 
ip_tunnel_find(struct ip_tunnel_net * itn,struct ip_tunnel_parm * parms,int type)209c5441932SPravin B Shelar static struct ip_tunnel *ip_tunnel_find(struct ip_tunnel_net *itn,
210c5441932SPravin B Shelar 					struct ip_tunnel_parm *parms,
211c5441932SPravin B Shelar 					int type)
212c5441932SPravin B Shelar {
213c5441932SPravin B Shelar 	__be32 remote = parms->iph.daddr;
214c5441932SPravin B Shelar 	__be32 local = parms->iph.saddr;
215c5441932SPravin B Shelar 	__be32 key = parms->i_key;
2165ce54af1SDmitry Popov 	__be16 flags = parms->i_flags;
217c5441932SPravin B Shelar 	int link = parms->link;
218c5441932SPravin B Shelar 	struct ip_tunnel *t = NULL;
219c5441932SPravin B Shelar 	struct hlist_head *head = ip_bucket(itn, parms);
220c5441932SPravin B Shelar 
221*e0500e43SIdo Schimmel 	hlist_for_each_entry_rcu(t, head, hash_node, lockdep_rtnl_is_held()) {
222c5441932SPravin B Shelar 		if (local == t->parms.iph.saddr &&
223c5441932SPravin B Shelar 		    remote == t->parms.iph.daddr &&
22477b1e00fSEric Dumazet 		    link == READ_ONCE(t->parms.link) &&
2255ce54af1SDmitry Popov 		    type == t->dev->type &&
2265ce54af1SDmitry Popov 		    ip_tunnel_key_match(&t->parms, flags, key))
227c5441932SPravin B Shelar 			break;
228c5441932SPravin B Shelar 	}
229c5441932SPravin B Shelar 	return t;
230c5441932SPravin B Shelar }
231c5441932SPravin B Shelar 
__ip_tunnel_create(struct net * net,const struct rtnl_link_ops * ops,struct ip_tunnel_parm * parms)232c5441932SPravin B Shelar static struct net_device *__ip_tunnel_create(struct net *net,
233c5441932SPravin B Shelar 					     const struct rtnl_link_ops *ops,
234c5441932SPravin B Shelar 					     struct ip_tunnel_parm *parms)
235c5441932SPravin B Shelar {
236c5441932SPravin B Shelar 	int err;
237c5441932SPravin B Shelar 	struct ip_tunnel *tunnel;
238c5441932SPravin B Shelar 	struct net_device *dev;
239c5441932SPravin B Shelar 	char name[IFNAMSIZ];
240c5441932SPravin B Shelar 
241c5441932SPravin B Shelar 	err = -E2BIG;
2429cb726a2SEric Dumazet 	if (parms->name[0]) {
2439cb726a2SEric Dumazet 		if (!dev_valid_name(parms->name))
244c5441932SPravin B Shelar 			goto failed;
245512b2dc4SXueBing Chen 		strscpy(name, parms->name, IFNAMSIZ);
2469cb726a2SEric Dumazet 	} else {
2479cb726a2SEric Dumazet 		if (strlen(ops->kind) > (IFNAMSIZ - 3))
2489cb726a2SEric Dumazet 			goto failed;
249000ade80SSultan Alsawaf 		strcpy(name, ops->kind);
250000ade80SSultan Alsawaf 		strcat(name, "%d");
251c5441932SPravin B Shelar 	}
252c5441932SPravin B Shelar 
253c5441932SPravin B Shelar 	ASSERT_RTNL();
254c835a677STom Gundersen 	dev = alloc_netdev(ops->priv_size, name, NET_NAME_UNKNOWN, ops->setup);
255c5441932SPravin B Shelar 	if (!dev) {
256c5441932SPravin B Shelar 		err = -ENOMEM;
257c5441932SPravin B Shelar 		goto failed;
258c5441932SPravin B Shelar 	}
259c5441932SPravin B Shelar 	dev_net_set(dev, net);
260c5441932SPravin B Shelar 
261c5441932SPravin B Shelar 	dev->rtnl_link_ops = ops;
262c5441932SPravin B Shelar 
263c5441932SPravin B Shelar 	tunnel = netdev_priv(dev);
264c5441932SPravin B Shelar 	tunnel->parms = *parms;
2655e6700b3SNicolas Dichtel 	tunnel->net = net;
266c5441932SPravin B Shelar 
267c5441932SPravin B Shelar 	err = register_netdevice(dev);
268c5441932SPravin B Shelar 	if (err)
269c5441932SPravin B Shelar 		goto failed_free;
270c5441932SPravin B Shelar 
271c5441932SPravin B Shelar 	return dev;
272c5441932SPravin B Shelar 
273c5441932SPravin B Shelar failed_free:
274c5441932SPravin B Shelar 	free_netdev(dev);
275c5441932SPravin B Shelar failed:
276c5441932SPravin B Shelar 	return ERR_PTR(err);
277c5441932SPravin B Shelar }
278c5441932SPravin B Shelar 
ip_tunnel_bind_dev(struct net_device * dev)279c5441932SPravin B Shelar static int ip_tunnel_bind_dev(struct net_device *dev)
280c5441932SPravin B Shelar {
281c5441932SPravin B Shelar 	struct net_device *tdev = NULL;
282c5441932SPravin B Shelar 	struct ip_tunnel *tunnel = netdev_priv(dev);
283c5441932SPravin B Shelar 	const struct iphdr *iph;
284c5441932SPravin B Shelar 	int hlen = LL_MAX_HEADER;
285c5441932SPravin B Shelar 	int mtu = ETH_DATA_LEN;
286c5441932SPravin B Shelar 	int t_hlen = tunnel->hlen + sizeof(struct iphdr);
287c5441932SPravin B Shelar 
288c5441932SPravin B Shelar 	iph = &tunnel->parms.iph;
289c5441932SPravin B Shelar 
290c5441932SPravin B Shelar 	/* Guess output device to choose reasonable mtu and needed_headroom */
291c5441932SPravin B Shelar 	if (iph->daddr) {
292c5441932SPravin B Shelar 		struct flowi4 fl4;
293c5441932SPravin B Shelar 		struct rtable *rt;
294c5441932SPravin B Shelar 
295b0066da5SPetr Machata 		ip_tunnel_init_flow(&fl4, iph->protocol, iph->daddr,
2967d442fabSTom Herbert 				    iph->saddr, tunnel->parms.o_key,
29736eff866SXiao Liang 				    iph->tos & INET_DSCP_MASK, tunnel->net,
2987ec9fce4SEyal Birger 				    tunnel->parms.link, tunnel->fwmark, 0, 0);
2997d442fabSTom Herbert 		rt = ip_route_output_key(tunnel->net, &fl4);
3007d442fabSTom Herbert 
301c5441932SPravin B Shelar 		if (!IS_ERR(rt)) {
302c5441932SPravin B Shelar 			tdev = rt->dst.dev;
303c5441932SPravin B Shelar 			ip_rt_put(rt);
304c5441932SPravin B Shelar 		}
305c5441932SPravin B Shelar 		if (dev->type != ARPHRD_ETHER)
306c5441932SPravin B Shelar 			dev->flags |= IFF_POINTOPOINT;
307f27337e1SPaolo Abeni 
308f27337e1SPaolo Abeni 		dst_cache_reset(&tunnel->dst_cache);
309c5441932SPravin B Shelar 	}
310c5441932SPravin B Shelar 
311c5441932SPravin B Shelar 	if (!tdev && tunnel->parms.link)
3126c742e71SNicolas Dichtel 		tdev = __dev_get_by_index(tunnel->net, tunnel->parms.link);
313c5441932SPravin B Shelar 
314c5441932SPravin B Shelar 	if (tdev) {
315c5441932SPravin B Shelar 		hlen = tdev->hard_header_len + tdev->needed_headroom;
31682612de1SNicolas Dichtel 		mtu = min(tdev->mtu, IP_MAX_MTU);
317c5441932SPravin B Shelar 	}
318c5441932SPravin B Shelar 
319c5441932SPravin B Shelar 	dev->needed_headroom = t_hlen + hlen;
3209992a078SHangbin Liu 	mtu -= t_hlen + (dev->type == ARPHRD_ETHER ? dev->hard_header_len : 0);
321c5441932SPravin B Shelar 
322b5476022SEric Dumazet 	if (mtu < IPV4_MIN_MTU)
323b5476022SEric Dumazet 		mtu = IPV4_MIN_MTU;
324c5441932SPravin B Shelar 
325c5441932SPravin B Shelar 	return mtu;
326c5441932SPravin B Shelar }
327c5441932SPravin B Shelar 
ip_tunnel_create(struct net * net,struct ip_tunnel_net * itn,struct ip_tunnel_parm * parms)328c5441932SPravin B Shelar static struct ip_tunnel *ip_tunnel_create(struct net *net,
329c5441932SPravin B Shelar 					  struct ip_tunnel_net *itn,
330c5441932SPravin B Shelar 					  struct ip_tunnel_parm *parms)
331c5441932SPravin B Shelar {
3324929fd8cSJulia Lawall 	struct ip_tunnel *nt;
333c5441932SPravin B Shelar 	struct net_device *dev;
334b96f9afeSJarod Wilson 	int t_hlen;
335f6cc9c05SPetr Machata 	int mtu;
336f6cc9c05SPetr Machata 	int err;
337c5441932SPravin B Shelar 
33879134e6cSEric Dumazet 	dev = __ip_tunnel_create(net, itn->rtnl_link_ops, parms);
339c5441932SPravin B Shelar 	if (IS_ERR(dev))
3406dd3c9ecSFlorian Westphal 		return ERR_CAST(dev);
341c5441932SPravin B Shelar 
342f6cc9c05SPetr Machata 	mtu = ip_tunnel_bind_dev(dev);
343f6cc9c05SPetr Machata 	err = dev_set_mtu(dev, mtu);
344f6cc9c05SPetr Machata 	if (err)
345f6cc9c05SPetr Machata 		goto err_dev_set_mtu;
346c5441932SPravin B Shelar 
347c5441932SPravin B Shelar 	nt = netdev_priv(dev);
348b96f9afeSJarod Wilson 	t_hlen = nt->hlen + sizeof(struct iphdr);
349b96f9afeSJarod Wilson 	dev->min_mtu = ETH_MIN_MTU;
35028e104d0SVadim Fedorenko 	dev->max_mtu = IP_MAX_MTU - t_hlen;
3519992a078SHangbin Liu 	if (dev->type == ARPHRD_ETHER)
3529992a078SHangbin Liu 		dev->max_mtu -= dev->hard_header_len;
3539992a078SHangbin Liu 
354c5441932SPravin B Shelar 	ip_tunnel_add(itn, nt);
355c5441932SPravin B Shelar 	return nt;
356f6cc9c05SPetr Machata 
357f6cc9c05SPetr Machata err_dev_set_mtu:
358f6cc9c05SPetr Machata 	unregister_netdevice(dev);
359f6cc9c05SPetr Machata 	return ERR_PTR(err);
360c5441932SPravin B Shelar }
361c5441932SPravin B Shelar 
ip_tunnel_md_udp_encap(struct sk_buff * skb,struct ip_tunnel_info * info)362ac931d4cSChristian Ehrig void ip_tunnel_md_udp_encap(struct sk_buff *skb, struct ip_tunnel_info *info)
363ac931d4cSChristian Ehrig {
364ac931d4cSChristian Ehrig 	const struct iphdr *iph = ip_hdr(skb);
365ac931d4cSChristian Ehrig 	const struct udphdr *udph;
366ac931d4cSChristian Ehrig 
367ac931d4cSChristian Ehrig 	if (iph->protocol != IPPROTO_UDP)
368ac931d4cSChristian Ehrig 		return;
369ac931d4cSChristian Ehrig 
370ac931d4cSChristian Ehrig 	udph = (struct udphdr *)((__u8 *)iph + (iph->ihl << 2));
371ac931d4cSChristian Ehrig 	info->encap.sport = udph->source;
372ac931d4cSChristian Ehrig 	info->encap.dport = udph->dest;
373ac931d4cSChristian Ehrig }
374ac931d4cSChristian Ehrig EXPORT_SYMBOL(ip_tunnel_md_udp_encap);
375ac931d4cSChristian Ehrig 
/* Receive path shared by IP tunnels: validate a decapsulated packet
 * against the tunnel configuration and hand it to the tunnel's GRO cells.
 *
 * @tunnel:        tunnel the packet was matched to
 * @skb:           the packet; consumed on every path
 * @tpi:           flags and sequence number parsed from the tunnel header
 * @tun_dst:       optional metadata dst; attached to @skb on success and
 *                 released on drop
 * @log_ecn_error: whether to log ECN decapsulation problems
 *
 * A packet is dropped, with the matching device error counters bumped,
 * when its checksum flag disagrees with the tunnel's, when sequencing is
 * required and the number is missing or behind, when the inner header
 * cannot be pulled, or when ECN decapsulation reports a value above 1.
 * Always returns 0.
 */
int ip_tunnel_rcv(struct ip_tunnel *tunnel, struct sk_buff *skb,
		  const struct tnl_ptk_info *tpi, struct metadata_dst *tun_dst,
		  bool log_ecn_error)
{
	const struct iphdr *iph = ip_hdr(skb);
	int outer_off;
	int inner_off;
	int err;

#ifdef CONFIG_NET_IPGRE_BROADCAST
	if (ipv4_is_multicast(iph->daddr)) {
		DEV_STATS_INC(tunnel->dev, multicast);
		skb->pkt_type = PACKET_BROADCAST;
	}
#endif

	/* Checksum presence must be the same on the packet and the tunnel. */
	if (!(tpi->flags & TUNNEL_CSUM) !=
	    !(tunnel->parms.i_flags & TUNNEL_CSUM)) {
		DEV_STATS_INC(tunnel->dev, rx_crc_errors);
		DEV_STATS_INC(tunnel->dev, rx_errors);
		goto drop;
	}

	if (tunnel->parms.i_flags & TUNNEL_SEQ) {
		u32 seq = ntohl(tpi->seq);

		if (!(tpi->flags & TUNNEL_SEQ) ||
		    (tunnel->i_seqno && (s32)(seq - tunnel->i_seqno) < 0)) {
			DEV_STATS_INC(tunnel->dev, rx_fifo_errors);
			DEV_STATS_INC(tunnel->dev, rx_errors);
			goto drop;
		}
		tunnel->i_seqno = seq + 1;
	}

	/* Remember where the outer header sits relative to skb->head: the
	 * network header is about to be pointed at the inner header, and
	 * skb->head may change during the pull below.
	 */
	outer_off = skb_network_header(skb) - skb->head;

	if (tunnel->dev->type == ARPHRD_ETHER)
		inner_off = ETH_HLEN;
	else
		inner_off = 0;
	skb_set_network_header(skb, inner_off);

	if (!pskb_inet_may_pull(skb)) {
		DEV_STATS_INC(tunnel->dev, rx_length_errors);
		DEV_STATS_INC(tunnel->dev, rx_errors);
		goto drop;
	}
	/* Recompute the outer header pointer from the saved offset. */
	iph = (struct iphdr *)(skb->head + outer_off);

	err = IP_ECN_decapsulate(iph, skb);
	if (unlikely(err)) {
		if (log_ecn_error)
			net_info_ratelimited("non-ECT from %pI4 with TOS=%#x\n",
					&iph->saddr, iph->tos);
		if (err > 1) {
			DEV_STATS_INC(tunnel->dev, rx_frame_errors);
			DEV_STATS_INC(tunnel->dev, rx_errors);
			goto drop;
		}
	}

	dev_sw_netstats_rx_add(tunnel->dev, skb->len);
	skb_scrub_packet(skb, !net_eq(tunnel->net, dev_net(tunnel->dev)));

	if (tunnel->dev->type != ARPHRD_ETHER) {
		skb->dev = tunnel->dev;
	} else {
		skb->protocol = eth_type_trans(skb, tunnel->dev);
		skb_postpull_rcsum(skb, eth_hdr(skb), ETH_HLEN);
	}

	if (tun_dst)
		skb_dst_set(skb, (struct dst_entry *)tun_dst);

	gro_cells_receive(&tunnel->gro_cells, skb);
	return 0;

drop:
	if (tun_dst)
		dst_release((struct dst_entry *)tun_dst);
	kfree_skb(skb);
	return 0;
}
EXPORT_SYMBOL_GPL(ip_tunnel_rcv);
457c5441932SPravin B Shelar 
ip_tunnel_encap_add_ops(const struct ip_tunnel_encap_ops * ops,unsigned int num)458a8c5f90fSTom Herbert int ip_tunnel_encap_add_ops(const struct ip_tunnel_encap_ops *ops,
459a8c5f90fSTom Herbert 			    unsigned int num)
460a8c5f90fSTom Herbert {
461bb1553c8SThomas Graf 	if (num >= MAX_IPTUN_ENCAP_OPS)
462bb1553c8SThomas Graf 		return -ERANGE;
463bb1553c8SThomas Graf 
464a8c5f90fSTom Herbert 	return !cmpxchg((const struct ip_tunnel_encap_ops **)
465a8c5f90fSTom Herbert 			&iptun_encaps[num],
466a8c5f90fSTom Herbert 			NULL, ops) ? 0 : -1;
46756328486STom Herbert }
468a8c5f90fSTom Herbert EXPORT_SYMBOL(ip_tunnel_encap_add_ops);
469a8c5f90fSTom Herbert 
ip_tunnel_encap_del_ops(const struct ip_tunnel_encap_ops * ops,unsigned int num)470a8c5f90fSTom Herbert int ip_tunnel_encap_del_ops(const struct ip_tunnel_encap_ops *ops,
471a8c5f90fSTom Herbert 			    unsigned int num)
472a8c5f90fSTom Herbert {
473a8c5f90fSTom Herbert 	int ret;
474a8c5f90fSTom Herbert 
475bb1553c8SThomas Graf 	if (num >= MAX_IPTUN_ENCAP_OPS)
476bb1553c8SThomas Graf 		return -ERANGE;
477bb1553c8SThomas Graf 
478a8c5f90fSTom Herbert 	ret = (cmpxchg((const struct ip_tunnel_encap_ops **)
479a8c5f90fSTom Herbert 		       &iptun_encaps[num],
480a8c5f90fSTom Herbert 		       ops, NULL) == ops) ? 0 : -1;
481a8c5f90fSTom Herbert 
482a8c5f90fSTom Herbert 	synchronize_net();
483a8c5f90fSTom Herbert 
484a8c5f90fSTom Herbert 	return ret;
485a8c5f90fSTom Herbert }
486a8c5f90fSTom Herbert EXPORT_SYMBOL(ip_tunnel_encap_del_ops);
48756328486STom Herbert 
ip_tunnel_encap_setup(struct ip_tunnel * t,struct ip_tunnel_encap * ipencap)48856328486STom Herbert int ip_tunnel_encap_setup(struct ip_tunnel *t,
48956328486STom Herbert 			  struct ip_tunnel_encap *ipencap)
49056328486STom Herbert {
49156328486STom Herbert 	int hlen;
49256328486STom Herbert 
49356328486STom Herbert 	memset(&t->encap, 0, sizeof(t->encap));
49456328486STom Herbert 
49556328486STom Herbert 	hlen = ip_encap_hlen(ipencap);
49656328486STom Herbert 	if (hlen < 0)
49756328486STom Herbert 		return hlen;
49856328486STom Herbert 
49956328486STom Herbert 	t->encap.type = ipencap->type;
50056328486STom Herbert 	t->encap.sport = ipencap->sport;
50156328486STom Herbert 	t->encap.dport = ipencap->dport;
50256328486STom Herbert 	t->encap.flags = ipencap->flags;
50356328486STom Herbert 
50456328486STom Herbert 	t->encap_hlen = hlen;
50556328486STom Herbert 	t->hlen = t->encap_hlen + t->tun_hlen;
50656328486STom Herbert 
50756328486STom Herbert 	return 0;
50856328486STom Herbert }
50956328486STom Herbert EXPORT_SYMBOL_GPL(ip_tunnel_encap_setup);
51056328486STom Herbert 
tnl_update_pmtu(struct net_device * dev,struct sk_buff * skb,struct rtable * rt,__be16 df,const struct iphdr * inner_iph,int tunnel_hlen,__be32 dst,bool md)51123a3647bSPravin B Shelar static int tnl_update_pmtu(struct net_device *dev, struct sk_buff *skb,
512fc24f2b2STimo Teräs 			    struct rtable *rt, __be16 df,
513c8b34e68Swenxu 			    const struct iphdr *inner_iph,
514c8b34e68Swenxu 			    int tunnel_hlen, __be32 dst, bool md)
51523a3647bSPravin B Shelar {
51623a3647bSPravin B Shelar 	struct ip_tunnel *tunnel = netdev_priv(dev);
517c8b34e68Swenxu 	int pkt_size;
51823a3647bSPravin B Shelar 	int mtu;
51923a3647bSPravin B Shelar 
520c8b34e68Swenxu 	tunnel_hlen = md ? tunnel_hlen : tunnel->hlen;
52128e104d0SVadim Fedorenko 	pkt_size = skb->len - tunnel_hlen;
5229992a078SHangbin Liu 	pkt_size -= dev->type == ARPHRD_ETHER ? dev->hard_header_len : 0;
523c8b34e68Swenxu 
5249992a078SHangbin Liu 	if (df) {
52528e104d0SVadim Fedorenko 		mtu = dst_mtu(&rt->dst) - (sizeof(struct iphdr) + tunnel_hlen);
5269992a078SHangbin Liu 		mtu -= dev->type == ARPHRD_ETHER ? dev->hard_header_len : 0;
5279992a078SHangbin Liu 	} else {
528f4b3ec4eSAlan Maguire 		mtu = skb_valid_dst(skb) ? dst_mtu(skb_dst(skb)) : dev->mtu;
5299992a078SHangbin Liu 	}
53023a3647bSPravin B Shelar 
531f4b3ec4eSAlan Maguire 	if (skb_valid_dst(skb))
5327a1592bcSHangbin Liu 		skb_dst_update_pmtu_no_confirm(skb, mtu);
53323a3647bSPravin B Shelar 
53423a3647bSPravin B Shelar 	if (skb->protocol == htons(ETH_P_IP)) {
53523a3647bSPravin B Shelar 		if (!skb_is_gso(skb) &&
536fc24f2b2STimo Teräs 		    (inner_iph->frag_off & htons(IP_DF)) &&
537fc24f2b2STimo Teräs 		    mtu < pkt_size) {
5384372339eSJason A. Donenfeld 			icmp_ndo_send(skb, ICMP_DEST_UNREACH, ICMP_FRAG_NEEDED, htonl(mtu));
53923a3647bSPravin B Shelar 			return -E2BIG;
54023a3647bSPravin B Shelar 		}
54123a3647bSPravin B Shelar 	}
54223a3647bSPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
54323a3647bSPravin B Shelar 	else if (skb->protocol == htons(ETH_P_IPV6)) {
544f4b3ec4eSAlan Maguire 		struct rt6_info *rt6;
545c8b34e68Swenxu 		__be32 daddr;
546c8b34e68Swenxu 
547797a4c1fSEric Dumazet 		rt6 = skb_valid_dst(skb) ? dst_rt6_info(skb_dst(skb)) :
548f4b3ec4eSAlan Maguire 					   NULL;
549c8b34e68Swenxu 		daddr = md ? dst : tunnel->parms.iph.daddr;
55023a3647bSPravin B Shelar 
55123a3647bSPravin B Shelar 		if (rt6 && mtu < dst_mtu(skb_dst(skb)) &&
55223a3647bSPravin B Shelar 			   mtu >= IPV6_MIN_MTU) {
553c8b34e68Swenxu 			if ((daddr && !ipv4_is_multicast(daddr)) ||
55423a3647bSPravin B Shelar 			    rt6->rt6i_dst.plen == 128) {
55523a3647bSPravin B Shelar 				rt6->rt6i_flags |= RTF_MODIFIED;
55623a3647bSPravin B Shelar 				dst_metric_set(skb_dst(skb), RTAX_MTU, mtu);
55723a3647bSPravin B Shelar 			}
55823a3647bSPravin B Shelar 		}
55923a3647bSPravin B Shelar 
56023a3647bSPravin B Shelar 		if (!skb_is_gso(skb) && mtu >= IPV6_MIN_MTU &&
56123a3647bSPravin B Shelar 					mtu < pkt_size) {
5624372339eSJason A. Donenfeld 			icmpv6_ndo_send(skb, ICMPV6_PKT_TOOBIG, 0, mtu);
56323a3647bSPravin B Shelar 			return -E2BIG;
56423a3647bSPravin B Shelar 		}
56523a3647bSPravin B Shelar 	}
56623a3647bSPravin B Shelar #endif
56723a3647bSPravin B Shelar 	return 0;
56823a3647bSPravin B Shelar }
56923a3647bSPravin B Shelar 
ip_tunnel_adj_headroom(struct net_device * dev,unsigned int headroom)570a0a1db40SFlorian Westphal static void ip_tunnel_adj_headroom(struct net_device *dev, unsigned int headroom)
571a0a1db40SFlorian Westphal {
572a0a1db40SFlorian Westphal 	/* we must cap headroom to some upperlimit, else pskb_expand_head
573a0a1db40SFlorian Westphal 	 * will overflow header offsets in skb_headers_offset_update().
574a0a1db40SFlorian Westphal 	 */
575a0a1db40SFlorian Westphal 	static const unsigned int max_allowed = 512;
576a0a1db40SFlorian Westphal 
577a0a1db40SFlorian Westphal 	if (headroom > max_allowed)
578a0a1db40SFlorian Westphal 		headroom = max_allowed;
579a0a1db40SFlorian Westphal 
580a0a1db40SFlorian Westphal 	if (headroom > READ_ONCE(dev->needed_headroom))
581a0a1db40SFlorian Westphal 		WRITE_ONCE(dev->needed_headroom, headroom);
582a0a1db40SFlorian Westphal }
583a0a1db40SFlorian Westphal 
/*
 * ip_md_tunnel_xmit - transmit @skb using per-packet tunnel metadata.
 * @skb:         packet to encapsulate; consumed on every path
 * @dev:         tunnel device the packet is sent through
 * @proto:       outer IP protocol; may be rewritten by ip_tunnel_encap()
 * @tunnel_hlen: tunnel header length; when 0 it is taken from
 *               ip_encap_hlen() on the metadata's encap settings
 *
 * The outer addresses, tos, ttl and flags come from the tunnel info
 * attached to the skb (skb_tunnel_info()), not from the device parameters.
 * The metadata must be TX-mode and AF_INET, otherwise the packet is dropped.
 * On failure the skb is freed and one of the device counters (tx_errors,
 * tx_dropped, tx_carrier_errors, collisions) is incremented.
 */
ip_md_tunnel_xmit(struct sk_buff * skb,struct net_device * dev,u8 proto,int tunnel_hlen)584c8b34e68Swenxu void ip_md_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
585c8b34e68Swenxu 		       u8 proto, int tunnel_hlen)
586cfc7381bSAlexei Starovoitov {
587cfc7381bSAlexei Starovoitov 	struct ip_tunnel *tunnel = netdev_priv(dev);
588cfc7381bSAlexei Starovoitov 	u32 headroom = sizeof(struct iphdr);
589cfc7381bSAlexei Starovoitov 	struct ip_tunnel_info *tun_info;
590cfc7381bSAlexei Starovoitov 	const struct ip_tunnel_key *key;
591cfc7381bSAlexei Starovoitov 	const struct iphdr *inner_iph;
592f46fe4f8Swenxu 	struct rtable *rt = NULL;
593cfc7381bSAlexei Starovoitov 	struct flowi4 fl4;
594cfc7381bSAlexei Starovoitov 	__be16 df = 0;
595cfc7381bSAlexei Starovoitov 	u8 tos, ttl;
596f46fe4f8Swenxu 	bool use_cache;
597cfc7381bSAlexei Starovoitov 
598cfc7381bSAlexei Starovoitov 	tun_info = skb_tunnel_info(skb);
599cfc7381bSAlexei Starovoitov 	if (unlikely(!tun_info || !(tun_info->mode & IP_TUNNEL_INFO_TX) ||
600cfc7381bSAlexei Starovoitov 		     ip_tunnel_info_af(tun_info) != AF_INET))
601cfc7381bSAlexei Starovoitov 		goto tx_error;
602cfc7381bSAlexei Starovoitov 	key = &tun_info->key;
603cfc7381bSAlexei Starovoitov 	memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
604cfc7381bSAlexei Starovoitov 	inner_iph = (const struct iphdr *)skb_inner_network_header(skb);
605cfc7381bSAlexei Starovoitov 	tos = key->tos;
	/* A key tos of exactly 1 means "inherit": copy the value from the
	 * inner IPv4 or IPv6 header. For any other payload tos stays 1.
	 */
606cfc7381bSAlexei Starovoitov 	if (tos == 1) {
607cfc7381bSAlexei Starovoitov 		if (skb->protocol == htons(ETH_P_IP))
608cfc7381bSAlexei Starovoitov 			tos = inner_iph->tos;
609cfc7381bSAlexei Starovoitov 		else if (skb->protocol == htons(ETH_P_IPV6))
610cfc7381bSAlexei Starovoitov 			tos = ipv6_get_dsfield((const struct ipv6hdr *)inner_iph);
611cfc7381bSAlexei Starovoitov 	}
6126e6b904aSwenxu 	ip_tunnel_init_flow(&fl4, proto, key->u.ipv4.dst, key->u.ipv4.src,
6133b1a7fb7SIdo Schimmel 			    tunnel_id_to_key32(key->tun_id),
61436eff866SXiao Liang 			    tos & INET_DSCP_MASK, tunnel->net, 0, skb->mark,
6153b1a7fb7SIdo Schimmel 			    skb_get_hash(skb), key->flow_flags);
616ac931d4cSChristian Ehrig 
617ac931d4cSChristian Ehrig 	if (!tunnel_hlen)
618ac931d4cSChristian Ehrig 		tunnel_hlen = ip_encap_hlen(&tun_info->encap);
619ac931d4cSChristian Ehrig 
620ac931d4cSChristian Ehrig 	if (ip_tunnel_encap(skb, &tun_info->encap, &proto, &fl4) < 0)
621cfc7381bSAlexei Starovoitov 		goto tx_error;
622f46fe4f8Swenxu 
	/* Try the route cached in the metadata first; on a miss do a full
	 * lookup and, if caching is allowed, remember the result.
	 */
623f46fe4f8Swenxu 	use_cache = ip_tunnel_dst_cache_usable(skb, tun_info);
624f46fe4f8Swenxu 	if (use_cache)
625f46fe4f8Swenxu 		rt = dst_cache_get_ip4(&tun_info->dst_cache, &fl4.saddr);
626f46fe4f8Swenxu 	if (!rt) {
627cfc7381bSAlexei Starovoitov 		rt = ip_route_output_key(tunnel->net, &fl4);
628cfc7381bSAlexei Starovoitov 		if (IS_ERR(rt)) {
629c4794d22SEric Dumazet 			DEV_STATS_INC(dev, tx_carrier_errors);
630cfc7381bSAlexei Starovoitov 			goto tx_error;
631cfc7381bSAlexei Starovoitov 		}
632f46fe4f8Swenxu 		if (use_cache)
633f46fe4f8Swenxu 			dst_cache_set_ip4(&tun_info->dst_cache, &rt->dst,
634f46fe4f8Swenxu 					  fl4.saddr);
635f46fe4f8Swenxu 	}
	/* The route leads back to this same device: drop the packet and
	 * count it as a collision.
	 */
636cfc7381bSAlexei Starovoitov 	if (rt->dst.dev == dev) {
637cfc7381bSAlexei Starovoitov 		ip_rt_put(rt);
638c4794d22SEric Dumazet 		DEV_STATS_INC(dev, collisions);
639cfc7381bSAlexei Starovoitov 		goto tx_error;
640cfc7381bSAlexei Starovoitov 	}
641c8b34e68Swenxu 
642c8b34e68Swenxu 	if (key->tun_flags & TUNNEL_DONT_FRAGMENT)
643c8b34e68Swenxu 		df = htons(IP_DF);
644c8b34e68Swenxu 	if (tnl_update_pmtu(dev, skb, rt, df, inner_iph, tunnel_hlen,
645c8b34e68Swenxu 			    key->u.ipv4.dst, true)) {
646c8b34e68Swenxu 		ip_rt_put(rt);
647c8b34e68Swenxu 		goto tx_error;
648c8b34e68Swenxu 	}
649c8b34e68Swenxu 
650cfc7381bSAlexei Starovoitov 	tos = ip_tunnel_ecn_encap(tos, inner_iph, skb);
651cfc7381bSAlexei Starovoitov 	ttl = key->ttl;
	/* A key ttl of 0 means "inherit": use the inner header's ttl or
	 * hop limit, or the route's hop limit for non-IP payloads.
	 */
652cfc7381bSAlexei Starovoitov 	if (ttl == 0) {
653cfc7381bSAlexei Starovoitov 		if (skb->protocol == htons(ETH_P_IP))
654cfc7381bSAlexei Starovoitov 			ttl = inner_iph->ttl;
655cfc7381bSAlexei Starovoitov 		else if (skb->protocol == htons(ETH_P_IPV6))
656cfc7381bSAlexei Starovoitov 			ttl = ((const struct ipv6hdr *)inner_iph)->hop_limit;
657cfc7381bSAlexei Starovoitov 		else
658cfc7381bSAlexei Starovoitov 			ttl = ip4_dst_hoplimit(&rt->dst);
659cfc7381bSAlexei Starovoitov 	}
660c8b34e68Swenxu 
	/* Required headroom: outer IP header (initial value of headroom)
	 * plus the output device's link-layer reserve and the dst header_len.
	 */
661cfc7381bSAlexei Starovoitov 	headroom += LL_RESERVED_SPACE(rt->dst.dev) + rt->dst.header_len;
662a0a1db40SFlorian Westphal 	if (skb_cow_head(skb, headroom)) {
663cfc7381bSAlexei Starovoitov 		ip_rt_put(rt);
664cfc7381bSAlexei Starovoitov 		goto tx_dropped;
665cfc7381bSAlexei Starovoitov 	}
666a0a1db40SFlorian Westphal 
667a0a1db40SFlorian Westphal 	ip_tunnel_adj_headroom(dev, headroom);
668a0a1db40SFlorian Westphal 
6690f693f19SHaishuang Yan 	iptunnel_xmit(NULL, rt, skb, fl4.saddr, fl4.daddr, proto, tos, ttl,
6700f693f19SHaishuang Yan 		      df, !net_eq(tunnel->net, dev_net(dev)));
671cfc7381bSAlexei Starovoitov 	return;
	/* Error exits: both labels end up freeing the skb; they differ only
	 * in which device counter is incremented.
	 */
672cfc7381bSAlexei Starovoitov tx_error:
673c4794d22SEric Dumazet 	DEV_STATS_INC(dev, tx_errors);
674cfc7381bSAlexei Starovoitov 	goto kfree;
675cfc7381bSAlexei Starovoitov tx_dropped:
676c4794d22SEric Dumazet 	DEV_STATS_INC(dev, tx_dropped);
677cfc7381bSAlexei Starovoitov kfree:
678cfc7381bSAlexei Starovoitov 	kfree_skb(skb);
679cfc7381bSAlexei Starovoitov }
680cfc7381bSAlexei Starovoitov EXPORT_SYMBOL_GPL(ip_md_tunnel_xmit);
681cfc7381bSAlexei Starovoitov 
/*
 * ip_tunnel_xmit - encapsulate and transmit @skb through tunnel device @dev.
 * @skb:        packet to send; consumed on every path
 * @dev:        tunnel device
 * @tnl_params: outer IPv4 header template; daddr, saddr, tos, ttl and
 *              frag_off are read from it
 * @protocol:   outer IP protocol; may be rewritten by ip_tunnel_encap()
 *
 * When the template has no destination (daddr == 0) the destination is
 * chosen per packet, see the NBMA branch below. A route is taken from a
 * dst cache when the tunnel is "connected", otherwise looked up. On failure
 * the skb is freed and a device error counter is incremented.
 */
ip_tunnel_xmit(struct sk_buff * skb,struct net_device * dev,const struct iphdr * tnl_params,u8 protocol)682c5441932SPravin B Shelar void ip_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
68356328486STom Herbert 		    const struct iphdr *tnl_params, u8 protocol)
684c5441932SPravin B Shelar {
685c5441932SPravin B Shelar 	struct ip_tunnel *tunnel = netdev_priv(dev);
686186d9366Swenxu 	struct ip_tunnel_info *tun_info = NULL;
687c5441932SPravin B Shelar 	const struct iphdr *inner_iph;
688c5441932SPravin B Shelar 	unsigned int max_headroom;	/* The extra header space needed */
689186d9366Swenxu 	struct rtable *rt = NULL;		/* Route to the other host */
6907ae29fd1SMatthias May 	__be16 payload_protocol;
691186d9366Swenxu 	bool use_cache = false;
692186d9366Swenxu 	struct flowi4 fl4;
693186d9366Swenxu 	bool md = false;
69422fb22eaSTimo Teräs 	bool connected;
695186d9366Swenxu 	u8 tos, ttl;
696186d9366Swenxu 	__be32 dst;
697186d9366Swenxu 	__be16 df;
698c5441932SPravin B Shelar 
699c5441932SPravin B Shelar 	inner_iph = (const struct iphdr *)skb_inner_network_header(skb);
	/* "connected" starts out true when the tunnel has a fixed remote
	 * address; it gates use of the dst caches further down.
	 */
70022fb22eaSTimo Teräs 	connected = (tunnel->parms.iph.daddr != 0);
7017ae29fd1SMatthias May 	payload_protocol = skb_protocol(skb, true);
702c5441932SPravin B Shelar 
7035146d1f1SBernie Harris 	memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
7045146d1f1SBernie Harris 
705c5441932SPravin B Shelar 	dst = tnl_params->daddr;
	/* No destination in the template: derive it from, in order of
	 * preference, TX tunnel metadata on the skb, the IPv4 route's next
	 * hop, or an IPv4-compatible IPv6 neighbour/destination address.
	 */
706c5441932SPravin B Shelar 	if (dst == 0) {
707c5441932SPravin B Shelar 		/* NBMA tunnel */
708c5441932SPravin B Shelar 
70951456b29SIan Morris 		if (!skb_dst(skb)) {
710c4794d22SEric Dumazet 			DEV_STATS_INC(dev, tx_fifo_errors);
711c5441932SPravin B Shelar 			goto tx_error;
712c5441932SPravin B Shelar 		}
713c5441932SPravin B Shelar 
714d71b5753Swenxu 		tun_info = skb_tunnel_info(skb);
715d71b5753Swenxu 		if (tun_info && (tun_info->mode & IP_TUNNEL_INFO_TX) &&
716d71b5753Swenxu 		    ip_tunnel_info_af(tun_info) == AF_INET &&
717186d9366Swenxu 		    tun_info->key.u.ipv4.dst) {
718d71b5753Swenxu 			dst = tun_info->key.u.ipv4.dst;
719186d9366Swenxu 			md = true;
720186d9366Swenxu 			connected = true;
7217ae29fd1SMatthias May 		} else if (payload_protocol == htons(ETH_P_IP)) {
722c5441932SPravin B Shelar 			rt = skb_rtable(skb);
723c5441932SPravin B Shelar 			dst = rt_nexthop(rt, inner_iph->daddr);
724c5441932SPravin B Shelar 		}
725c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
7267ae29fd1SMatthias May 		else if (payload_protocol == htons(ETH_P_IPV6)) {
727c5441932SPravin B Shelar 			const struct in6_addr *addr6;
728c5441932SPravin B Shelar 			struct neighbour *neigh;
729c5441932SPravin B Shelar 			bool do_tx_error_icmp;
730c5441932SPravin B Shelar 			int addr_type;
731c5441932SPravin B Shelar 
732c5441932SPravin B Shelar 			neigh = dst_neigh_lookup(skb_dst(skb),
733c5441932SPravin B Shelar 						 &ipv6_hdr(skb)->daddr);
73451456b29SIan Morris 			if (!neigh)
735c5441932SPravin B Shelar 				goto tx_error;
736c5441932SPravin B Shelar 
737c5441932SPravin B Shelar 			addr6 = (const struct in6_addr *)&neigh->primary_key;
738c5441932SPravin B Shelar 			addr_type = ipv6_addr_type(addr6);
739c5441932SPravin B Shelar 
			/* Unspecified neighbour key: fall back to the
			 * packet's own IPv6 destination address.
			 */
740c5441932SPravin B Shelar 			if (addr_type == IPV6_ADDR_ANY) {
741c5441932SPravin B Shelar 				addr6 = &ipv6_hdr(skb)->daddr;
742c5441932SPravin B Shelar 				addr_type = ipv6_addr_type(addr6);
743c5441932SPravin B Shelar 			}
744c5441932SPravin B Shelar 
			/* Only an IPv4-compatible address yields a usable
			 * IPv4 destination (its last 32 bits). The decision
			 * is latched in a flag so the neighbour reference is
			 * released before jumping to the error path.
			 */
745c5441932SPravin B Shelar 			if ((addr_type & IPV6_ADDR_COMPATv4) == 0)
746c5441932SPravin B Shelar 				do_tx_error_icmp = true;
747c5441932SPravin B Shelar 			else {
748c5441932SPravin B Shelar 				do_tx_error_icmp = false;
749c5441932SPravin B Shelar 				dst = addr6->s6_addr32[3];
750c5441932SPravin B Shelar 			}
751c5441932SPravin B Shelar 			neigh_release(neigh);
752c5441932SPravin B Shelar 			if (do_tx_error_icmp)
753c5441932SPravin B Shelar 				goto tx_error_icmp;
754c5441932SPravin B Shelar 		}
755c5441932SPravin B Shelar #endif
756c5441932SPravin B Shelar 		else
757c5441932SPravin B Shelar 			goto tx_error;
7587d442fabSTom Herbert 
		/* A per-packet destination that did not come from metadata
		 * must not use a dst cache.
		 */
759186d9366Swenxu 		if (!md)
7607d442fabSTom Herbert 			connected = false;
761c5441932SPravin B Shelar 	}
762c5441932SPravin B Shelar 
763c5441932SPravin B Shelar 	tos = tnl_params->tos;
	/* Low bit set in the template tos means "inherit from the inner
	 * header". The value then varies per packet, so caching is disabled
	 * for IPv4/IPv6 payloads.
	 */
764c5441932SPravin B Shelar 	if (tos & 0x1) {
765c5441932SPravin B Shelar 		tos &= ~0x1;
7667ae29fd1SMatthias May 		if (payload_protocol == htons(ETH_P_IP)) {
767c5441932SPravin B Shelar 			tos = inner_iph->tos;
7687d442fabSTom Herbert 			connected = false;
7697ae29fd1SMatthias May 		} else if (payload_protocol == htons(ETH_P_IPV6)) {
770c5441932SPravin B Shelar 			tos = ipv6_get_dsfield((const struct ipv6hdr *)inner_iph);
7717d442fabSTom Herbert 			connected = false;
7727d442fabSTom Herbert 		}
773c5441932SPravin B Shelar 	}
774c5441932SPravin B Shelar 
775b0066da5SPetr Machata 	ip_tunnel_init_flow(&fl4, protocol, dst, tnl_params->saddr,
7767e9aa1a0SIdo Schimmel 			    tunnel->parms.o_key, tos & INET_DSCP_MASK,
77736eff866SXiao Liang 			    tunnel->net, READ_ONCE(tunnel->parms.link),
7787ec9fce4SEyal Birger 			    tunnel->fwmark, skb_get_hash(skb), 0);
7797d442fabSTom Herbert 
780ac931d4cSChristian Ehrig 	if (ip_tunnel_encap(skb, &tunnel->encap, &protocol, &fl4) < 0)
78156328486STom Herbert 		goto tx_error;
78256328486STom Herbert 
	/* Route selection: metadata packets use the cache embedded in the
	 * tunnel info (when usable); other connected packets use the
	 * per-tunnel cache; everything else starts with no route. This also
	 * discards the skb route borrowed in the NBMA IPv4 branch, because
	 * connected is false there.
	 */
783186d9366Swenxu 	if (connected && md) {
784186d9366Swenxu 		use_cache = ip_tunnel_dst_cache_usable(skb, tun_info);
785186d9366Swenxu 		if (use_cache)
786186d9366Swenxu 			rt = dst_cache_get_ip4(&tun_info->dst_cache,
787186d9366Swenxu 					       &fl4.saddr);
788186d9366Swenxu 	} else {
789186d9366Swenxu 		rt = connected ? dst_cache_get_ip4(&tunnel->dst_cache,
790186d9366Swenxu 						&fl4.saddr) : NULL;
791186d9366Swenxu 	}
7927d442fabSTom Herbert 
7937d442fabSTom Herbert 	if (!rt) {
7947d442fabSTom Herbert 		rt = ip_route_output_key(tunnel->net, &fl4);
7957d442fabSTom Herbert 
796c5441932SPravin B Shelar 		if (IS_ERR(rt)) {
797c4794d22SEric Dumazet 			DEV_STATS_INC(dev, tx_carrier_errors);
798c5441932SPravin B Shelar 			goto tx_error;
799c5441932SPravin B Shelar 		}
		/* Store the fresh route in whichever cache was consulted. */
800186d9366Swenxu 		if (use_cache)
801186d9366Swenxu 			dst_cache_set_ip4(&tun_info->dst_cache, &rt->dst,
802186d9366Swenxu 					  fl4.saddr);
803186d9366Swenxu 		else if (!md && connected)
804e09acddfSPaolo Abeni 			dst_cache_set_ip4(&tunnel->dst_cache, &rt->dst,
805e09acddfSPaolo Abeni 					  fl4.saddr);
8067d442fabSTom Herbert 	}
8077d442fabSTom Herbert 
	/* The route leads back to this same device: drop and count a
	 * collision.
	 */
8080e6fbc5bSPravin B Shelar 	if (rt->dst.dev == dev) {
809c5441932SPravin B Shelar 		ip_rt_put(rt);
810c4794d22SEric Dumazet 		DEV_STATS_INC(dev, collisions);
811c5441932SPravin B Shelar 		goto tx_error;
812c5441932SPravin B Shelar 	}
813c5441932SPravin B Shelar 
	/* Outer DF: the template's frag_off, plus the inner IPv4 DF bit
	 * unless the tunnel is configured to ignore it.
	 */
81450c66167SFlorian Westphal 	df = tnl_params->frag_off;
8157ae29fd1SMatthias May 	if (payload_protocol == htons(ETH_P_IP) && !tunnel->ignore_df)
81650c66167SFlorian Westphal 		df |= (inner_iph->frag_off & htons(IP_DF));
81750c66167SFlorian Westphal 
81850c66167SFlorian Westphal 	if (tnl_update_pmtu(dev, skb, rt, df, inner_iph, 0, 0, false)) {
819c5441932SPravin B Shelar 		ip_rt_put(rt);
820c5441932SPravin B Shelar 		goto tx_error;
821c5441932SPravin B Shelar 	}
822c5441932SPravin B Shelar 
	/* While errors are pending and still within IPTUNNEL_ERR_TIMEO of
	 * err_time, consume one and signal a link failure for this skb;
	 * once the window has passed, reset the counter.
	 */
823c5441932SPravin B Shelar 	if (tunnel->err_count > 0) {
824c5441932SPravin B Shelar 		if (time_before(jiffies,
825c5441932SPravin B Shelar 				tunnel->err_time + IPTUNNEL_ERR_TIMEO)) {
826c5441932SPravin B Shelar 			tunnel->err_count--;
827c5441932SPravin B Shelar 
828c5441932SPravin B Shelar 			dst_link_failure(skb);
829c5441932SPravin B Shelar 		} else
830c5441932SPravin B Shelar 			tunnel->err_count = 0;
831c5441932SPravin B Shelar 	}
832c5441932SPravin B Shelar 
833d4a71b15SPravin B Shelar 	tos = ip_tunnel_ecn_encap(tos, inner_iph, skb);
834c5441932SPravin B Shelar 	ttl = tnl_params->ttl;
	/* A template ttl of 0 means "inherit" from the inner header, or use
	 * the route's hop limit for other payloads.
	 */
835c5441932SPravin B Shelar 	if (ttl == 0) {
8367ae29fd1SMatthias May 		if (payload_protocol == htons(ETH_P_IP))
837c5441932SPravin B Shelar 			ttl = inner_iph->ttl;
838c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
8397ae29fd1SMatthias May 		else if (payload_protocol == htons(ETH_P_IPV6))
840c5441932SPravin B Shelar 			ttl = ((const struct ipv6hdr *)inner_iph)->hop_limit;
841c5441932SPravin B Shelar #endif
842c5441932SPravin B Shelar 		else
843c5441932SPravin B Shelar 			ttl = ip4_dst_hoplimit(&rt->dst);
844c5441932SPravin B Shelar 	}
845c5441932SPravin B Shelar 
8460e6fbc5bSPravin B Shelar 	max_headroom = LL_RESERVED_SPACE(rt->dst.dev) + sizeof(struct iphdr)
8477371e022STom Herbert 			+ rt->dst.header_len + ip_encap_hlen(&tunnel->encap);
8483e08f4a7SSteffen Klassert 
	/* This failure path counts tx_dropped (not tx_errors) and returns
	 * directly instead of going through the tx_error label.
	 */
849a0a1db40SFlorian Westphal 	if (skb_cow_head(skb, max_headroom)) {
850586d5fc8SDmitry Popov 		ip_rt_put(rt);
851c4794d22SEric Dumazet 		DEV_STATS_INC(dev, tx_dropped);
8523acfa1e7SEric Dumazet 		kfree_skb(skb);
853c5441932SPravin B Shelar 		return;
854c5441932SPravin B Shelar 	}
855c5441932SPravin B Shelar 
856a0a1db40SFlorian Westphal 	ip_tunnel_adj_headroom(dev, max_headroom);
857a0a1db40SFlorian Westphal 
858039f5062SPravin B Shelar 	iptunnel_xmit(NULL, rt, skb, fl4.saddr, fl4.daddr, protocol, tos, ttl,
859039f5062SPravin B Shelar 		      df, !net_eq(tunnel->net, dev_net(dev)));
860c5441932SPravin B Shelar 	return;
861c5441932SPravin B Shelar 
862c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
863c5441932SPravin B Shelar tx_error_icmp:
864c5441932SPravin B Shelar 	dst_link_failure(skb);
865c5441932SPravin B Shelar #endif
866c5441932SPravin B Shelar tx_error:
867c4794d22SEric Dumazet 	DEV_STATS_INC(dev, tx_errors);
8683acfa1e7SEric Dumazet 	kfree_skb(skb);
869c5441932SPravin B Shelar }
870c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_xmit);
871c5441932SPravin B Shelar 
/*
 * Apply the parameters in @p (and @fwmark) to the existing tunnel @t.
 *
 * The tunnel is removed from @itn while its addresses and keys are
 * rewritten and re-added afterwards (presumably because those fields
 * determine where it is hashed - confirm against ip_tunnel_add()).
 * When the underlying link or the fwmark changes, the device is re-bound
 * and, if @set_mtu is true, dev->mtu takes the value returned by
 * ip_tunnel_bind_dev(). The per-tunnel dst cache is always reset and a
 * netdev state change notification is sent.
 */
static void ip_tunnel_update(struct ip_tunnel_net *itn,
			     struct ip_tunnel *t,
			     struct net_device *dev,
			     struct ip_tunnel_parm *p,
			     bool set_mtu,
			     __u32 fwmark)
{
	const struct iphdr *new_iph = &p->iph;
	bool rebind;

	ip_tunnel_del(itn, t);
	t->parms.iph.saddr = new_iph->saddr;
	t->parms.iph.daddr = new_iph->daddr;
	t->parms.i_key = p->i_key;
	t->parms.o_key = p->o_key;
	/* Non-Ethernet tunnels mirror the endpoints in the device addresses. */
	if (dev->type != ARPHRD_ETHER) {
		__dev_addr_set(dev, &new_iph->saddr, 4);
		memcpy(dev->broadcast, &new_iph->daddr, 4);
	}
	ip_tunnel_add(itn, t);

	t->parms.iph.ttl = new_iph->ttl;
	t->parms.iph.tos = new_iph->tos;
	t->parms.iph.frag_off = new_iph->frag_off;

	rebind = t->parms.link != p->link || t->fwmark != fwmark;
	if (rebind) {
		int bound_mtu;

		WRITE_ONCE(t->parms.link, p->link);
		t->fwmark = fwmark;
		bound_mtu = ip_tunnel_bind_dev(dev);
		if (set_mtu)
			dev->mtu = bound_mtu;
	}

	dst_cache_reset(&t->dst_cache);
	netdev_state_change(dev);
}
906c5441932SPravin B Shelar 
ip_tunnel_ctl(struct net_device * dev,struct ip_tunnel_parm * p,int cmd)907607259a6SChristoph Hellwig int ip_tunnel_ctl(struct net_device *dev, struct ip_tunnel_parm *p, int cmd)
908c5441932SPravin B Shelar {
909c5441932SPravin B Shelar 	int err = 0;
9108c923ce2SNicolas Dichtel 	struct ip_tunnel *t = netdev_priv(dev);
9118c923ce2SNicolas Dichtel 	struct net *net = t->net;
9128c923ce2SNicolas Dichtel 	struct ip_tunnel_net *itn = net_generic(net, t->ip_tnl_net_id);
913c5441932SPravin B Shelar 
914c5441932SPravin B Shelar 	switch (cmd) {
915c5441932SPravin B Shelar 	case SIOCGETTUNNEL:
9168c923ce2SNicolas Dichtel 		if (dev == itn->fb_tunnel_dev) {
917c5441932SPravin B Shelar 			t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
91851456b29SIan Morris 			if (!t)
919c5441932SPravin B Shelar 				t = netdev_priv(dev);
9208c923ce2SNicolas Dichtel 		}
921c5441932SPravin B Shelar 		memcpy(p, &t->parms, sizeof(*p));
922c5441932SPravin B Shelar 		break;
923c5441932SPravin B Shelar 
924c5441932SPravin B Shelar 	case SIOCADDTUNNEL:
925c5441932SPravin B Shelar 	case SIOCCHGTUNNEL:
926c5441932SPravin B Shelar 		err = -EPERM;
927c5441932SPravin B Shelar 		if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
928c5441932SPravin B Shelar 			goto done;
929c5441932SPravin B Shelar 		if (p->iph.ttl)
930c5441932SPravin B Shelar 			p->iph.frag_off |= htons(IP_DF);
9317c8e6b9cSDmitry Popov 		if (!(p->i_flags & VTI_ISVTI)) {
932c5441932SPravin B Shelar 			if (!(p->i_flags & TUNNEL_KEY))
933c5441932SPravin B Shelar 				p->i_key = 0;
934c5441932SPravin B Shelar 			if (!(p->o_flags & TUNNEL_KEY))
935c5441932SPravin B Shelar 				p->o_key = 0;
9367c8e6b9cSDmitry Popov 		}
937c5441932SPravin B Shelar 
93879134e6cSEric Dumazet 		t = ip_tunnel_find(itn, p, itn->type);
939c5441932SPravin B Shelar 
940d61746b2SSteffen Klassert 		if (cmd == SIOCADDTUNNEL) {
941d61746b2SSteffen Klassert 			if (!t) {
942c5441932SPravin B Shelar 				t = ip_tunnel_create(net, itn, p);
943ee30ef4dSDuan Jiong 				err = PTR_ERR_OR_ZERO(t);
9446dd3c9ecSFlorian Westphal 				break;
9456dd3c9ecSFlorian Westphal 			}
946d61746b2SSteffen Klassert 
947d61746b2SSteffen Klassert 			err = -EEXIST;
948d61746b2SSteffen Klassert 			break;
949d61746b2SSteffen Klassert 		}
950c5441932SPravin B Shelar 		if (dev != itn->fb_tunnel_dev && cmd == SIOCCHGTUNNEL) {
95100db4124SIan Morris 			if (t) {
952c5441932SPravin B Shelar 				if (t->dev != dev) {
953c5441932SPravin B Shelar 					err = -EEXIST;
954c5441932SPravin B Shelar 					break;
955c5441932SPravin B Shelar 				}
956c5441932SPravin B Shelar 			} else {
957c5441932SPravin B Shelar 				unsigned int nflags = 0;
958c5441932SPravin B Shelar 
959c5441932SPravin B Shelar 				if (ipv4_is_multicast(p->iph.daddr))
960c5441932SPravin B Shelar 					nflags = IFF_BROADCAST;
961c5441932SPravin B Shelar 				else if (p->iph.daddr)
962c5441932SPravin B Shelar 					nflags = IFF_POINTOPOINT;
963c5441932SPravin B Shelar 
964c5441932SPravin B Shelar 				if ((dev->flags^nflags)&(IFF_POINTOPOINT|IFF_BROADCAST)) {
965c5441932SPravin B Shelar 					err = -EINVAL;
966c5441932SPravin B Shelar 					break;
967c5441932SPravin B Shelar 				}
968c5441932SPravin B Shelar 
969c5441932SPravin B Shelar 				t = netdev_priv(dev);
970c5441932SPravin B Shelar 			}
971c5441932SPravin B Shelar 		}
972c5441932SPravin B Shelar 
973c5441932SPravin B Shelar 		if (t) {
974c5441932SPravin B Shelar 			err = 0;
9759830ad4cSCraig Gallek 			ip_tunnel_update(itn, t, dev, p, true, 0);
9766dd3c9ecSFlorian Westphal 		} else {
9776dd3c9ecSFlorian Westphal 			err = -ENOENT;
9786dd3c9ecSFlorian Westphal 		}
979c5441932SPravin B Shelar 		break;
980c5441932SPravin B Shelar 
981c5441932SPravin B Shelar 	case SIOCDELTUNNEL:
982c5441932SPravin B Shelar 		err = -EPERM;
983c5441932SPravin B Shelar 		if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
984c5441932SPravin B Shelar 			goto done;
985c5441932SPravin B Shelar 
986c5441932SPravin B Shelar 		if (dev == itn->fb_tunnel_dev) {
987c5441932SPravin B Shelar 			err = -ENOENT;
988c5441932SPravin B Shelar 			t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
98951456b29SIan Morris 			if (!t)
990c5441932SPravin B Shelar 				goto done;
991c5441932SPravin B Shelar 			err = -EPERM;
992c5441932SPravin B Shelar 			if (t == netdev_priv(itn->fb_tunnel_dev))
993c5441932SPravin B Shelar 				goto done;
994c5441932SPravin B Shelar 			dev = t->dev;
995c5441932SPravin B Shelar 		}
996c5441932SPravin B Shelar 		unregister_netdevice(dev);
997c5441932SPravin B Shelar 		err = 0;
998c5441932SPravin B Shelar 		break;
999c5441932SPravin B Shelar 
1000c5441932SPravin B Shelar 	default:
1001c5441932SPravin B Shelar 		err = -EINVAL;
1002c5441932SPravin B Shelar 	}
1003c5441932SPravin B Shelar 
1004c5441932SPravin B Shelar done:
1005c5441932SPravin B Shelar 	return err;
1006c5441932SPravin B Shelar }
1007607259a6SChristoph Hellwig EXPORT_SYMBOL_GPL(ip_tunnel_ctl);
1008607259a6SChristoph Hellwig 
/*
 * ip_tunnel_siocdevprivate - user-space entry point for tunnel ioctls.
 * @dev:  tunnel device
 * @ifr:  unused here
 * @data: user pointer to a struct ip_tunnel_parm (read, then written back)
 * @cmd:  command forwarded to the device's ndo_tunnel_ctl()
 *
 * Copies the parameters in from user space, runs the device's
 * ndo_tunnel_ctl() handler and, only if that succeeded, copies the
 * (possibly updated) parameters back. Returns -EFAULT on a failed copy,
 * otherwise the handler's return value.
 */
int ip_tunnel_siocdevprivate(struct net_device *dev, struct ifreq *ifr,
			     void __user *data, int cmd)
{
	struct ip_tunnel_parm parm;
	int ret;

	if (copy_from_user(&parm, data, sizeof(parm)))
		return -EFAULT;

	ret = dev->netdev_ops->ndo_tunnel_ctl(dev, &parm, cmd);
	if (ret)
		return ret;

	if (copy_to_user(data, &parm, sizeof(parm)))
		return -EFAULT;

	return 0;
}
EXPORT_SYMBOL_GPL(ip_tunnel_siocdevprivate);
1023c5441932SPravin B Shelar 
/*
 * __ip_tunnel_change_mtu - validate and set a new MTU on a tunnel device.
 * @dev:     tunnel device
 * @new_mtu: requested MTU
 * @strict:  if true, a request above the maximum fails with -EINVAL;
 *           if false, it is silently clamped to the maximum
 *
 * The maximum is IP_MAX_MTU minus the tunnel header length and the outer
 * IPv4 header, and additionally minus dev->hard_header_len for
 * ARPHRD_ETHER devices. Requests below ETH_MIN_MTU are always rejected.
 *
 * Returns 0 on success, -EINVAL otherwise.
 */
int __ip_tunnel_change_mtu(struct net_device *dev, int new_mtu, bool strict)
{
	struct ip_tunnel *tunnel = netdev_priv(dev);
	int t_hlen = tunnel->hlen + sizeof(struct iphdr);
	int max_mtu = IP_MAX_MTU - t_hlen;

	if (dev->type == ARPHRD_ETHER)
		max_mtu -= dev->hard_header_len;

	if (new_mtu < ETH_MIN_MTU)
		return -EINVAL;

	if (new_mtu > max_mtu) {
		if (strict)
			return -EINVAL;

		new_mtu = max_mtu;
	}

	/* Marked store, in line with the READ_ONCE()/WRITE_ONCE() marking
	 * this file already applies to other shared device fields.
	 * NOTE(review): assumes dev->mtu has lockless readers elsewhere that
	 * use READ_ONCE() - confirm.
	 */
	WRITE_ONCE(dev->mtu, new_mtu);
	return 0;
}
EXPORT_SYMBOL_GPL(__ip_tunnel_change_mtu);
10477e059158SDavid Wragg 
ip_tunnel_change_mtu(struct net_device * dev,int new_mtu)10487e059158SDavid Wragg int ip_tunnel_change_mtu(struct net_device *dev, int new_mtu)
10497e059158SDavid Wragg {
10507e059158SDavid Wragg 	return __ip_tunnel_change_mtu(dev, new_mtu, true);
10517e059158SDavid Wragg }
1052c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_change_mtu);
1053c5441932SPravin B Shelar 
ip_tunnel_dev_free(struct net_device * dev)1054c5441932SPravin B Shelar static void ip_tunnel_dev_free(struct net_device *dev)
1055c5441932SPravin B Shelar {
1056c5441932SPravin B Shelar 	struct ip_tunnel *tunnel = netdev_priv(dev);
1057c5441932SPravin B Shelar 
1058c5441932SPravin B Shelar 	gro_cells_destroy(&tunnel->gro_cells);
1059e09acddfSPaolo Abeni 	dst_cache_destroy(&tunnel->dst_cache);
1060c5441932SPravin B Shelar 	free_percpu(dev->tstats);
1061c5441932SPravin B Shelar }
1062c5441932SPravin B Shelar 
ip_tunnel_dellink(struct net_device * dev,struct list_head * head)1063c5441932SPravin B Shelar void ip_tunnel_dellink(struct net_device *dev, struct list_head *head)
1064c5441932SPravin B Shelar {
1065c5441932SPravin B Shelar 	struct ip_tunnel *tunnel = netdev_priv(dev);
1066c5441932SPravin B Shelar 	struct ip_tunnel_net *itn;
1067c5441932SPravin B Shelar 
10686c742e71SNicolas Dichtel 	itn = net_generic(tunnel->net, tunnel->ip_tnl_net_id);
1069c5441932SPravin B Shelar 
1070c5441932SPravin B Shelar 	if (itn->fb_tunnel_dev != dev) {
10712e15ea39SPravin B Shelar 		ip_tunnel_del(itn, netdev_priv(dev));
1072c5441932SPravin B Shelar 		unregister_netdevice_queue(dev, head);
1073c5441932SPravin B Shelar 	}
1074c5441932SPravin B Shelar }
1075c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_dellink);
1076c5441932SPravin B Shelar 
ip_tunnel_get_link_net(const struct net_device * dev)10771728d4faSNicolas Dichtel struct net *ip_tunnel_get_link_net(const struct net_device *dev)
10781728d4faSNicolas Dichtel {
10791728d4faSNicolas Dichtel 	struct ip_tunnel *tunnel = netdev_priv(dev);
10801728d4faSNicolas Dichtel 
10811728d4faSNicolas Dichtel 	return tunnel->net;
10821728d4faSNicolas Dichtel }
10831728d4faSNicolas Dichtel EXPORT_SYMBOL(ip_tunnel_get_link_net);
10841728d4faSNicolas Dichtel 
ip_tunnel_get_iflink(const struct net_device * dev)10851e99584bSNicolas Dichtel int ip_tunnel_get_iflink(const struct net_device *dev)
10861e99584bSNicolas Dichtel {
108777b1e00fSEric Dumazet 	const struct ip_tunnel *tunnel = netdev_priv(dev);
10881e99584bSNicolas Dichtel 
108977b1e00fSEric Dumazet 	return READ_ONCE(tunnel->parms.link);
10901e99584bSNicolas Dichtel }
10911e99584bSNicolas Dichtel EXPORT_SYMBOL(ip_tunnel_get_iflink);
10921e99584bSNicolas Dichtel 
ip_tunnel_init_net(struct net * net,unsigned int ip_tnl_net_id,struct rtnl_link_ops * ops,char * devname)1093c7d03a00SAlexey Dobriyan int ip_tunnel_init_net(struct net *net, unsigned int ip_tnl_net_id,
1094c5441932SPravin B Shelar 				  struct rtnl_link_ops *ops, char *devname)
1095c5441932SPravin B Shelar {
1096c5441932SPravin B Shelar 	struct ip_tunnel_net *itn = net_generic(net, ip_tnl_net_id);
1097c5441932SPravin B Shelar 	struct ip_tunnel_parm parms;
10986261d983Sstephen hemminger 	unsigned int i;
1099c5441932SPravin B Shelar 
110079134e6cSEric Dumazet 	itn->rtnl_link_ops = ops;
11016261d983Sstephen hemminger 	for (i = 0; i < IP_TNL_HASH_SIZE; i++)
11026261d983Sstephen hemminger 		INIT_HLIST_HEAD(&itn->tunnels[i]);
1103c5441932SPravin B Shelar 
110479134e6cSEric Dumazet 	if (!ops || !net_has_fallback_tunnels(net)) {
110579134e6cSEric Dumazet 		struct ip_tunnel_net *it_init_net;
110679134e6cSEric Dumazet 
110779134e6cSEric Dumazet 		it_init_net = net_generic(&init_net, ip_tnl_net_id);
110879134e6cSEric Dumazet 		itn->type = it_init_net->type;
1109c5441932SPravin B Shelar 		itn->fb_tunnel_dev = NULL;
1110c5441932SPravin B Shelar 		return 0;
1111c5441932SPravin B Shelar 	}
11126261d983Sstephen hemminger 
1113c5441932SPravin B Shelar 	memset(&parms, 0, sizeof(parms));
1114c5441932SPravin B Shelar 	if (devname)
1115512b2dc4SXueBing Chen 		strscpy(parms.name, devname, IFNAMSIZ);
1116c5441932SPravin B Shelar 
1117c5441932SPravin B Shelar 	rtnl_lock();
1118c5441932SPravin B Shelar 	itn->fb_tunnel_dev = __ip_tunnel_create(net, ops, &parms);
1119ea857f28SDan Carpenter 	/* FB netdevice is special: we have one, and only one per netns.
1120ea857f28SDan Carpenter 	 * Allowing to move it to another netns is clearly unsafe.
1121ea857f28SDan Carpenter 	 */
112267013282SSteffen Klassert 	if (!IS_ERR(itn->fb_tunnel_dev)) {
1123ea857f28SDan Carpenter 		itn->fb_tunnel_dev->features |= NETIF_F_NETNS_LOCAL;
112478ff4be4SSteffen Klassert 		itn->fb_tunnel_dev->mtu = ip_tunnel_bind_dev(itn->fb_tunnel_dev);
112567013282SSteffen Klassert 		ip_tunnel_add(itn, netdev_priv(itn->fb_tunnel_dev));
112679134e6cSEric Dumazet 		itn->type = itn->fb_tunnel_dev->type;
112767013282SSteffen Klassert 	}
1128b4de77adSDan Carpenter 	rtnl_unlock();
1129c5441932SPravin B Shelar 
113027d79f3bSSachin Kamat 	return PTR_ERR_OR_ZERO(itn->fb_tunnel_dev);
1131c5441932SPravin B Shelar }
1132c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_init_net);
1133c5441932SPravin B Shelar 
ip_tunnel_destroy(struct net * net,struct ip_tunnel_net * itn,struct list_head * head,struct rtnl_link_ops * ops)113479134e6cSEric Dumazet static void ip_tunnel_destroy(struct net *net, struct ip_tunnel_net *itn,
113579134e6cSEric Dumazet 			      struct list_head *head,
11366c742e71SNicolas Dichtel 			      struct rtnl_link_ops *ops)
1137c5441932SPravin B Shelar {
11386c742e71SNicolas Dichtel 	struct net_device *dev, *aux;
1139c5441932SPravin B Shelar 	int h;
1140c5441932SPravin B Shelar 
11416c742e71SNicolas Dichtel 	for_each_netdev_safe(net, dev, aux)
11426c742e71SNicolas Dichtel 		if (dev->rtnl_link_ops == ops)
11436c742e71SNicolas Dichtel 			unregister_netdevice_queue(dev, head);
11446c742e71SNicolas Dichtel 
1145c5441932SPravin B Shelar 	for (h = 0; h < IP_TNL_HASH_SIZE; h++) {
1146c5441932SPravin B Shelar 		struct ip_tunnel *t;
1147c5441932SPravin B Shelar 		struct hlist_node *n;
1148c5441932SPravin B Shelar 		struct hlist_head *thead = &itn->tunnels[h];
1149c5441932SPravin B Shelar 
1150c5441932SPravin B Shelar 		hlist_for_each_entry_safe(t, n, thead, hash_node)
11516c742e71SNicolas Dichtel 			/* If dev is in the same netns, it has already
11526c742e71SNicolas Dichtel 			 * been added to the list by the previous loop.
11536c742e71SNicolas Dichtel 			 */
11546c742e71SNicolas Dichtel 			if (!net_eq(dev_net(t->dev), net))
1155c5441932SPravin B Shelar 				unregister_netdevice_queue(t->dev, head);
1156c5441932SPravin B Shelar 	}
1157c5441932SPravin B Shelar }
1158c5441932SPravin B Shelar 
ip_tunnel_delete_nets(struct list_head * net_list,unsigned int id,struct rtnl_link_ops * ops)115964bc1781SEric Dumazet void ip_tunnel_delete_nets(struct list_head *net_list, unsigned int id,
116064bc1781SEric Dumazet 			   struct rtnl_link_ops *ops)
1161c5441932SPravin B Shelar {
116264bc1781SEric Dumazet 	struct ip_tunnel_net *itn;
116364bc1781SEric Dumazet 	struct net *net;
1164c5441932SPravin B Shelar 	LIST_HEAD(list);
1165c5441932SPravin B Shelar 
1166c5441932SPravin B Shelar 	rtnl_lock();
116764bc1781SEric Dumazet 	list_for_each_entry(net, net_list, exit_list) {
116864bc1781SEric Dumazet 		itn = net_generic(net, id);
116979134e6cSEric Dumazet 		ip_tunnel_destroy(net, itn, &list, ops);
117064bc1781SEric Dumazet 	}
1171c5441932SPravin B Shelar 	unregister_netdevice_many(&list);
1172c5441932SPravin B Shelar 	rtnl_unlock();
1173c5441932SPravin B Shelar }
117464bc1781SEric Dumazet EXPORT_SYMBOL_GPL(ip_tunnel_delete_nets);
1175c5441932SPravin B Shelar 
/*
 * ip_tunnel_newlink - register a new tunnel device created via rtnetlink.
 * @dev:    the not yet registered tunnel device
 * @tb:     netlink attributes (IFLA_ADDRESS and IFLA_MTU are consulted)
 * @p:      tunnel parameters to install
 * @fwmark: firewall mark to store in the tunnel
 *
 * Fails with -EEXIST if a collect_md tunnel already exists in the netns
 * (for collect_md devices) or if a tunnel with the same parameters exists
 * (otherwise). On success the device is registered, bound, given its MTU
 * and added to the per-netns tunnel table. If setting the MTU fails the
 * device is unregistered again.
 *
 * Returns 0 or a negative errno.
 */
int ip_tunnel_newlink(struct net_device *dev, struct nlattr *tb[],
		      struct ip_tunnel_parm *p, __u32 fwmark)
{
	struct net *net = dev_net(dev);
	struct ip_tunnel *nt = netdev_priv(dev);
	struct ip_tunnel_net *itn = net_generic(net, nt->ip_tnl_net_id);
	int mtu;
	int err;

	if (nt->collect_md) {
		if (rtnl_dereference(itn->collect_md_tun))
			return -EEXIST;
	} else if (ip_tunnel_find(itn, p, dev->type)) {
		return -EEXIST;
	}

	nt->net = net;
	nt->parms = *p;
	nt->fwmark = fwmark;

	err = register_netdevice(dev);
	if (err)
		return err;

	/* Ethernet-type tunnels get a random MAC unless one was supplied. */
	if (dev->type == ARPHRD_ETHER && !tb[IFLA_ADDRESS])
		eth_hw_addr_random(dev);

	mtu = ip_tunnel_bind_dev(dev);
	if (tb[IFLA_MTU]) {
		/* A user-supplied MTU overrides the bound value, clamped to
		 * what the encapsulation overhead allows.
		 */
		unsigned int max = IP_MAX_MTU - (nt->hlen + sizeof(struct iphdr));

		if (dev->type == ARPHRD_ETHER)
			max -= dev->hard_header_len;

		mtu = clamp(dev->mtu, (unsigned int)ETH_MIN_MTU, max);
	}

	err = dev_set_mtu(dev, mtu);
	if (err) {
		unregister_netdevice(dev);
		return err;
	}

	ip_tunnel_add(itn, nt);
	return 0;
}
EXPORT_SYMBOL_GPL(ip_tunnel_newlink);
1229c5441932SPravin B Shelar 
/*
 * ip_tunnel_changelink - apply new parameters to an existing tunnel device
 * @dev:    tunnel net_device being modified
 * @tb:     netlink attributes; only the presence of IFLA_MTU is tested here
 * @p:      requested tunnel parameters
 * @fwmark: firewall mark, forwarded to ip_tunnel_update()
 *
 * Returns 0 after calling ip_tunnel_update(), -EINVAL when @dev is the
 * namespace's fallback tunnel device or when the new destination would
 * require different IFF_POINTOPOINT/IFF_BROADCAST flags than @dev has, and
 * -EEXIST when the parameters already belong to another device.
 */
int ip_tunnel_changelink(struct net_device *dev, struct nlattr *tb[],
			 struct ip_tunnel_parm *p, __u32 fwmark)
{
	struct ip_tunnel *tunnel = netdev_priv(dev);
	struct net *net = tunnel->net;
	struct ip_tunnel_net *itn = net_generic(net, tunnel->ip_tnl_net_id);
	struct ip_tunnel *match;

	if (dev == itn->fb_tunnel_dev)
		return -EINVAL;

	match = ip_tunnel_find(itn, p, dev->type);
	if (match && match->dev != dev)
		return -EEXIST;

	if (!match) {
		match = tunnel;

		if (dev->type != ARPHRD_ETHER) {
			unsigned int wanted = 0;

			/* Flags implied by the requested destination address. */
			if (ipv4_is_multicast(p->iph.daddr))
				wanted = IFF_BROADCAST;
			else if (p->iph.daddr)
				wanted = IFF_POINTOPOINT;

			/* Reject a change that would need different flags. */
			if ((dev->flags ^ wanted) &
			    (IFF_POINTOPOINT | IFF_BROADCAST))
				return -EINVAL;
		}
	}

	/* Let ip_tunnel_update() pick the MTU only when none was given. */
	ip_tunnel_update(itn, match, dev, p, !tb[IFLA_MTU], fwmark);
	return 0;
}
EXPORT_SYMBOL_GPL(ip_tunnel_changelink);
1267c5441932SPravin B Shelar 
ip_tunnel_init(struct net_device * dev)1268c5441932SPravin B Shelar int ip_tunnel_init(struct net_device *dev)
1269c5441932SPravin B Shelar {
1270c5441932SPravin B Shelar 	struct ip_tunnel *tunnel = netdev_priv(dev);
1271c5441932SPravin B Shelar 	struct iphdr *iph = &tunnel->parms.iph;
12721c213bd2SWANG Cong 	int err;
1273c5441932SPravin B Shelar 
1274cf124db5SDavid S. Miller 	dev->needs_free_netdev = true;
1275cf124db5SDavid S. Miller 	dev->priv_destructor = ip_tunnel_dev_free;
12761c213bd2SWANG Cong 	dev->tstats = netdev_alloc_pcpu_stats(struct pcpu_sw_netstats);
1277c5441932SPravin B Shelar 	if (!dev->tstats)
1278c5441932SPravin B Shelar 		return -ENOMEM;
1279c5441932SPravin B Shelar 
1280e09acddfSPaolo Abeni 	err = dst_cache_init(&tunnel->dst_cache, GFP_KERNEL);
1281e09acddfSPaolo Abeni 	if (err) {
12829a4aa9afSTom Herbert 		free_percpu(dev->tstats);
1283e09acddfSPaolo Abeni 		return err;
12849a4aa9afSTom Herbert 	}
12859a4aa9afSTom Herbert 
1286c5441932SPravin B Shelar 	err = gro_cells_init(&tunnel->gro_cells, dev);
1287c5441932SPravin B Shelar 	if (err) {
1288e09acddfSPaolo Abeni 		dst_cache_destroy(&tunnel->dst_cache);
1289c5441932SPravin B Shelar 		free_percpu(dev->tstats);
1290c5441932SPravin B Shelar 		return err;
1291c5441932SPravin B Shelar 	}
1292c5441932SPravin B Shelar 
1293c5441932SPravin B Shelar 	tunnel->dev = dev;
12946c742e71SNicolas Dichtel 	tunnel->net = dev_net(dev);
1295c5441932SPravin B Shelar 	strcpy(tunnel->parms.name, dev->name);
1296c5441932SPravin B Shelar 	iph->version		= 4;
1297c5441932SPravin B Shelar 	iph->ihl		= 5;
1298c5441932SPravin B Shelar 
1299d0f41851SWilliam Dauchy 	if (tunnel->collect_md)
13002e15ea39SPravin B Shelar 		netif_keep_dst(dev);
1301a7b862abSEric Dumazet 	netdev_lockdep_set_classes(dev);
1302c5441932SPravin B Shelar 	return 0;
1303c5441932SPravin B Shelar }
1304c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_init);
1305c5441932SPravin B Shelar 
ip_tunnel_uninit(struct net_device * dev)1306c5441932SPravin B Shelar void ip_tunnel_uninit(struct net_device *dev)
1307c5441932SPravin B Shelar {
1308c5441932SPravin B Shelar 	struct ip_tunnel *tunnel = netdev_priv(dev);
13096c742e71SNicolas Dichtel 	struct net *net = tunnel->net;
1310c5441932SPravin B Shelar 	struct ip_tunnel_net *itn;
1311c5441932SPravin B Shelar 
1312c5441932SPravin B Shelar 	itn = net_generic(net, tunnel->ip_tnl_net_id);
13132e15ea39SPravin B Shelar 	ip_tunnel_del(itn, netdev_priv(dev));
1314ba61539cSTaehee Yoo 	if (itn->fb_tunnel_dev == dev)
1315ba61539cSTaehee Yoo 		WRITE_ONCE(itn->fb_tunnel_dev, NULL);
13167d442fabSTom Herbert 
1317e09acddfSPaolo Abeni 	dst_cache_reset(&tunnel->dst_cache);
1318c5441932SPravin B Shelar }
1319c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_uninit);
1320c5441932SPravin B Shelar 
1321c5441932SPravin B Shelar /* Do least required initialization, rest of init is done in tunnel_init call */
ip_tunnel_setup(struct net_device * dev,unsigned int net_id)1322c7d03a00SAlexey Dobriyan void ip_tunnel_setup(struct net_device *dev, unsigned int net_id)
1323c5441932SPravin B Shelar {
1324c5441932SPravin B Shelar 	struct ip_tunnel *tunnel = netdev_priv(dev);
1325c5441932SPravin B Shelar 	tunnel->ip_tnl_net_id = net_id;
1326c5441932SPravin B Shelar }
1327c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_setup);
1328c5441932SPravin B Shelar 
1329c5441932SPravin B Shelar MODULE_LICENSE("GPL");
1330