1c9422999SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only
2c5441932SPravin B Shelar /*
3c5441932SPravin B Shelar * Copyright (c) 2013 Nicira, Inc.
4c5441932SPravin B Shelar */
5c5441932SPravin B Shelar
6c5441932SPravin B Shelar #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
7c5441932SPravin B Shelar
8c5441932SPravin B Shelar #include <linux/capability.h>
9c5441932SPravin B Shelar #include <linux/module.h>
10c5441932SPravin B Shelar #include <linux/types.h>
11c5441932SPravin B Shelar #include <linux/kernel.h>
12c5441932SPravin B Shelar #include <linux/slab.h>
13c5441932SPravin B Shelar #include <linux/uaccess.h>
14c5441932SPravin B Shelar #include <linux/skbuff.h>
15c5441932SPravin B Shelar #include <linux/netdevice.h>
16c5441932SPravin B Shelar #include <linux/in.h>
17c5441932SPravin B Shelar #include <linux/tcp.h>
18c5441932SPravin B Shelar #include <linux/udp.h>
19c5441932SPravin B Shelar #include <linux/if_arp.h>
20c5441932SPravin B Shelar #include <linux/init.h>
21c5441932SPravin B Shelar #include <linux/in6.h>
22c5441932SPravin B Shelar #include <linux/inetdevice.h>
23c5441932SPravin B Shelar #include <linux/igmp.h>
24c5441932SPravin B Shelar #include <linux/netfilter_ipv4.h>
25c5441932SPravin B Shelar #include <linux/etherdevice.h>
26c5441932SPravin B Shelar #include <linux/if_ether.h>
27c5441932SPravin B Shelar #include <linux/if_vlan.h>
28c5441932SPravin B Shelar #include <linux/rculist.h>
2927d79f3bSSachin Kamat #include <linux/err.h>
30c5441932SPravin B Shelar
31c5441932SPravin B Shelar #include <net/sock.h>
32c5441932SPravin B Shelar #include <net/ip.h>
33c5441932SPravin B Shelar #include <net/icmp.h>
34c5441932SPravin B Shelar #include <net/protocol.h>
35c5441932SPravin B Shelar #include <net/ip_tunnels.h>
36c5441932SPravin B Shelar #include <net/arp.h>
37c5441932SPravin B Shelar #include <net/checksum.h>
38c5441932SPravin B Shelar #include <net/dsfield.h>
39c5441932SPravin B Shelar #include <net/inet_ecn.h>
40c5441932SPravin B Shelar #include <net/xfrm.h>
41c5441932SPravin B Shelar #include <net/net_namespace.h>
42c5441932SPravin B Shelar #include <net/netns/generic.h>
43c5441932SPravin B Shelar #include <net/rtnetlink.h>
4456328486STom Herbert #include <net/udp.h>
45cfc7381bSAlexei Starovoitov #include <net/dst_metadata.h>
463b1a7fb7SIdo Schimmel #include <net/inet_dscp.h>
4763487babSTom Herbert
48c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
49c5441932SPravin B Shelar #include <net/ipv6.h>
50c5441932SPravin B Shelar #include <net/ip6_fib.h>
51c5441932SPravin B Shelar #include <net/ip6_route.h>
52c5441932SPravin B Shelar #endif
53c5441932SPravin B Shelar
/* Map a (key, remote address) pair to a bucket index by XOR-ing the two
 * values and hashing the result down to IP_TNL_HASH_BITS bits.
 */
static unsigned int ip_tunnel_hash(__be32 key, __be32 remote)
{
	u32 mixed = (__force u32)key ^ (__force u32)remote;

	return hash_32(mixed, IP_TNL_HASH_BITS);
}
59c5441932SPravin B Shelar
ip_tunnel_key_match(const struct ip_tunnel_parm * p,__be16 flags,__be32 key)60c5441932SPravin B Shelar static bool ip_tunnel_key_match(const struct ip_tunnel_parm *p,
61c5441932SPravin B Shelar __be16 flags, __be32 key)
62c5441932SPravin B Shelar {
63c5441932SPravin B Shelar if (p->i_flags & TUNNEL_KEY) {
64c5441932SPravin B Shelar if (flags & TUNNEL_KEY)
65c5441932SPravin B Shelar return key == p->i_key;
66c5441932SPravin B Shelar else
67c5441932SPravin B Shelar /* key expected, none present */
68c5441932SPravin B Shelar return false;
69c5441932SPravin B Shelar } else
70c5441932SPravin B Shelar return !(flags & TUNNEL_KEY);
71c5441932SPravin B Shelar }
72c5441932SPravin B Shelar
/* Fallback tunnel: no source, no destination, no key, no options

   Tunnel hash table:
   We require an exact key match, i.e. if a key is present in the packet
   it will match only a tunnel with the same key; if it is not present,
   it will match only a keyless tunnel.

   All keyless packets that do not match a configured keyless tunnel
   will match the fallback tunnel.
   Given src, dst and key, find the appropriate tunnel for input.
*/
/* Find the tunnel that should handle a packet.
 *
 * @itn:    per-netns tunnel table to search
 * @link:   link index the tunnel's parms.link is compared with
 * @flags:  tunnel flags from the packet
 * @remote: remote address to match against a tunnel's daddr
 * @local:  local address to match against a tunnel's saddr
 * @key:    key from the packet
 *
 * Four passes are made, from most to least specific.  In every pass a
 * tunnel whose parms.link equals @link is returned immediately; a match
 * with a different link is only remembered and is returned after all
 * passes have finished.  If nothing was remembered, the collect_md tunnel
 * and then the fallback device are returned when they are up.  Returns
 * NULL if no tunnel qualifies.
 *
 * NOTE(review): the lists are walked with the _rcu iterators, so this is
 * presumably called inside an RCU read-side section - confirm at callers.
 */
struct ip_tunnel *ip_tunnel_lookup(struct ip_tunnel_net *itn,
				   int link, __be16 flags,
				   __be32 remote, __be32 local,
				   __be32 key)
{
	struct ip_tunnel *best = NULL;
	struct hlist_head *bucket;
	struct net_device *fb_dev;
	struct ip_tunnel *t;

	bucket = &itn->tunnels[ip_tunnel_hash(key, remote)];

	/* Pass 1: tunnel's local and remote addresses both match. */
	hlist_for_each_entry_rcu(t, bucket, hash_node) {
		if (local != t->parms.iph.saddr)
			continue;
		if (remote != t->parms.iph.daddr)
			continue;
		if (!(t->dev->flags & IFF_UP))
			continue;
		if (!ip_tunnel_key_match(&t->parms, flags, key))
			continue;

		if (READ_ONCE(t->parms.link) == link)
			return t;
		/* unlike later passes, this one overwrites on every match */
		best = t;
	}

	/* Pass 2: remote matches and the tunnel has no local address. */
	hlist_for_each_entry_rcu(t, bucket, hash_node) {
		if (remote != t->parms.iph.daddr)
			continue;
		if (t->parms.iph.saddr != 0)
			continue;
		if (!(t->dev->flags & IFF_UP))
			continue;
		if (!ip_tunnel_key_match(&t->parms, flags, key))
			continue;

		if (READ_ONCE(t->parms.link) == link)
			return t;
		if (!best)
			best = t;
	}

	bucket = &itn->tunnels[ip_tunnel_hash(key, 0)];

	/* Pass 3: local matches a tunnel without remote, or the packet's
	 * multicast destination equals the tunnel's remote.
	 */
	hlist_for_each_entry_rcu(t, bucket, hash_node) {
		if (!(local == t->parms.iph.saddr && t->parms.iph.daddr == 0) &&
		    !(local == t->parms.iph.daddr && ipv4_is_multicast(local)))
			continue;
		if (!(t->dev->flags & IFF_UP))
			continue;
		if (!ip_tunnel_key_match(&t->parms, flags, key))
			continue;

		if (READ_ONCE(t->parms.link) == link)
			return t;
		if (!best)
			best = t;
	}

	/* Pass 4: tunnel has neither address; the key is compared unless
	 * the packet flags carry TUNNEL_NO_KEY.
	 */
	hlist_for_each_entry_rcu(t, bucket, hash_node) {
		if (!(flags & TUNNEL_NO_KEY) && t->parms.i_key != key)
			continue;
		if (t->parms.iph.saddr != 0)
			continue;
		if (t->parms.iph.daddr != 0)
			continue;
		if (!(t->dev->flags & IFF_UP))
			continue;

		if (READ_ONCE(t->parms.link) == link)
			return t;
		if (!best)
			best = t;
	}

	if (best)
		return best;

	t = rcu_dereference(itn->collect_md_tun);
	if (t && t->dev->flags & IFF_UP)
		return t;

	fb_dev = READ_ONCE(itn->fb_tunnel_dev);
	if (fb_dev && fb_dev->flags & IFF_UP)
		return netdev_priv(fb_dev);

	return NULL;
}
EXPORT_SYMBOL_GPL(ip_tunnel_lookup);
173c5441932SPravin B Shelar
ip_bucket(struct ip_tunnel_net * itn,struct ip_tunnel_parm * parms)174c5441932SPravin B Shelar static struct hlist_head *ip_bucket(struct ip_tunnel_net *itn,
175c5441932SPravin B Shelar struct ip_tunnel_parm *parms)
176c5441932SPravin B Shelar {
177c5441932SPravin B Shelar unsigned int h;
178c5441932SPravin B Shelar __be32 remote;
1796d608f06SSteffen Klassert __be32 i_key = parms->i_key;
180c5441932SPravin B Shelar
181c5441932SPravin B Shelar if (parms->iph.daddr && !ipv4_is_multicast(parms->iph.daddr))
182c5441932SPravin B Shelar remote = parms->iph.daddr;
183c5441932SPravin B Shelar else
184c5441932SPravin B Shelar remote = 0;
185c5441932SPravin B Shelar
1866d608f06SSteffen Klassert if (!(parms->i_flags & TUNNEL_KEY) && (parms->i_flags & VTI_ISVTI))
1876d608f06SSteffen Klassert i_key = 0;
1886d608f06SSteffen Klassert
1896d608f06SSteffen Klassert h = ip_tunnel_hash(i_key, remote);
190c5441932SPravin B Shelar return &itn->tunnels[h];
191c5441932SPravin B Shelar }
192c5441932SPravin B Shelar
ip_tunnel_add(struct ip_tunnel_net * itn,struct ip_tunnel * t)193c5441932SPravin B Shelar static void ip_tunnel_add(struct ip_tunnel_net *itn, struct ip_tunnel *t)
194c5441932SPravin B Shelar {
195c5441932SPravin B Shelar struct hlist_head *head = ip_bucket(itn, &t->parms);
196c5441932SPravin B Shelar
1972e15ea39SPravin B Shelar if (t->collect_md)
1982e15ea39SPravin B Shelar rcu_assign_pointer(itn->collect_md_tun, t);
199c5441932SPravin B Shelar hlist_add_head_rcu(&t->hash_node, head);
200c5441932SPravin B Shelar }
201c5441932SPravin B Shelar
ip_tunnel_del(struct ip_tunnel_net * itn,struct ip_tunnel * t)2022e15ea39SPravin B Shelar static void ip_tunnel_del(struct ip_tunnel_net *itn, struct ip_tunnel *t)
203c5441932SPravin B Shelar {
2042e15ea39SPravin B Shelar if (t->collect_md)
2052e15ea39SPravin B Shelar rcu_assign_pointer(itn->collect_md_tun, NULL);
206c5441932SPravin B Shelar hlist_del_init_rcu(&t->hash_node);
207c5441932SPravin B Shelar }
208c5441932SPravin B Shelar
ip_tunnel_find(struct ip_tunnel_net * itn,struct ip_tunnel_parm * parms,int type)209c5441932SPravin B Shelar static struct ip_tunnel *ip_tunnel_find(struct ip_tunnel_net *itn,
210c5441932SPravin B Shelar struct ip_tunnel_parm *parms,
211c5441932SPravin B Shelar int type)
212c5441932SPravin B Shelar {
213c5441932SPravin B Shelar __be32 remote = parms->iph.daddr;
214c5441932SPravin B Shelar __be32 local = parms->iph.saddr;
215c5441932SPravin B Shelar __be32 key = parms->i_key;
2165ce54af1SDmitry Popov __be16 flags = parms->i_flags;
217c5441932SPravin B Shelar int link = parms->link;
218c5441932SPravin B Shelar struct ip_tunnel *t = NULL;
219c5441932SPravin B Shelar struct hlist_head *head = ip_bucket(itn, parms);
220c5441932SPravin B Shelar
221*e0500e43SIdo Schimmel hlist_for_each_entry_rcu(t, head, hash_node, lockdep_rtnl_is_held()) {
222c5441932SPravin B Shelar if (local == t->parms.iph.saddr &&
223c5441932SPravin B Shelar remote == t->parms.iph.daddr &&
22477b1e00fSEric Dumazet link == READ_ONCE(t->parms.link) &&
2255ce54af1SDmitry Popov type == t->dev->type &&
2265ce54af1SDmitry Popov ip_tunnel_key_match(&t->parms, flags, key))
227c5441932SPravin B Shelar break;
228c5441932SPravin B Shelar }
229c5441932SPravin B Shelar return t;
230c5441932SPravin B Shelar }
231c5441932SPravin B Shelar
__ip_tunnel_create(struct net * net,const struct rtnl_link_ops * ops,struct ip_tunnel_parm * parms)232c5441932SPravin B Shelar static struct net_device *__ip_tunnel_create(struct net *net,
233c5441932SPravin B Shelar const struct rtnl_link_ops *ops,
234c5441932SPravin B Shelar struct ip_tunnel_parm *parms)
235c5441932SPravin B Shelar {
236c5441932SPravin B Shelar int err;
237c5441932SPravin B Shelar struct ip_tunnel *tunnel;
238c5441932SPravin B Shelar struct net_device *dev;
239c5441932SPravin B Shelar char name[IFNAMSIZ];
240c5441932SPravin B Shelar
241c5441932SPravin B Shelar err = -E2BIG;
2429cb726a2SEric Dumazet if (parms->name[0]) {
2439cb726a2SEric Dumazet if (!dev_valid_name(parms->name))
244c5441932SPravin B Shelar goto failed;
245512b2dc4SXueBing Chen strscpy(name, parms->name, IFNAMSIZ);
2469cb726a2SEric Dumazet } else {
2479cb726a2SEric Dumazet if (strlen(ops->kind) > (IFNAMSIZ - 3))
2489cb726a2SEric Dumazet goto failed;
249000ade80SSultan Alsawaf strcpy(name, ops->kind);
250000ade80SSultan Alsawaf strcat(name, "%d");
251c5441932SPravin B Shelar }
252c5441932SPravin B Shelar
253c5441932SPravin B Shelar ASSERT_RTNL();
254c835a677STom Gundersen dev = alloc_netdev(ops->priv_size, name, NET_NAME_UNKNOWN, ops->setup);
255c5441932SPravin B Shelar if (!dev) {
256c5441932SPravin B Shelar err = -ENOMEM;
257c5441932SPravin B Shelar goto failed;
258c5441932SPravin B Shelar }
259c5441932SPravin B Shelar dev_net_set(dev, net);
260c5441932SPravin B Shelar
261c5441932SPravin B Shelar dev->rtnl_link_ops = ops;
262c5441932SPravin B Shelar
263c5441932SPravin B Shelar tunnel = netdev_priv(dev);
264c5441932SPravin B Shelar tunnel->parms = *parms;
2655e6700b3SNicolas Dichtel tunnel->net = net;
266c5441932SPravin B Shelar
267c5441932SPravin B Shelar err = register_netdevice(dev);
268c5441932SPravin B Shelar if (err)
269c5441932SPravin B Shelar goto failed_free;
270c5441932SPravin B Shelar
271c5441932SPravin B Shelar return dev;
272c5441932SPravin B Shelar
273c5441932SPravin B Shelar failed_free:
274c5441932SPravin B Shelar free_netdev(dev);
275c5441932SPravin B Shelar failed:
276c5441932SPravin B Shelar return ERR_PTR(err);
277c5441932SPravin B Shelar }
278c5441932SPravin B Shelar
ip_tunnel_bind_dev(struct net_device * dev)279c5441932SPravin B Shelar static int ip_tunnel_bind_dev(struct net_device *dev)
280c5441932SPravin B Shelar {
281c5441932SPravin B Shelar struct net_device *tdev = NULL;
282c5441932SPravin B Shelar struct ip_tunnel *tunnel = netdev_priv(dev);
283c5441932SPravin B Shelar const struct iphdr *iph;
284c5441932SPravin B Shelar int hlen = LL_MAX_HEADER;
285c5441932SPravin B Shelar int mtu = ETH_DATA_LEN;
286c5441932SPravin B Shelar int t_hlen = tunnel->hlen + sizeof(struct iphdr);
287c5441932SPravin B Shelar
288c5441932SPravin B Shelar iph = &tunnel->parms.iph;
289c5441932SPravin B Shelar
290c5441932SPravin B Shelar /* Guess output device to choose reasonable mtu and needed_headroom */
291c5441932SPravin B Shelar if (iph->daddr) {
292c5441932SPravin B Shelar struct flowi4 fl4;
293c5441932SPravin B Shelar struct rtable *rt;
294c5441932SPravin B Shelar
295b0066da5SPetr Machata ip_tunnel_init_flow(&fl4, iph->protocol, iph->daddr,
2967d442fabSTom Herbert iph->saddr, tunnel->parms.o_key,
29736eff866SXiao Liang iph->tos & INET_DSCP_MASK, tunnel->net,
2987ec9fce4SEyal Birger tunnel->parms.link, tunnel->fwmark, 0, 0);
2997d442fabSTom Herbert rt = ip_route_output_key(tunnel->net, &fl4);
3007d442fabSTom Herbert
301c5441932SPravin B Shelar if (!IS_ERR(rt)) {
302c5441932SPravin B Shelar tdev = rt->dst.dev;
303c5441932SPravin B Shelar ip_rt_put(rt);
304c5441932SPravin B Shelar }
305c5441932SPravin B Shelar if (dev->type != ARPHRD_ETHER)
306c5441932SPravin B Shelar dev->flags |= IFF_POINTOPOINT;
307f27337e1SPaolo Abeni
308f27337e1SPaolo Abeni dst_cache_reset(&tunnel->dst_cache);
309c5441932SPravin B Shelar }
310c5441932SPravin B Shelar
311c5441932SPravin B Shelar if (!tdev && tunnel->parms.link)
3126c742e71SNicolas Dichtel tdev = __dev_get_by_index(tunnel->net, tunnel->parms.link);
313c5441932SPravin B Shelar
314c5441932SPravin B Shelar if (tdev) {
315c5441932SPravin B Shelar hlen = tdev->hard_header_len + tdev->needed_headroom;
31682612de1SNicolas Dichtel mtu = min(tdev->mtu, IP_MAX_MTU);
317c5441932SPravin B Shelar }
318c5441932SPravin B Shelar
319c5441932SPravin B Shelar dev->needed_headroom = t_hlen + hlen;
3209992a078SHangbin Liu mtu -= t_hlen + (dev->type == ARPHRD_ETHER ? dev->hard_header_len : 0);
321c5441932SPravin B Shelar
322b5476022SEric Dumazet if (mtu < IPV4_MIN_MTU)
323b5476022SEric Dumazet mtu = IPV4_MIN_MTU;
324c5441932SPravin B Shelar
325c5441932SPravin B Shelar return mtu;
326c5441932SPravin B Shelar }
327c5441932SPravin B Shelar
ip_tunnel_create(struct net * net,struct ip_tunnel_net * itn,struct ip_tunnel_parm * parms)328c5441932SPravin B Shelar static struct ip_tunnel *ip_tunnel_create(struct net *net,
329c5441932SPravin B Shelar struct ip_tunnel_net *itn,
330c5441932SPravin B Shelar struct ip_tunnel_parm *parms)
331c5441932SPravin B Shelar {
3324929fd8cSJulia Lawall struct ip_tunnel *nt;
333c5441932SPravin B Shelar struct net_device *dev;
334b96f9afeSJarod Wilson int t_hlen;
335f6cc9c05SPetr Machata int mtu;
336f6cc9c05SPetr Machata int err;
337c5441932SPravin B Shelar
33879134e6cSEric Dumazet dev = __ip_tunnel_create(net, itn->rtnl_link_ops, parms);
339c5441932SPravin B Shelar if (IS_ERR(dev))
3406dd3c9ecSFlorian Westphal return ERR_CAST(dev);
341c5441932SPravin B Shelar
342f6cc9c05SPetr Machata mtu = ip_tunnel_bind_dev(dev);
343f6cc9c05SPetr Machata err = dev_set_mtu(dev, mtu);
344f6cc9c05SPetr Machata if (err)
345f6cc9c05SPetr Machata goto err_dev_set_mtu;
346c5441932SPravin B Shelar
347c5441932SPravin B Shelar nt = netdev_priv(dev);
348b96f9afeSJarod Wilson t_hlen = nt->hlen + sizeof(struct iphdr);
349b96f9afeSJarod Wilson dev->min_mtu = ETH_MIN_MTU;
35028e104d0SVadim Fedorenko dev->max_mtu = IP_MAX_MTU - t_hlen;
3519992a078SHangbin Liu if (dev->type == ARPHRD_ETHER)
3529992a078SHangbin Liu dev->max_mtu -= dev->hard_header_len;
3539992a078SHangbin Liu
354c5441932SPravin B Shelar ip_tunnel_add(itn, nt);
355c5441932SPravin B Shelar return nt;
356f6cc9c05SPetr Machata
357f6cc9c05SPetr Machata err_dev_set_mtu:
358f6cc9c05SPetr Machata unregister_netdevice(dev);
359f6cc9c05SPetr Machata return ERR_PTR(err);
360c5441932SPravin B Shelar }
361c5441932SPravin B Shelar
ip_tunnel_md_udp_encap(struct sk_buff * skb,struct ip_tunnel_info * info)362ac931d4cSChristian Ehrig void ip_tunnel_md_udp_encap(struct sk_buff *skb, struct ip_tunnel_info *info)
363ac931d4cSChristian Ehrig {
364ac931d4cSChristian Ehrig const struct iphdr *iph = ip_hdr(skb);
365ac931d4cSChristian Ehrig const struct udphdr *udph;
366ac931d4cSChristian Ehrig
367ac931d4cSChristian Ehrig if (iph->protocol != IPPROTO_UDP)
368ac931d4cSChristian Ehrig return;
369ac931d4cSChristian Ehrig
370ac931d4cSChristian Ehrig udph = (struct udphdr *)((__u8 *)iph + (iph->ihl << 2));
371ac931d4cSChristian Ehrig info->encap.sport = udph->source;
372ac931d4cSChristian Ehrig info->encap.dport = udph->dest;
373ac931d4cSChristian Ehrig }
374ac931d4cSChristian Ehrig EXPORT_SYMBOL(ip_tunnel_md_udp_encap);
375ac931d4cSChristian Ehrig
/* Receive path shared by IP tunnels: validate a decapsulated packet and
 * hand it to the tunnel device's GRO cells.
 *
 * @tunnel:        tunnel the packet was matched to
 * @skb:           the packet
 * @tpi:           parsed tunnel header information (flags, sequence number)
 * @tun_dst:       optional metadata dst; attached to @skb on success,
 *                 released on drop
 * @log_ecn_error: whether to log ECN decapsulation problems
 *
 * The packet is dropped (and device error counters are bumped) when its
 * checksum flag disagrees with the tunnel configuration, when sequencing
 * is enabled and the packet has no or an old sequence number, when the
 * inner header cannot be pulled, or when IP_ECN_decapsulate() returns a
 * value greater than 1.  Always returns 0.
 */
int ip_tunnel_rcv(struct ip_tunnel *tunnel, struct sk_buff *skb,
		  const struct tnl_ptk_info *tpi, struct metadata_dst *tun_dst,
		  bool log_ecn_error)
{
	struct net_device *tdev = tunnel->dev;
	const struct iphdr *iph = ip_hdr(skb);
	int nh, err;

#ifdef CONFIG_NET_IPGRE_BROADCAST
	if (ipv4_is_multicast(iph->daddr)) {
		DEV_STATS_INC(tdev, multicast);
		skb->pkt_type = PACKET_BROADCAST;
	}
#endif

	/* packet and tunnel must agree on whether a checksum is used */
	if (!!(tpi->flags & TUNNEL_CSUM) !=
	    !!(tunnel->parms.i_flags & TUNNEL_CSUM)) {
		DEV_STATS_INC(tdev, rx_crc_errors);
		DEV_STATS_INC(tdev, rx_errors);
		goto drop;
	}

	if (tunnel->parms.i_flags & TUNNEL_SEQ) {
		if (!(tpi->flags & TUNNEL_SEQ) ||
		    (tunnel->i_seqno &&
		     (s32)(ntohl(tpi->seq) - tunnel->i_seqno) < 0)) {
			DEV_STATS_INC(tdev, rx_fifo_errors);
			DEV_STATS_INC(tdev, rx_errors);
			goto drop;
		}
		tunnel->i_seqno = ntohl(tpi->seq) + 1;
	}

	/* Remember where the outer header sits relative to skb->head: the
	 * network header is about to be pointed at the inner header, and
	 * skb->head itself might change.
	 */
	nh = skb_network_header(skb) - skb->head;

	skb_set_network_header(skb, (tdev->type == ARPHRD_ETHER) ? ETH_HLEN : 0);

	if (!pskb_inet_may_pull(skb)) {
		DEV_STATS_INC(tdev, rx_length_errors);
		DEV_STATS_INC(tdev, rx_errors);
		goto drop;
	}
	/* recompute the outer header pointer from the saved offset */
	iph = (struct iphdr *)(skb->head + nh);

	err = IP_ECN_decapsulate(iph, skb);
	if (unlikely(err)) {
		if (log_ecn_error)
			net_info_ratelimited("non-ECT from %pI4 with TOS=%#x\n",
					     &iph->saddr, iph->tos);
		if (err > 1) {
			DEV_STATS_INC(tdev, rx_frame_errors);
			DEV_STATS_INC(tdev, rx_errors);
			goto drop;
		}
	}

	dev_sw_netstats_rx_add(tdev, skb->len);
	skb_scrub_packet(skb, !net_eq(tunnel->net, dev_net(tdev)));

	if (tdev->type == ARPHRD_ETHER) {
		skb->protocol = eth_type_trans(skb, tdev);
		skb_postpull_rcsum(skb, eth_hdr(skb), ETH_HLEN);
	} else {
		skb->dev = tdev;
	}

	if (tun_dst)
		skb_dst_set(skb, (struct dst_entry *)tun_dst);

	gro_cells_receive(&tunnel->gro_cells, skb);
	return 0;

drop:
	if (tun_dst)
		dst_release((struct dst_entry *)tun_dst);
	kfree_skb(skb);
	return 0;
}
EXPORT_SYMBOL_GPL(ip_tunnel_rcv);
457c5441932SPravin B Shelar
ip_tunnel_encap_add_ops(const struct ip_tunnel_encap_ops * ops,unsigned int num)458a8c5f90fSTom Herbert int ip_tunnel_encap_add_ops(const struct ip_tunnel_encap_ops *ops,
459a8c5f90fSTom Herbert unsigned int num)
460a8c5f90fSTom Herbert {
461bb1553c8SThomas Graf if (num >= MAX_IPTUN_ENCAP_OPS)
462bb1553c8SThomas Graf return -ERANGE;
463bb1553c8SThomas Graf
464a8c5f90fSTom Herbert return !cmpxchg((const struct ip_tunnel_encap_ops **)
465a8c5f90fSTom Herbert &iptun_encaps[num],
466a8c5f90fSTom Herbert NULL, ops) ? 0 : -1;
46756328486STom Herbert }
468a8c5f90fSTom Herbert EXPORT_SYMBOL(ip_tunnel_encap_add_ops);
469a8c5f90fSTom Herbert
ip_tunnel_encap_del_ops(const struct ip_tunnel_encap_ops * ops,unsigned int num)470a8c5f90fSTom Herbert int ip_tunnel_encap_del_ops(const struct ip_tunnel_encap_ops *ops,
471a8c5f90fSTom Herbert unsigned int num)
472a8c5f90fSTom Herbert {
473a8c5f90fSTom Herbert int ret;
474a8c5f90fSTom Herbert
475bb1553c8SThomas Graf if (num >= MAX_IPTUN_ENCAP_OPS)
476bb1553c8SThomas Graf return -ERANGE;
477bb1553c8SThomas Graf
478a8c5f90fSTom Herbert ret = (cmpxchg((const struct ip_tunnel_encap_ops **)
479a8c5f90fSTom Herbert &iptun_encaps[num],
480a8c5f90fSTom Herbert ops, NULL) == ops) ? 0 : -1;
481a8c5f90fSTom Herbert
482a8c5f90fSTom Herbert synchronize_net();
483a8c5f90fSTom Herbert
484a8c5f90fSTom Herbert return ret;
485a8c5f90fSTom Herbert }
486a8c5f90fSTom Herbert EXPORT_SYMBOL(ip_tunnel_encap_del_ops);
48756328486STom Herbert
ip_tunnel_encap_setup(struct ip_tunnel * t,struct ip_tunnel_encap * ipencap)48856328486STom Herbert int ip_tunnel_encap_setup(struct ip_tunnel *t,
48956328486STom Herbert struct ip_tunnel_encap *ipencap)
49056328486STom Herbert {
49156328486STom Herbert int hlen;
49256328486STom Herbert
49356328486STom Herbert memset(&t->encap, 0, sizeof(t->encap));
49456328486STom Herbert
49556328486STom Herbert hlen = ip_encap_hlen(ipencap);
49656328486STom Herbert if (hlen < 0)
49756328486STom Herbert return hlen;
49856328486STom Herbert
49956328486STom Herbert t->encap.type = ipencap->type;
50056328486STom Herbert t->encap.sport = ipencap->sport;
50156328486STom Herbert t->encap.dport = ipencap->dport;
50256328486STom Herbert t->encap.flags = ipencap->flags;
50356328486STom Herbert
50456328486STom Herbert t->encap_hlen = hlen;
50556328486STom Herbert t->hlen = t->encap_hlen + t->tun_hlen;
50656328486STom Herbert
50756328486STom Herbert return 0;
50856328486STom Herbert }
50956328486STom Herbert EXPORT_SYMBOL_GPL(ip_tunnel_encap_setup);
51056328486STom Herbert
tnl_update_pmtu(struct net_device * dev,struct sk_buff * skb,struct rtable * rt,__be16 df,const struct iphdr * inner_iph,int tunnel_hlen,__be32 dst,bool md)51123a3647bSPravin B Shelar static int tnl_update_pmtu(struct net_device *dev, struct sk_buff *skb,
512fc24f2b2STimo Teräs struct rtable *rt, __be16 df,
513c8b34e68Swenxu const struct iphdr *inner_iph,
514c8b34e68Swenxu int tunnel_hlen, __be32 dst, bool md)
51523a3647bSPravin B Shelar {
51623a3647bSPravin B Shelar struct ip_tunnel *tunnel = netdev_priv(dev);
517c8b34e68Swenxu int pkt_size;
51823a3647bSPravin B Shelar int mtu;
51923a3647bSPravin B Shelar
520c8b34e68Swenxu tunnel_hlen = md ? tunnel_hlen : tunnel->hlen;
52128e104d0SVadim Fedorenko pkt_size = skb->len - tunnel_hlen;
5229992a078SHangbin Liu pkt_size -= dev->type == ARPHRD_ETHER ? dev->hard_header_len : 0;
523c8b34e68Swenxu
5249992a078SHangbin Liu if (df) {
52528e104d0SVadim Fedorenko mtu = dst_mtu(&rt->dst) - (sizeof(struct iphdr) + tunnel_hlen);
5269992a078SHangbin Liu mtu -= dev->type == ARPHRD_ETHER ? dev->hard_header_len : 0;
5279992a078SHangbin Liu } else {
528f4b3ec4eSAlan Maguire mtu = skb_valid_dst(skb) ? dst_mtu(skb_dst(skb)) : dev->mtu;
5299992a078SHangbin Liu }
53023a3647bSPravin B Shelar
531f4b3ec4eSAlan Maguire if (skb_valid_dst(skb))
5327a1592bcSHangbin Liu skb_dst_update_pmtu_no_confirm(skb, mtu);
53323a3647bSPravin B Shelar
53423a3647bSPravin B Shelar if (skb->protocol == htons(ETH_P_IP)) {
53523a3647bSPravin B Shelar if (!skb_is_gso(skb) &&
536fc24f2b2STimo Teräs (inner_iph->frag_off & htons(IP_DF)) &&
537fc24f2b2STimo Teräs mtu < pkt_size) {
5384372339eSJason A. Donenfeld icmp_ndo_send(skb, ICMP_DEST_UNREACH, ICMP_FRAG_NEEDED, htonl(mtu));
53923a3647bSPravin B Shelar return -E2BIG;
54023a3647bSPravin B Shelar }
54123a3647bSPravin B Shelar }
54223a3647bSPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
54323a3647bSPravin B Shelar else if (skb->protocol == htons(ETH_P_IPV6)) {
544f4b3ec4eSAlan Maguire struct rt6_info *rt6;
545c8b34e68Swenxu __be32 daddr;
546c8b34e68Swenxu
547797a4c1fSEric Dumazet rt6 = skb_valid_dst(skb) ? dst_rt6_info(skb_dst(skb)) :
548f4b3ec4eSAlan Maguire NULL;
549c8b34e68Swenxu daddr = md ? dst : tunnel->parms.iph.daddr;
55023a3647bSPravin B Shelar
55123a3647bSPravin B Shelar if (rt6 && mtu < dst_mtu(skb_dst(skb)) &&
55223a3647bSPravin B Shelar mtu >= IPV6_MIN_MTU) {
553c8b34e68Swenxu if ((daddr && !ipv4_is_multicast(daddr)) ||
55423a3647bSPravin B Shelar rt6->rt6i_dst.plen == 128) {
55523a3647bSPravin B Shelar rt6->rt6i_flags |= RTF_MODIFIED;
55623a3647bSPravin B Shelar dst_metric_set(skb_dst(skb), RTAX_MTU, mtu);
55723a3647bSPravin B Shelar }
55823a3647bSPravin B Shelar }
55923a3647bSPravin B Shelar
56023a3647bSPravin B Shelar if (!skb_is_gso(skb) && mtu >= IPV6_MIN_MTU &&
56123a3647bSPravin B Shelar mtu < pkt_size) {
5624372339eSJason A. Donenfeld icmpv6_ndo_send(skb, ICMPV6_PKT_TOOBIG, 0, mtu);
56323a3647bSPravin B Shelar return -E2BIG;
56423a3647bSPravin B Shelar }
56523a3647bSPravin B Shelar }
56623a3647bSPravin B Shelar #endif
56723a3647bSPravin B Shelar return 0;
56823a3647bSPravin B Shelar }
56923a3647bSPravin B Shelar
ip_tunnel_adj_headroom(struct net_device * dev,unsigned int headroom)570a0a1db40SFlorian Westphal static void ip_tunnel_adj_headroom(struct net_device *dev, unsigned int headroom)
571a0a1db40SFlorian Westphal {
572a0a1db40SFlorian Westphal /* we must cap headroom to some upperlimit, else pskb_expand_head
573a0a1db40SFlorian Westphal * will overflow header offsets in skb_headers_offset_update().
574a0a1db40SFlorian Westphal */
575a0a1db40SFlorian Westphal static const unsigned int max_allowed = 512;
576a0a1db40SFlorian Westphal
577a0a1db40SFlorian Westphal if (headroom > max_allowed)
578a0a1db40SFlorian Westphal headroom = max_allowed;
579a0a1db40SFlorian Westphal
580a0a1db40SFlorian Westphal if (headroom > READ_ONCE(dev->needed_headroom))
581a0a1db40SFlorian Westphal WRITE_ONCE(dev->needed_headroom, headroom);
582a0a1db40SFlorian Westphal }
583a0a1db40SFlorian Westphal
/*
 * Transmit @skb through @dev using the per-packet tunnel metadata attached
 * to the skb (skb_tunnel_info()) rather than the device's static parameters.
 *
 * @proto:       IP protocol number for the outer header; ip_tunnel_encap()
 *               is given a pointer to it and may update it.
 * @tunnel_hlen: tunnel header length handed to tnl_update_pmtu(); when zero
 *               it is derived from the metadata's encapsulation settings.
 *
 * The skb is always consumed: it is either handed to iptunnel_xmit() or
 * freed here after bumping the matching device error counter.
 */
void ip_md_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
		       u8 proto, int tunnel_hlen)
{
	struct ip_tunnel *tunnel = netdev_priv(dev);
	const struct ip_tunnel_key *tkey;
	struct ip_tunnel_info *info;
	const struct iphdr *inner;
	struct rtable *route = NULL;
	u32 needed = sizeof(struct iphdr);
	struct flowi4 fl4;
	bool cacheable;
	u8 tos, ttl;
	__be16 df;

	/* Only IPv4 transmit metadata is acceptable on this path. */
	info = skb_tunnel_info(skb);
	if (unlikely(!info))
		goto tx_error;
	if (unlikely(!(info->mode & IP_TUNNEL_INFO_TX)))
		goto tx_error;
	if (unlikely(ip_tunnel_info_af(info) != AF_INET))
		goto tx_error;

	tkey = &info->key;
	memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
	inner = (const struct iphdr *)skb_inner_network_header(skb);

	/* A key TOS of exactly 1 is replaced by the inner header's value. */
	tos = tkey->tos;
	if (tos == 1) {
		switch (skb->protocol) {
		case htons(ETH_P_IP):
			tos = inner->tos;
			break;
		case htons(ETH_P_IPV6):
			tos = ipv6_get_dsfield((const struct ipv6hdr *)inner);
			break;
		default:
			break;
		}
	}

	ip_tunnel_init_flow(&fl4, proto, tkey->u.ipv4.dst, tkey->u.ipv4.src,
			    tunnel_id_to_key32(tkey->tun_id),
			    tos & INET_DSCP_MASK, tunnel->net, 0, skb->mark,
			    skb_get_hash(skb), tkey->flow_flags);

	if (!tunnel_hlen)
		tunnel_hlen = ip_encap_hlen(&info->encap);

	if (ip_tunnel_encap(skb, &info->encap, &proto, &fl4) < 0)
		goto tx_error;

	/* Try the metadata's dst cache first, then fall back to a lookup. */
	cacheable = ip_tunnel_dst_cache_usable(skb, info);
	if (cacheable)
		route = dst_cache_get_ip4(&info->dst_cache, &fl4.saddr);
	if (!route) {
		route = ip_route_output_key(tunnel->net, &fl4);
		if (IS_ERR(route)) {
			DEV_STATS_INC(dev, tx_carrier_errors);
			goto tx_error;
		}
		if (cacheable)
			dst_cache_set_ip4(&info->dst_cache, &route->dst,
					  fl4.saddr);
	}

	/* The route leads back into this very device: refuse to loop. */
	if (route->dst.dev == dev) {
		ip_rt_put(route);
		DEV_STATS_INC(dev, collisions);
		goto tx_error;
	}

	df = (tkey->tun_flags & TUNNEL_DONT_FRAGMENT) ? htons(IP_DF) : 0;
	if (tnl_update_pmtu(dev, skb, route, df, inner, tunnel_hlen,
			    tkey->u.ipv4.dst, true))
		goto put_route_error;

	tos = ip_tunnel_ecn_encap(tos, inner, skb);

	/* A zero key TTL is taken from the inner packet or the route. */
	ttl = tkey->ttl;
	if (ttl == 0) {
		switch (skb->protocol) {
		case htons(ETH_P_IP):
			ttl = inner->ttl;
			break;
		case htons(ETH_P_IPV6):
			ttl = ((const struct ipv6hdr *)inner)->hop_limit;
			break;
		default:
			ttl = ip4_dst_hoplimit(&route->dst);
			break;
		}
	}

	needed += LL_RESERVED_SPACE(route->dst.dev) + route->dst.header_len;
	if (skb_cow_head(skb, needed))
		goto put_route_dropped;

	ip_tunnel_adj_headroom(dev, needed);

	iptunnel_xmit(NULL, route, skb, fl4.saddr, fl4.daddr, proto, tos, ttl,
		      df, !net_eq(tunnel->net, dev_net(dev)));
	return;

put_route_dropped:
	ip_rt_put(route);
	DEV_STATS_INC(dev, tx_dropped);
	goto free_skb;
put_route_error:
	ip_rt_put(route);
tx_error:
	DEV_STATS_INC(dev, tx_errors);
free_skb:
	kfree_skb(skb);
}
EXPORT_SYMBOL_GPL(ip_md_tunnel_xmit);
681cfc7381bSAlexei Starovoitov
ip_tunnel_xmit(struct sk_buff * skb,struct net_device * dev,const struct iphdr * tnl_params,u8 protocol)682c5441932SPravin B Shelar void ip_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
68356328486STom Herbert const struct iphdr *tnl_params, u8 protocol)
684c5441932SPravin B Shelar {
685c5441932SPravin B Shelar struct ip_tunnel *tunnel = netdev_priv(dev);
686186d9366Swenxu struct ip_tunnel_info *tun_info = NULL;
687c5441932SPravin B Shelar const struct iphdr *inner_iph;
688c5441932SPravin B Shelar unsigned int max_headroom; /* The extra header space needed */
689186d9366Swenxu struct rtable *rt = NULL; /* Route to the other host */
6907ae29fd1SMatthias May __be16 payload_protocol;
691186d9366Swenxu bool use_cache = false;
692186d9366Swenxu struct flowi4 fl4;
693186d9366Swenxu bool md = false;
69422fb22eaSTimo Teräs bool connected;
695186d9366Swenxu u8 tos, ttl;
696186d9366Swenxu __be32 dst;
697186d9366Swenxu __be16 df;
698c5441932SPravin B Shelar
699c5441932SPravin B Shelar inner_iph = (const struct iphdr *)skb_inner_network_header(skb);
70022fb22eaSTimo Teräs connected = (tunnel->parms.iph.daddr != 0);
7017ae29fd1SMatthias May payload_protocol = skb_protocol(skb, true);
702c5441932SPravin B Shelar
7035146d1f1SBernie Harris memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));
7045146d1f1SBernie Harris
705c5441932SPravin B Shelar dst = tnl_params->daddr;
706c5441932SPravin B Shelar if (dst == 0) {
707c5441932SPravin B Shelar /* NBMA tunnel */
708c5441932SPravin B Shelar
70951456b29SIan Morris if (!skb_dst(skb)) {
710c4794d22SEric Dumazet DEV_STATS_INC(dev, tx_fifo_errors);
711c5441932SPravin B Shelar goto tx_error;
712c5441932SPravin B Shelar }
713c5441932SPravin B Shelar
714d71b5753Swenxu tun_info = skb_tunnel_info(skb);
715d71b5753Swenxu if (tun_info && (tun_info->mode & IP_TUNNEL_INFO_TX) &&
716d71b5753Swenxu ip_tunnel_info_af(tun_info) == AF_INET &&
717186d9366Swenxu tun_info->key.u.ipv4.dst) {
718d71b5753Swenxu dst = tun_info->key.u.ipv4.dst;
719186d9366Swenxu md = true;
720186d9366Swenxu connected = true;
7217ae29fd1SMatthias May } else if (payload_protocol == htons(ETH_P_IP)) {
722c5441932SPravin B Shelar rt = skb_rtable(skb);
723c5441932SPravin B Shelar dst = rt_nexthop(rt, inner_iph->daddr);
724c5441932SPravin B Shelar }
725c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
7267ae29fd1SMatthias May else if (payload_protocol == htons(ETH_P_IPV6)) {
727c5441932SPravin B Shelar const struct in6_addr *addr6;
728c5441932SPravin B Shelar struct neighbour *neigh;
729c5441932SPravin B Shelar bool do_tx_error_icmp;
730c5441932SPravin B Shelar int addr_type;
731c5441932SPravin B Shelar
732c5441932SPravin B Shelar neigh = dst_neigh_lookup(skb_dst(skb),
733c5441932SPravin B Shelar &ipv6_hdr(skb)->daddr);
73451456b29SIan Morris if (!neigh)
735c5441932SPravin B Shelar goto tx_error;
736c5441932SPravin B Shelar
737c5441932SPravin B Shelar addr6 = (const struct in6_addr *)&neigh->primary_key;
738c5441932SPravin B Shelar addr_type = ipv6_addr_type(addr6);
739c5441932SPravin B Shelar
740c5441932SPravin B Shelar if (addr_type == IPV6_ADDR_ANY) {
741c5441932SPravin B Shelar addr6 = &ipv6_hdr(skb)->daddr;
742c5441932SPravin B Shelar addr_type = ipv6_addr_type(addr6);
743c5441932SPravin B Shelar }
744c5441932SPravin B Shelar
745c5441932SPravin B Shelar if ((addr_type & IPV6_ADDR_COMPATv4) == 0)
746c5441932SPravin B Shelar do_tx_error_icmp = true;
747c5441932SPravin B Shelar else {
748c5441932SPravin B Shelar do_tx_error_icmp = false;
749c5441932SPravin B Shelar dst = addr6->s6_addr32[3];
750c5441932SPravin B Shelar }
751c5441932SPravin B Shelar neigh_release(neigh);
752c5441932SPravin B Shelar if (do_tx_error_icmp)
753c5441932SPravin B Shelar goto tx_error_icmp;
754c5441932SPravin B Shelar }
755c5441932SPravin B Shelar #endif
756c5441932SPravin B Shelar else
757c5441932SPravin B Shelar goto tx_error;
7587d442fabSTom Herbert
759186d9366Swenxu if (!md)
7607d442fabSTom Herbert connected = false;
761c5441932SPravin B Shelar }
762c5441932SPravin B Shelar
763c5441932SPravin B Shelar tos = tnl_params->tos;
764c5441932SPravin B Shelar if (tos & 0x1) {
765c5441932SPravin B Shelar tos &= ~0x1;
7667ae29fd1SMatthias May if (payload_protocol == htons(ETH_P_IP)) {
767c5441932SPravin B Shelar tos = inner_iph->tos;
7687d442fabSTom Herbert connected = false;
7697ae29fd1SMatthias May } else if (payload_protocol == htons(ETH_P_IPV6)) {
770c5441932SPravin B Shelar tos = ipv6_get_dsfield((const struct ipv6hdr *)inner_iph);
7717d442fabSTom Herbert connected = false;
7727d442fabSTom Herbert }
773c5441932SPravin B Shelar }
774c5441932SPravin B Shelar
775b0066da5SPetr Machata ip_tunnel_init_flow(&fl4, protocol, dst, tnl_params->saddr,
7767e9aa1a0SIdo Schimmel tunnel->parms.o_key, tos & INET_DSCP_MASK,
77736eff866SXiao Liang tunnel->net, READ_ONCE(tunnel->parms.link),
7787ec9fce4SEyal Birger tunnel->fwmark, skb_get_hash(skb), 0);
7797d442fabSTom Herbert
780ac931d4cSChristian Ehrig if (ip_tunnel_encap(skb, &tunnel->encap, &protocol, &fl4) < 0)
78156328486STom Herbert goto tx_error;
78256328486STom Herbert
783186d9366Swenxu if (connected && md) {
784186d9366Swenxu use_cache = ip_tunnel_dst_cache_usable(skb, tun_info);
785186d9366Swenxu if (use_cache)
786186d9366Swenxu rt = dst_cache_get_ip4(&tun_info->dst_cache,
787186d9366Swenxu &fl4.saddr);
788186d9366Swenxu } else {
789186d9366Swenxu rt = connected ? dst_cache_get_ip4(&tunnel->dst_cache,
790186d9366Swenxu &fl4.saddr) : NULL;
791186d9366Swenxu }
7927d442fabSTom Herbert
7937d442fabSTom Herbert if (!rt) {
7947d442fabSTom Herbert rt = ip_route_output_key(tunnel->net, &fl4);
7957d442fabSTom Herbert
796c5441932SPravin B Shelar if (IS_ERR(rt)) {
797c4794d22SEric Dumazet DEV_STATS_INC(dev, tx_carrier_errors);
798c5441932SPravin B Shelar goto tx_error;
799c5441932SPravin B Shelar }
800186d9366Swenxu if (use_cache)
801186d9366Swenxu dst_cache_set_ip4(&tun_info->dst_cache, &rt->dst,
802186d9366Swenxu fl4.saddr);
803186d9366Swenxu else if (!md && connected)
804e09acddfSPaolo Abeni dst_cache_set_ip4(&tunnel->dst_cache, &rt->dst,
805e09acddfSPaolo Abeni fl4.saddr);
8067d442fabSTom Herbert }
8077d442fabSTom Herbert
8080e6fbc5bSPravin B Shelar if (rt->dst.dev == dev) {
809c5441932SPravin B Shelar ip_rt_put(rt);
810c4794d22SEric Dumazet DEV_STATS_INC(dev, collisions);
811c5441932SPravin B Shelar goto tx_error;
812c5441932SPravin B Shelar }
813c5441932SPravin B Shelar
81450c66167SFlorian Westphal df = tnl_params->frag_off;
8157ae29fd1SMatthias May if (payload_protocol == htons(ETH_P_IP) && !tunnel->ignore_df)
81650c66167SFlorian Westphal df |= (inner_iph->frag_off & htons(IP_DF));
81750c66167SFlorian Westphal
81850c66167SFlorian Westphal if (tnl_update_pmtu(dev, skb, rt, df, inner_iph, 0, 0, false)) {
819c5441932SPravin B Shelar ip_rt_put(rt);
820c5441932SPravin B Shelar goto tx_error;
821c5441932SPravin B Shelar }
822c5441932SPravin B Shelar
823c5441932SPravin B Shelar if (tunnel->err_count > 0) {
824c5441932SPravin B Shelar if (time_before(jiffies,
825c5441932SPravin B Shelar tunnel->err_time + IPTUNNEL_ERR_TIMEO)) {
826c5441932SPravin B Shelar tunnel->err_count--;
827c5441932SPravin B Shelar
828c5441932SPravin B Shelar dst_link_failure(skb);
829c5441932SPravin B Shelar } else
830c5441932SPravin B Shelar tunnel->err_count = 0;
831c5441932SPravin B Shelar }
832c5441932SPravin B Shelar
833d4a71b15SPravin B Shelar tos = ip_tunnel_ecn_encap(tos, inner_iph, skb);
834c5441932SPravin B Shelar ttl = tnl_params->ttl;
835c5441932SPravin B Shelar if (ttl == 0) {
8367ae29fd1SMatthias May if (payload_protocol == htons(ETH_P_IP))
837c5441932SPravin B Shelar ttl = inner_iph->ttl;
838c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
8397ae29fd1SMatthias May else if (payload_protocol == htons(ETH_P_IPV6))
840c5441932SPravin B Shelar ttl = ((const struct ipv6hdr *)inner_iph)->hop_limit;
841c5441932SPravin B Shelar #endif
842c5441932SPravin B Shelar else
843c5441932SPravin B Shelar ttl = ip4_dst_hoplimit(&rt->dst);
844c5441932SPravin B Shelar }
845c5441932SPravin B Shelar
8460e6fbc5bSPravin B Shelar max_headroom = LL_RESERVED_SPACE(rt->dst.dev) + sizeof(struct iphdr)
8477371e022STom Herbert + rt->dst.header_len + ip_encap_hlen(&tunnel->encap);
8483e08f4a7SSteffen Klassert
849a0a1db40SFlorian Westphal if (skb_cow_head(skb, max_headroom)) {
850586d5fc8SDmitry Popov ip_rt_put(rt);
851c4794d22SEric Dumazet DEV_STATS_INC(dev, tx_dropped);
8523acfa1e7SEric Dumazet kfree_skb(skb);
853c5441932SPravin B Shelar return;
854c5441932SPravin B Shelar }
855c5441932SPravin B Shelar
856a0a1db40SFlorian Westphal ip_tunnel_adj_headroom(dev, max_headroom);
857a0a1db40SFlorian Westphal
858039f5062SPravin B Shelar iptunnel_xmit(NULL, rt, skb, fl4.saddr, fl4.daddr, protocol, tos, ttl,
859039f5062SPravin B Shelar df, !net_eq(tunnel->net, dev_net(dev)));
860c5441932SPravin B Shelar return;
861c5441932SPravin B Shelar
862c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
863c5441932SPravin B Shelar tx_error_icmp:
864c5441932SPravin B Shelar dst_link_failure(skb);
865c5441932SPravin B Shelar #endif
866c5441932SPravin B Shelar tx_error:
867c4794d22SEric Dumazet DEV_STATS_INC(dev, tx_errors);
8683acfa1e7SEric Dumazet kfree_skb(skb);
869c5441932SPravin B Shelar }
870c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_xmit);
871c5441932SPravin B Shelar
/*
 * Apply the parameters in @p to the existing tunnel @t on device @dev.
 *
 * The tunnel is removed from @itn while its addresses and keys change and
 * re-added afterwards. When the underlying link or @fwmark changes, the
 * device is re-bound and, if @set_mtu is true, its MTU is updated to the
 * value returned by ip_tunnel_bind_dev(). The tunnel's dst cache is always
 * reset and a state-change notification is sent for @dev.
 */
static void ip_tunnel_update(struct ip_tunnel_net *itn,
			     struct ip_tunnel *t,
			     struct net_device *dev,
			     struct ip_tunnel_parm *p,
			     bool set_mtu,
			     __u32 fwmark)
{
	struct iphdr *cur = &t->parms.iph;
	const struct iphdr *req = &p->iph;

	/* Addresses and keys change while the tunnel is out of the table. */
	ip_tunnel_del(itn, t);
	cur->saddr = req->saddr;
	cur->daddr = req->daddr;
	t->parms.i_key = p->i_key;
	t->parms.o_key = p->o_key;
	if (dev->type != ARPHRD_ETHER) {
		/* Non-Ethernet devices expose the endpoints as hw addresses. */
		__dev_addr_set(dev, &req->saddr, sizeof(req->saddr));
		memcpy(dev->broadcast, &req->daddr, sizeof(req->daddr));
	}
	ip_tunnel_add(itn, t);

	cur->ttl = req->ttl;
	cur->tos = req->tos;
	cur->frag_off = req->frag_off;

	if (t->parms.link != p->link || t->fwmark != fwmark) {
		int new_mtu;

		WRITE_ONCE(t->parms.link, p->link);
		t->fwmark = fwmark;
		new_mtu = ip_tunnel_bind_dev(dev);
		if (set_mtu)
			dev->mtu = new_mtu;
	}

	dst_cache_reset(&t->dst_cache);
	netdev_state_change(dev);
}
906c5441932SPravin B Shelar
ip_tunnel_ctl(struct net_device * dev,struct ip_tunnel_parm * p,int cmd)907607259a6SChristoph Hellwig int ip_tunnel_ctl(struct net_device *dev, struct ip_tunnel_parm *p, int cmd)
908c5441932SPravin B Shelar {
909c5441932SPravin B Shelar int err = 0;
9108c923ce2SNicolas Dichtel struct ip_tunnel *t = netdev_priv(dev);
9118c923ce2SNicolas Dichtel struct net *net = t->net;
9128c923ce2SNicolas Dichtel struct ip_tunnel_net *itn = net_generic(net, t->ip_tnl_net_id);
913c5441932SPravin B Shelar
914c5441932SPravin B Shelar switch (cmd) {
915c5441932SPravin B Shelar case SIOCGETTUNNEL:
9168c923ce2SNicolas Dichtel if (dev == itn->fb_tunnel_dev) {
917c5441932SPravin B Shelar t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
91851456b29SIan Morris if (!t)
919c5441932SPravin B Shelar t = netdev_priv(dev);
9208c923ce2SNicolas Dichtel }
921c5441932SPravin B Shelar memcpy(p, &t->parms, sizeof(*p));
922c5441932SPravin B Shelar break;
923c5441932SPravin B Shelar
924c5441932SPravin B Shelar case SIOCADDTUNNEL:
925c5441932SPravin B Shelar case SIOCCHGTUNNEL:
926c5441932SPravin B Shelar err = -EPERM;
927c5441932SPravin B Shelar if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
928c5441932SPravin B Shelar goto done;
929c5441932SPravin B Shelar if (p->iph.ttl)
930c5441932SPravin B Shelar p->iph.frag_off |= htons(IP_DF);
9317c8e6b9cSDmitry Popov if (!(p->i_flags & VTI_ISVTI)) {
932c5441932SPravin B Shelar if (!(p->i_flags & TUNNEL_KEY))
933c5441932SPravin B Shelar p->i_key = 0;
934c5441932SPravin B Shelar if (!(p->o_flags & TUNNEL_KEY))
935c5441932SPravin B Shelar p->o_key = 0;
9367c8e6b9cSDmitry Popov }
937c5441932SPravin B Shelar
93879134e6cSEric Dumazet t = ip_tunnel_find(itn, p, itn->type);
939c5441932SPravin B Shelar
940d61746b2SSteffen Klassert if (cmd == SIOCADDTUNNEL) {
941d61746b2SSteffen Klassert if (!t) {
942c5441932SPravin B Shelar t = ip_tunnel_create(net, itn, p);
943ee30ef4dSDuan Jiong err = PTR_ERR_OR_ZERO(t);
9446dd3c9ecSFlorian Westphal break;
9456dd3c9ecSFlorian Westphal }
946d61746b2SSteffen Klassert
947d61746b2SSteffen Klassert err = -EEXIST;
948d61746b2SSteffen Klassert break;
949d61746b2SSteffen Klassert }
950c5441932SPravin B Shelar if (dev != itn->fb_tunnel_dev && cmd == SIOCCHGTUNNEL) {
95100db4124SIan Morris if (t) {
952c5441932SPravin B Shelar if (t->dev != dev) {
953c5441932SPravin B Shelar err = -EEXIST;
954c5441932SPravin B Shelar break;
955c5441932SPravin B Shelar }
956c5441932SPravin B Shelar } else {
957c5441932SPravin B Shelar unsigned int nflags = 0;
958c5441932SPravin B Shelar
959c5441932SPravin B Shelar if (ipv4_is_multicast(p->iph.daddr))
960c5441932SPravin B Shelar nflags = IFF_BROADCAST;
961c5441932SPravin B Shelar else if (p->iph.daddr)
962c5441932SPravin B Shelar nflags = IFF_POINTOPOINT;
963c5441932SPravin B Shelar
964c5441932SPravin B Shelar if ((dev->flags^nflags)&(IFF_POINTOPOINT|IFF_BROADCAST)) {
965c5441932SPravin B Shelar err = -EINVAL;
966c5441932SPravin B Shelar break;
967c5441932SPravin B Shelar }
968c5441932SPravin B Shelar
969c5441932SPravin B Shelar t = netdev_priv(dev);
970c5441932SPravin B Shelar }
971c5441932SPravin B Shelar }
972c5441932SPravin B Shelar
973c5441932SPravin B Shelar if (t) {
974c5441932SPravin B Shelar err = 0;
9759830ad4cSCraig Gallek ip_tunnel_update(itn, t, dev, p, true, 0);
9766dd3c9ecSFlorian Westphal } else {
9776dd3c9ecSFlorian Westphal err = -ENOENT;
9786dd3c9ecSFlorian Westphal }
979c5441932SPravin B Shelar break;
980c5441932SPravin B Shelar
981c5441932SPravin B Shelar case SIOCDELTUNNEL:
982c5441932SPravin B Shelar err = -EPERM;
983c5441932SPravin B Shelar if (!ns_capable(net->user_ns, CAP_NET_ADMIN))
984c5441932SPravin B Shelar goto done;
985c5441932SPravin B Shelar
986c5441932SPravin B Shelar if (dev == itn->fb_tunnel_dev) {
987c5441932SPravin B Shelar err = -ENOENT;
988c5441932SPravin B Shelar t = ip_tunnel_find(itn, p, itn->fb_tunnel_dev->type);
98951456b29SIan Morris if (!t)
990c5441932SPravin B Shelar goto done;
991c5441932SPravin B Shelar err = -EPERM;
992c5441932SPravin B Shelar if (t == netdev_priv(itn->fb_tunnel_dev))
993c5441932SPravin B Shelar goto done;
994c5441932SPravin B Shelar dev = t->dev;
995c5441932SPravin B Shelar }
996c5441932SPravin B Shelar unregister_netdevice(dev);
997c5441932SPravin B Shelar err = 0;
998c5441932SPravin B Shelar break;
999c5441932SPravin B Shelar
1000c5441932SPravin B Shelar default:
1001c5441932SPravin B Shelar err = -EINVAL;
1002c5441932SPravin B Shelar }
1003c5441932SPravin B Shelar
1004c5441932SPravin B Shelar done:
1005c5441932SPravin B Shelar return err;
1006c5441932SPravin B Shelar }
1007607259a6SChristoph Hellwig EXPORT_SYMBOL_GPL(ip_tunnel_ctl);
1008607259a6SChristoph Hellwig
/*
 * Private-ioctl entry point: copy a struct ip_tunnel_parm in from the user
 * buffer @data, pass it to the device's ndo_tunnel_ctl() with @cmd, and on
 * success copy the (possibly updated) parameters back out.
 *
 * Returns the ndo_tunnel_ctl() result, or -EFAULT if either user copy
 * fails. @ifr is not used here.
 */
int ip_tunnel_siocdevprivate(struct net_device *dev, struct ifreq *ifr,
			     void __user *data, int cmd)
{
	struct ip_tunnel_parm parm;
	int ret;

	if (copy_from_user(&parm, data, sizeof(parm)))
		return -EFAULT;

	ret = dev->netdev_ops->ndo_tunnel_ctl(dev, &parm, cmd);
	if (ret)
		return ret;

	/* Only a successful call reports its parameters back to userspace. */
	if (copy_to_user(data, &parm, sizeof(parm)))
		return -EFAULT;

	return 0;
}
EXPORT_SYMBOL_GPL(ip_tunnel_siocdevprivate);
1023c5441932SPravin B Shelar
/*
 * Set the MTU of tunnel device @dev to @new_mtu.
 *
 * The upper bound is IP_MAX_MTU minus the tunnel header and outer IPv4
 * header, and additionally minus the link-layer header for ARPHRD_ETHER
 * devices. Values below ETH_MIN_MTU are always rejected.
 *
 * @strict: when true, a value above the upper bound fails with -EINVAL;
 *          when false, it is silently clamped to the upper bound.
 *
 * Returns 0 on success or -EINVAL.
 */
int __ip_tunnel_change_mtu(struct net_device *dev, int new_mtu, bool strict)
{
	struct ip_tunnel *tunnel = netdev_priv(dev);
	int t_hlen = tunnel->hlen + sizeof(struct iphdr);
	int max_mtu = IP_MAX_MTU - t_hlen;

	if (dev->type == ARPHRD_ETHER)
		max_mtu -= dev->hard_header_len;

	if (new_mtu < ETH_MIN_MTU)
		return -EINVAL;

	if (new_mtu > max_mtu) {
		if (strict)
			return -EINVAL;

		new_mtu = max_mtu;
	}

	/*
	 * NOTE(review): dev->mtu is presumably read without locks by
	 * data-path code; annotate the store, as already done in this file
	 * for needed_headroom and parms.link, so it cannot be torn.
	 */
	WRITE_ONCE(dev->mtu, new_mtu);
	return 0;
}
EXPORT_SYMBOL_GPL(__ip_tunnel_change_mtu);
10477e059158SDavid Wragg
ip_tunnel_change_mtu(struct net_device * dev,int new_mtu)10487e059158SDavid Wragg int ip_tunnel_change_mtu(struct net_device *dev, int new_mtu)
10497e059158SDavid Wragg {
10507e059158SDavid Wragg return __ip_tunnel_change_mtu(dev, new_mtu, true);
10517e059158SDavid Wragg }
1052c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_change_mtu);
1053c5441932SPravin B Shelar
ip_tunnel_dev_free(struct net_device * dev)1054c5441932SPravin B Shelar static void ip_tunnel_dev_free(struct net_device *dev)
1055c5441932SPravin B Shelar {
1056c5441932SPravin B Shelar struct ip_tunnel *tunnel = netdev_priv(dev);
1057c5441932SPravin B Shelar
1058c5441932SPravin B Shelar gro_cells_destroy(&tunnel->gro_cells);
1059e09acddfSPaolo Abeni dst_cache_destroy(&tunnel->dst_cache);
1060c5441932SPravin B Shelar free_percpu(dev->tstats);
1061c5441932SPravin B Shelar }
1062c5441932SPravin B Shelar
ip_tunnel_dellink(struct net_device * dev,struct list_head * head)1063c5441932SPravin B Shelar void ip_tunnel_dellink(struct net_device *dev, struct list_head *head)
1064c5441932SPravin B Shelar {
1065c5441932SPravin B Shelar struct ip_tunnel *tunnel = netdev_priv(dev);
1066c5441932SPravin B Shelar struct ip_tunnel_net *itn;
1067c5441932SPravin B Shelar
10686c742e71SNicolas Dichtel itn = net_generic(tunnel->net, tunnel->ip_tnl_net_id);
1069c5441932SPravin B Shelar
1070c5441932SPravin B Shelar if (itn->fb_tunnel_dev != dev) {
10712e15ea39SPravin B Shelar ip_tunnel_del(itn, netdev_priv(dev));
1072c5441932SPravin B Shelar unregister_netdevice_queue(dev, head);
1073c5441932SPravin B Shelar }
1074c5441932SPravin B Shelar }
1075c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_dellink);
1076c5441932SPravin B Shelar
ip_tunnel_get_link_net(const struct net_device * dev)10771728d4faSNicolas Dichtel struct net *ip_tunnel_get_link_net(const struct net_device *dev)
10781728d4faSNicolas Dichtel {
10791728d4faSNicolas Dichtel struct ip_tunnel *tunnel = netdev_priv(dev);
10801728d4faSNicolas Dichtel
10811728d4faSNicolas Dichtel return tunnel->net;
10821728d4faSNicolas Dichtel }
10831728d4faSNicolas Dichtel EXPORT_SYMBOL(ip_tunnel_get_link_net);
10841728d4faSNicolas Dichtel
ip_tunnel_get_iflink(const struct net_device * dev)10851e99584bSNicolas Dichtel int ip_tunnel_get_iflink(const struct net_device *dev)
10861e99584bSNicolas Dichtel {
108777b1e00fSEric Dumazet const struct ip_tunnel *tunnel = netdev_priv(dev);
10881e99584bSNicolas Dichtel
108977b1e00fSEric Dumazet return READ_ONCE(tunnel->parms.link);
10901e99584bSNicolas Dichtel }
10911e99584bSNicolas Dichtel EXPORT_SYMBOL(ip_tunnel_get_iflink);
10921e99584bSNicolas Dichtel
ip_tunnel_init_net(struct net * net,unsigned int ip_tnl_net_id,struct rtnl_link_ops * ops,char * devname)1093c7d03a00SAlexey Dobriyan int ip_tunnel_init_net(struct net *net, unsigned int ip_tnl_net_id,
1094c5441932SPravin B Shelar struct rtnl_link_ops *ops, char *devname)
1095c5441932SPravin B Shelar {
1096c5441932SPravin B Shelar struct ip_tunnel_net *itn = net_generic(net, ip_tnl_net_id);
1097c5441932SPravin B Shelar struct ip_tunnel_parm parms;
10986261d983Sstephen hemminger unsigned int i;
1099c5441932SPravin B Shelar
110079134e6cSEric Dumazet itn->rtnl_link_ops = ops;
11016261d983Sstephen hemminger for (i = 0; i < IP_TNL_HASH_SIZE; i++)
11026261d983Sstephen hemminger INIT_HLIST_HEAD(&itn->tunnels[i]);
1103c5441932SPravin B Shelar
110479134e6cSEric Dumazet if (!ops || !net_has_fallback_tunnels(net)) {
110579134e6cSEric Dumazet struct ip_tunnel_net *it_init_net;
110679134e6cSEric Dumazet
110779134e6cSEric Dumazet it_init_net = net_generic(&init_net, ip_tnl_net_id);
110879134e6cSEric Dumazet itn->type = it_init_net->type;
1109c5441932SPravin B Shelar itn->fb_tunnel_dev = NULL;
1110c5441932SPravin B Shelar return 0;
1111c5441932SPravin B Shelar }
11126261d983Sstephen hemminger
1113c5441932SPravin B Shelar memset(&parms, 0, sizeof(parms));
1114c5441932SPravin B Shelar if (devname)
1115512b2dc4SXueBing Chen strscpy(parms.name, devname, IFNAMSIZ);
1116c5441932SPravin B Shelar
1117c5441932SPravin B Shelar rtnl_lock();
1118c5441932SPravin B Shelar itn->fb_tunnel_dev = __ip_tunnel_create(net, ops, &parms);
1119ea857f28SDan Carpenter /* FB netdevice is special: we have one, and only one per netns.
1120ea857f28SDan Carpenter * Allowing to move it to another netns is clearly unsafe.
1121ea857f28SDan Carpenter */
112267013282SSteffen Klassert if (!IS_ERR(itn->fb_tunnel_dev)) {
1123ea857f28SDan Carpenter itn->fb_tunnel_dev->features |= NETIF_F_NETNS_LOCAL;
112478ff4be4SSteffen Klassert itn->fb_tunnel_dev->mtu = ip_tunnel_bind_dev(itn->fb_tunnel_dev);
112567013282SSteffen Klassert ip_tunnel_add(itn, netdev_priv(itn->fb_tunnel_dev));
112679134e6cSEric Dumazet itn->type = itn->fb_tunnel_dev->type;
112767013282SSteffen Klassert }
1128b4de77adSDan Carpenter rtnl_unlock();
1129c5441932SPravin B Shelar
113027d79f3bSSachin Kamat return PTR_ERR_OR_ZERO(itn->fb_tunnel_dev);
1131c5441932SPravin B Shelar }
1132c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_init_net);
1133c5441932SPravin B Shelar
ip_tunnel_destroy(struct net * net,struct ip_tunnel_net * itn,struct list_head * head,struct rtnl_link_ops * ops)113479134e6cSEric Dumazet static void ip_tunnel_destroy(struct net *net, struct ip_tunnel_net *itn,
113579134e6cSEric Dumazet struct list_head *head,
11366c742e71SNicolas Dichtel struct rtnl_link_ops *ops)
1137c5441932SPravin B Shelar {
11386c742e71SNicolas Dichtel struct net_device *dev, *aux;
1139c5441932SPravin B Shelar int h;
1140c5441932SPravin B Shelar
11416c742e71SNicolas Dichtel for_each_netdev_safe(net, dev, aux)
11426c742e71SNicolas Dichtel if (dev->rtnl_link_ops == ops)
11436c742e71SNicolas Dichtel unregister_netdevice_queue(dev, head);
11446c742e71SNicolas Dichtel
1145c5441932SPravin B Shelar for (h = 0; h < IP_TNL_HASH_SIZE; h++) {
1146c5441932SPravin B Shelar struct ip_tunnel *t;
1147c5441932SPravin B Shelar struct hlist_node *n;
1148c5441932SPravin B Shelar struct hlist_head *thead = &itn->tunnels[h];
1149c5441932SPravin B Shelar
1150c5441932SPravin B Shelar hlist_for_each_entry_safe(t, n, thead, hash_node)
11516c742e71SNicolas Dichtel /* If dev is in the same netns, it has already
11526c742e71SNicolas Dichtel * been added to the list by the previous loop.
11536c742e71SNicolas Dichtel */
11546c742e71SNicolas Dichtel if (!net_eq(dev_net(t->dev), net))
1155c5441932SPravin B Shelar unregister_netdevice_queue(t->dev, head);
1156c5441932SPravin B Shelar }
1157c5441932SPravin B Shelar }
1158c5441932SPravin B Shelar
ip_tunnel_delete_nets(struct list_head * net_list,unsigned int id,struct rtnl_link_ops * ops)115964bc1781SEric Dumazet void ip_tunnel_delete_nets(struct list_head *net_list, unsigned int id,
116064bc1781SEric Dumazet struct rtnl_link_ops *ops)
1161c5441932SPravin B Shelar {
116264bc1781SEric Dumazet struct ip_tunnel_net *itn;
116364bc1781SEric Dumazet struct net *net;
1164c5441932SPravin B Shelar LIST_HEAD(list);
1165c5441932SPravin B Shelar
1166c5441932SPravin B Shelar rtnl_lock();
116764bc1781SEric Dumazet list_for_each_entry(net, net_list, exit_list) {
116864bc1781SEric Dumazet itn = net_generic(net, id);
116979134e6cSEric Dumazet ip_tunnel_destroy(net, itn, &list, ops);
117064bc1781SEric Dumazet }
1171c5441932SPravin B Shelar unregister_netdevice_many(&list);
1172c5441932SPravin B Shelar rtnl_unlock();
1173c5441932SPravin B Shelar }
117464bc1781SEric Dumazet EXPORT_SYMBOL_GPL(ip_tunnel_delete_nets);
1175c5441932SPravin B Shelar
/*
 * Register a new tunnel device @dev configured from @p and @fwmark.
 *
 * @tb: netlink attributes; IFLA_ADDRESS suppresses the random MAC for
 *      ARPHRD_ETHER devices, IFLA_MTU makes the device's current MTU
 *      (clamped to the valid range) take precedence over the value
 *      computed by ip_tunnel_bind_dev().
 *
 * Returns 0 on success, -EEXIST if a conflicting tunnel already exists
 * (for collect_md devices: if the netns already has a collect_md tunnel),
 * or the error from register_netdevice()/dev_set_mtu(). A dev_set_mtu()
 * failure unregisters the device again.
 *
 * NOTE(review): rtnl_dereference() is used, so this presumably runs with
 * RTNL held - confirm against the callers.
 */
int ip_tunnel_newlink(struct net_device *dev, struct nlattr *tb[],
		      struct ip_tunnel_parm *p, __u32 fwmark)
{
	struct net *net = dev_net(dev);
	struct ip_tunnel *nt = netdev_priv(dev);
	struct ip_tunnel_net *itn = net_generic(net, nt->ip_tnl_net_id);
	bool exists;
	int mtu;
	int err;

	if (nt->collect_md)
		exists = rtnl_dereference(itn->collect_md_tun) != NULL;
	else
		exists = ip_tunnel_find(itn, p, dev->type) != NULL;
	if (exists)
		return -EEXIST;

	nt->net = net;
	nt->parms = *p;
	nt->fwmark = fwmark;

	err = register_netdevice(dev);
	if (err)
		return err;

	if (dev->type == ARPHRD_ETHER && !tb[IFLA_ADDRESS])
		eth_hw_addr_random(dev);

	mtu = ip_tunnel_bind_dev(dev);
	if (tb[IFLA_MTU]) {
		/* Largest MTU that still leaves room for the outer headers. */
		unsigned int max = IP_MAX_MTU - (nt->hlen + sizeof(struct iphdr));

		if (dev->type == ARPHRD_ETHER)
			max -= dev->hard_header_len;

		mtu = clamp(dev->mtu, (unsigned int)ETH_MIN_MTU, max);
	}

	err = dev_set_mtu(dev, mtu);
	if (err) {
		unregister_netdevice(dev);
		return err;
	}

	ip_tunnel_add(itn, nt);
	return 0;
}
EXPORT_SYMBOL_GPL(ip_tunnel_newlink);
1229c5441932SPravin B Shelar
/*
 * Change the parameters of existing tunnel device @dev to @p / @fwmark.
 *
 * @tb: netlink attributes; the MTU is only recomputed by the update when
 *      IFLA_MTU is absent.
 *
 * Returns 0 on success, -EINVAL for the fallback device or when the new
 * destination would change a non-Ethernet device's point-to-point or
 * broadcast nature, and -EEXIST when @p already describes a different
 * device's tunnel.
 */
int ip_tunnel_changelink(struct net_device *dev, struct nlattr *tb[],
			 struct ip_tunnel_parm *p, __u32 fwmark)
{
	struct ip_tunnel *self = netdev_priv(dev);
	struct net *net = self->net;
	struct ip_tunnel_net *itn = net_generic(net, self->ip_tnl_net_id);
	struct ip_tunnel *target;

	if (dev == itn->fb_tunnel_dev)
		return -EINVAL;

	target = ip_tunnel_find(itn, p, dev->type);
	if (target) {
		/* The new parameters already belong to someone else. */
		if (target->dev != dev)
			return -EEXIST;
	} else {
		target = self;

		if (dev->type != ARPHRD_ETHER) {
			unsigned int nflags = 0;

			if (ipv4_is_multicast(p->iph.daddr))
				nflags = IFF_BROADCAST;
			else if (p->iph.daddr)
				nflags = IFF_POINTOPOINT;

			/* The device's link type must not change. */
			if ((dev->flags ^ nflags) &
			    (IFF_POINTOPOINT | IFF_BROADCAST))
				return -EINVAL;
		}
	}

	ip_tunnel_update(itn, target, dev, p, !tb[IFLA_MTU], fwmark);
	return 0;
}
EXPORT_SYMBOL_GPL(ip_tunnel_changelink);
1267c5441932SPravin B Shelar
ip_tunnel_init(struct net_device * dev)1268c5441932SPravin B Shelar int ip_tunnel_init(struct net_device *dev)
1269c5441932SPravin B Shelar {
1270c5441932SPravin B Shelar struct ip_tunnel *tunnel = netdev_priv(dev);
1271c5441932SPravin B Shelar struct iphdr *iph = &tunnel->parms.iph;
12721c213bd2SWANG Cong int err;
1273c5441932SPravin B Shelar
1274cf124db5SDavid S. Miller dev->needs_free_netdev = true;
1275cf124db5SDavid S. Miller dev->priv_destructor = ip_tunnel_dev_free;
12761c213bd2SWANG Cong dev->tstats = netdev_alloc_pcpu_stats(struct pcpu_sw_netstats);
1277c5441932SPravin B Shelar if (!dev->tstats)
1278c5441932SPravin B Shelar return -ENOMEM;
1279c5441932SPravin B Shelar
1280e09acddfSPaolo Abeni err = dst_cache_init(&tunnel->dst_cache, GFP_KERNEL);
1281e09acddfSPaolo Abeni if (err) {
12829a4aa9afSTom Herbert free_percpu(dev->tstats);
1283e09acddfSPaolo Abeni return err;
12849a4aa9afSTom Herbert }
12859a4aa9afSTom Herbert
1286c5441932SPravin B Shelar err = gro_cells_init(&tunnel->gro_cells, dev);
1287c5441932SPravin B Shelar if (err) {
1288e09acddfSPaolo Abeni dst_cache_destroy(&tunnel->dst_cache);
1289c5441932SPravin B Shelar free_percpu(dev->tstats);
1290c5441932SPravin B Shelar return err;
1291c5441932SPravin B Shelar }
1292c5441932SPravin B Shelar
1293c5441932SPravin B Shelar tunnel->dev = dev;
12946c742e71SNicolas Dichtel tunnel->net = dev_net(dev);
1295c5441932SPravin B Shelar strcpy(tunnel->parms.name, dev->name);
1296c5441932SPravin B Shelar iph->version = 4;
1297c5441932SPravin B Shelar iph->ihl = 5;
1298c5441932SPravin B Shelar
1299d0f41851SWilliam Dauchy if (tunnel->collect_md)
13002e15ea39SPravin B Shelar netif_keep_dst(dev);
1301a7b862abSEric Dumazet netdev_lockdep_set_classes(dev);
1302c5441932SPravin B Shelar return 0;
1303c5441932SPravin B Shelar }
1304c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_init);
1305c5441932SPravin B Shelar
ip_tunnel_uninit(struct net_device * dev)1306c5441932SPravin B Shelar void ip_tunnel_uninit(struct net_device *dev)
1307c5441932SPravin B Shelar {
1308c5441932SPravin B Shelar struct ip_tunnel *tunnel = netdev_priv(dev);
13096c742e71SNicolas Dichtel struct net *net = tunnel->net;
1310c5441932SPravin B Shelar struct ip_tunnel_net *itn;
1311c5441932SPravin B Shelar
1312c5441932SPravin B Shelar itn = net_generic(net, tunnel->ip_tnl_net_id);
13132e15ea39SPravin B Shelar ip_tunnel_del(itn, netdev_priv(dev));
1314ba61539cSTaehee Yoo if (itn->fb_tunnel_dev == dev)
1315ba61539cSTaehee Yoo WRITE_ONCE(itn->fb_tunnel_dev, NULL);
13167d442fabSTom Herbert
1317e09acddfSPaolo Abeni dst_cache_reset(&tunnel->dst_cache);
1318c5441932SPravin B Shelar }
1319c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_uninit);
1320c5441932SPravin B Shelar
1321c5441932SPravin B Shelar /* Do least required initialization, rest of init is done in tunnel_init call */
ip_tunnel_setup(struct net_device * dev,unsigned int net_id)1322c7d03a00SAlexey Dobriyan void ip_tunnel_setup(struct net_device *dev, unsigned int net_id)
1323c5441932SPravin B Shelar {
1324c5441932SPravin B Shelar struct ip_tunnel *tunnel = netdev_priv(dev);
1325c5441932SPravin B Shelar tunnel->ip_tnl_net_id = net_id;
1326c5441932SPravin B Shelar }
1327c5441932SPravin B Shelar EXPORT_SYMBOL_GPL(ip_tunnel_setup);
1328c5441932SPravin B Shelar
1329c5441932SPravin B Shelar MODULE_LICENSE("GPL");
1330