xref: /openbmc/linux/include/net/ip_tunnels.h (revision 376534a3)
1c5441932SPravin B Shelar #ifndef __NET_IP_TUNNELS_H
2c5441932SPravin B Shelar #define __NET_IP_TUNNELS_H 1
3c5441932SPravin B Shelar 
4c5441932SPravin B Shelar #include <linux/if_tunnel.h>
5c5441932SPravin B Shelar #include <linux/netdevice.h>
6c5441932SPravin B Shelar #include <linux/skbuff.h>
7c5441932SPravin B Shelar #include <linux/types.h>
8c5441932SPravin B Shelar #include <linux/u64_stats_sync.h>
9c5441932SPravin B Shelar #include <net/dsfield.h>
10c5441932SPravin B Shelar #include <net/gro_cells.h>
11c5441932SPravin B Shelar #include <net/inet_ecn.h>
1256328486STom Herbert #include <net/netns/generic.h>
13c5441932SPravin B Shelar #include <net/rtnetlink.h>
143093fbe7SThomas Graf #include <net/lwtunnel.h>
15c5441932SPravin B Shelar 
16c5441932SPravin B Shelar #if IS_ENABLED(CONFIG_IPV6)
17c5441932SPravin B Shelar #include <net/ipv6.h>
18c5441932SPravin B Shelar #include <net/ip6_fib.h>
19c5441932SPravin B Shelar #include <net/ip6_route.h>
20c5441932SPravin B Shelar #endif
21c5441932SPravin B Shelar 
22c5441932SPravin B Shelar /* Keep error state on tunnel for 30 sec */
23c5441932SPravin B Shelar #define IPTUNNEL_ERR_TIMEO	(30*HZ)
24c5441932SPravin B Shelar 
251d8fff90SThomas Graf /* Used to memset ip_tunnel padding. */
26376534a3SJiri Benc #define IP_TUNNEL_KEY_SIZE	offsetofend(struct ip_tunnel_key, tp_dst)
271d8fff90SThomas Graf 
281d8fff90SThomas Graf struct ip_tunnel_key {
291d8fff90SThomas Graf 	__be64			tun_id;
301d8fff90SThomas Graf 	__be32			ipv4_src;
311d8fff90SThomas Graf 	__be32			ipv4_dst;
321d8fff90SThomas Graf 	__be16			tun_flags;
336b8847c5SJiri Benc 	u8			ipv4_tos;
346b8847c5SJiri Benc 	u8			ipv4_ttl;
351d8fff90SThomas Graf 	__be16			tp_src;
361d8fff90SThomas Graf 	__be16			tp_dst;
37ac1cf399SJiri Benc };
381d8fff90SThomas Graf 
39ee122c79SThomas Graf /* Indicates whether the tunnel info structure represents receive
40ee122c79SThomas Graf  * or transmit tunnel parameters.
41ee122c79SThomas Graf  */
42ee122c79SThomas Graf enum {
43ee122c79SThomas Graf 	IP_TUNNEL_INFO_RX,
44ee122c79SThomas Graf 	IP_TUNNEL_INFO_TX,
45ee122c79SThomas Graf };
46ee122c79SThomas Graf 
471d8fff90SThomas Graf struct ip_tunnel_info {
481d8fff90SThomas Graf 	struct ip_tunnel_key	key;
491d8fff90SThomas Graf 	const void		*options;
501d8fff90SThomas Graf 	u8			options_len;
51ee122c79SThomas Graf 	u8			mode;
521d8fff90SThomas Graf };
531d8fff90SThomas Graf 
54c5441932SPravin B Shelar /* 6rd prefix/relay information */
55c5441932SPravin B Shelar #ifdef CONFIG_IPV6_SIT_6RD
56c5441932SPravin B Shelar struct ip_tunnel_6rd_parm {
57c5441932SPravin B Shelar 	struct in6_addr		prefix;
58c5441932SPravin B Shelar 	__be32			relay_prefix;
59c5441932SPravin B Shelar 	u16			prefixlen;
60c5441932SPravin B Shelar 	u16			relay_prefixlen;
61c5441932SPravin B Shelar };
62c5441932SPravin B Shelar #endif
63c5441932SPravin B Shelar 
6456328486STom Herbert struct ip_tunnel_encap {
656b8847c5SJiri Benc 	u16			type;
666b8847c5SJiri Benc 	u16			flags;
6756328486STom Herbert 	__be16			sport;
6856328486STom Herbert 	__be16			dport;
6956328486STom Herbert };
7056328486STom Herbert 
71c5441932SPravin B Shelar struct ip_tunnel_prl_entry {
72c5441932SPravin B Shelar 	struct ip_tunnel_prl_entry __rcu *next;
73c5441932SPravin B Shelar 	__be32				addr;
74c5441932SPravin B Shelar 	u16				flags;
75c5441932SPravin B Shelar 	struct rcu_head			rcu_head;
76c5441932SPravin B Shelar };
77c5441932SPravin B Shelar 
789a4aa9afSTom Herbert struct ip_tunnel_dst {
799a4aa9afSTom Herbert 	struct dst_entry __rcu 		*dst;
8095cb5745SDmitry Popov 	__be32				 saddr;
819a4aa9afSTom Herbert };
829a4aa9afSTom Herbert 
832e15ea39SPravin B Shelar struct metadata_dst;
842e15ea39SPravin B Shelar 
85c5441932SPravin B Shelar struct ip_tunnel {
86c5441932SPravin B Shelar 	struct ip_tunnel __rcu	*next;
87c5441932SPravin B Shelar 	struct hlist_node hash_node;
88c5441932SPravin B Shelar 	struct net_device	*dev;
895e6700b3SNicolas Dichtel 	struct net		*net;	/* netns for packet i/o */
90c5441932SPravin B Shelar 
91c5441932SPravin B Shelar 	int		err_count;	/* Number of arrived ICMP errors */
92c5441932SPravin B Shelar 	unsigned long	err_time;	/* Time when the last ICMP error
93c5441932SPravin B Shelar 					 * arrived */
94c5441932SPravin B Shelar 
95c5441932SPravin B Shelar 	/* These four fields used only by GRE */
966b8847c5SJiri Benc 	u32		i_seqno;	/* The last seen seqno	*/
976b8847c5SJiri Benc 	u32		o_seqno;	/* The last output seqno */
9856328486STom Herbert 	int		tun_hlen;	/* Precalculated header length */
99c5441932SPravin B Shelar 	int		mlink;
100c5441932SPravin B Shelar 
1019a4aa9afSTom Herbert 	struct ip_tunnel_dst __percpu *dst_cache;
1027d442fabSTom Herbert 
103c5441932SPravin B Shelar 	struct ip_tunnel_parm parms;
104c5441932SPravin B Shelar 
10556328486STom Herbert 	int		encap_hlen;	/* Encap header length (FOU,GUE) */
10656328486STom Herbert 	struct ip_tunnel_encap encap;
10756328486STom Herbert 
10856328486STom Herbert 	int		hlen;		/* tun_hlen + encap_hlen */
10956328486STom Herbert 
110c5441932SPravin B Shelar 	/* for SIT */
111c5441932SPravin B Shelar #ifdef CONFIG_IPV6_SIT_6RD
112c5441932SPravin B Shelar 	struct ip_tunnel_6rd_parm ip6rd;
113c5441932SPravin B Shelar #endif
114c5441932SPravin B Shelar 	struct ip_tunnel_prl_entry __rcu *prl;	/* potential router list */
115c5441932SPravin B Shelar 	unsigned int		prl_count;	/* # of entries in PRL */
116c5441932SPravin B Shelar 	int			ip_tnl_net_id;
117c5441932SPravin B Shelar 	struct gro_cells	gro_cells;
1182e15ea39SPravin B Shelar 	bool			collect_md;
119c5441932SPravin B Shelar };
120c5441932SPravin B Shelar 
121c5441932SPravin B Shelar #define TUNNEL_CSUM		__cpu_to_be16(0x01)
122c5441932SPravin B Shelar #define TUNNEL_ROUTING		__cpu_to_be16(0x02)
123c5441932SPravin B Shelar #define TUNNEL_KEY		__cpu_to_be16(0x04)
124c5441932SPravin B Shelar #define TUNNEL_SEQ		__cpu_to_be16(0x08)
125c5441932SPravin B Shelar #define TUNNEL_STRICT		__cpu_to_be16(0x10)
126c5441932SPravin B Shelar #define TUNNEL_REC		__cpu_to_be16(0x20)
127c5441932SPravin B Shelar #define TUNNEL_VERSION		__cpu_to_be16(0x40)
128c5441932SPravin B Shelar #define TUNNEL_NO_KEY		__cpu_to_be16(0x80)
1299a628224SPravin B Shelar #define TUNNEL_DONT_FRAGMENT    __cpu_to_be16(0x0100)
1300b5e8b8eSAndy Zhou #define TUNNEL_OAM		__cpu_to_be16(0x0200)
1310b5e8b8eSAndy Zhou #define TUNNEL_CRIT_OPT		__cpu_to_be16(0x0400)
1321dd144cfSThomas Graf #define TUNNEL_GENEVE_OPT	__cpu_to_be16(0x0800)
1331dd144cfSThomas Graf #define TUNNEL_VXLAN_OPT	__cpu_to_be16(0x1000)
1341dd144cfSThomas Graf 
1351dd144cfSThomas Graf #define TUNNEL_OPTIONS_PRESENT	(TUNNEL_GENEVE_OPT | TUNNEL_VXLAN_OPT)
136c5441932SPravin B Shelar 
137c5441932SPravin B Shelar struct tnl_ptk_info {
138c5441932SPravin B Shelar 	__be16 flags;
139c5441932SPravin B Shelar 	__be16 proto;
140c5441932SPravin B Shelar 	__be32 key;
141c5441932SPravin B Shelar 	__be32 seq;
142c5441932SPravin B Shelar };
143c5441932SPravin B Shelar 
144c5441932SPravin B Shelar #define PACKET_RCVD	0
145c5441932SPravin B Shelar #define PACKET_REJECT	1
146c5441932SPravin B Shelar 
1476261d983Sstephen hemminger #define IP_TNL_HASH_BITS   7
148c5441932SPravin B Shelar #define IP_TNL_HASH_SIZE   (1 << IP_TNL_HASH_BITS)
149c5441932SPravin B Shelar 
150c5441932SPravin B Shelar struct ip_tunnel_net {
151c5441932SPravin B Shelar 	struct net_device *fb_tunnel_dev;
1526261d983Sstephen hemminger 	struct hlist_head tunnels[IP_TNL_HASH_SIZE];
1532e15ea39SPravin B Shelar 	struct ip_tunnel __rcu *collect_md_tun;
154c5441932SPravin B Shelar };
155c5441932SPravin B Shelar 
156a8c5f90fSTom Herbert struct ip_tunnel_encap_ops {
157a8c5f90fSTom Herbert 	size_t (*encap_hlen)(struct ip_tunnel_encap *e);
158a8c5f90fSTom Herbert 	int (*build_header)(struct sk_buff *skb, struct ip_tunnel_encap *e,
159a8c5f90fSTom Herbert 			    u8 *protocol, struct flowi4 *fl4);
160a8c5f90fSTom Herbert };
161a8c5f90fSTom Herbert 
162a8c5f90fSTom Herbert #define MAX_IPTUN_ENCAP_OPS 8
163a8c5f90fSTom Herbert 
164a8c5f90fSTom Herbert extern const struct ip_tunnel_encap_ops __rcu *
165a8c5f90fSTom Herbert 		iptun_encaps[MAX_IPTUN_ENCAP_OPS];
166a8c5f90fSTom Herbert 
167a8c5f90fSTom Herbert int ip_tunnel_encap_add_ops(const struct ip_tunnel_encap_ops *op,
168a8c5f90fSTom Herbert 			    unsigned int num);
169a8c5f90fSTom Herbert int ip_tunnel_encap_del_ops(const struct ip_tunnel_encap_ops *op,
170a8c5f90fSTom Herbert 			    unsigned int num);
171a8c5f90fSTom Herbert 
1721d8fff90SThomas Graf static inline void __ip_tunnel_info_init(struct ip_tunnel_info *tun_info,
1731d8fff90SThomas Graf 					 __be32 saddr, __be32 daddr,
1741d8fff90SThomas Graf 					 u8 tos, u8 ttl,
1751d8fff90SThomas Graf 					 __be16 tp_src, __be16 tp_dst,
1761d8fff90SThomas Graf 					 __be64 tun_id, __be16 tun_flags,
1771d8fff90SThomas Graf 					 const void *opts, u8 opts_len)
1781d8fff90SThomas Graf {
1791d8fff90SThomas Graf 	tun_info->key.tun_id = tun_id;
1801d8fff90SThomas Graf 	tun_info->key.ipv4_src = saddr;
1811d8fff90SThomas Graf 	tun_info->key.ipv4_dst = daddr;
1821d8fff90SThomas Graf 	tun_info->key.ipv4_tos = tos;
1831d8fff90SThomas Graf 	tun_info->key.ipv4_ttl = ttl;
1841d8fff90SThomas Graf 	tun_info->key.tun_flags = tun_flags;
1851d8fff90SThomas Graf 
1861d8fff90SThomas Graf 	/* For the tunnel types on the top of IPsec, the tp_src and tp_dst of
1871d8fff90SThomas Graf 	 * the upper tunnel are used.
1881d8fff90SThomas Graf 	 * E.g: GRE over IPSEC, the tp_src and tp_port are zero.
1891d8fff90SThomas Graf 	 */
1901d8fff90SThomas Graf 	tun_info->key.tp_src = tp_src;
1911d8fff90SThomas Graf 	tun_info->key.tp_dst = tp_dst;
1921d8fff90SThomas Graf 
1931d8fff90SThomas Graf 	/* Clear struct padding. */
1941d8fff90SThomas Graf 	if (sizeof(tun_info->key) != IP_TUNNEL_KEY_SIZE)
1951d8fff90SThomas Graf 		memset((unsigned char *)&tun_info->key + IP_TUNNEL_KEY_SIZE,
1961d8fff90SThomas Graf 		       0, sizeof(tun_info->key) - IP_TUNNEL_KEY_SIZE);
1971d8fff90SThomas Graf 
1981d8fff90SThomas Graf 	tun_info->options = opts;
1991d8fff90SThomas Graf 	tun_info->options_len = opts_len;
2001d8fff90SThomas Graf }
2011d8fff90SThomas Graf 
2021d8fff90SThomas Graf static inline void ip_tunnel_info_init(struct ip_tunnel_info *tun_info,
2031d8fff90SThomas Graf 				       const struct iphdr *iph,
2041d8fff90SThomas Graf 				       __be16 tp_src, __be16 tp_dst,
2051d8fff90SThomas Graf 				       __be64 tun_id, __be16 tun_flags,
2061d8fff90SThomas Graf 				       const void *opts, u8 opts_len)
2071d8fff90SThomas Graf {
2081d8fff90SThomas Graf 	__ip_tunnel_info_init(tun_info, iph->saddr, iph->daddr,
2091d8fff90SThomas Graf 			      iph->tos, iph->ttl, tp_src, tp_dst,
2101d8fff90SThomas Graf 			      tun_id, tun_flags, opts, opts_len);
2111d8fff90SThomas Graf }
2121d8fff90SThomas Graf 
2135243b6acSJesse Gross #ifdef CONFIG_INET
2145243b6acSJesse Gross 
215c5441932SPravin B Shelar int ip_tunnel_init(struct net_device *dev);
216c5441932SPravin B Shelar void ip_tunnel_uninit(struct net_device *dev);
217c5441932SPravin B Shelar void  ip_tunnel_dellink(struct net_device *dev, struct list_head *head);
2181728d4faSNicolas Dichtel struct net *ip_tunnel_get_link_net(const struct net_device *dev);
2191e99584bSNicolas Dichtel int ip_tunnel_get_iflink(const struct net_device *dev);
220d3b6f614SEric Dumazet int ip_tunnel_init_net(struct net *net, int ip_tnl_net_id,
221c5441932SPravin B Shelar 		       struct rtnl_link_ops *ops, char *devname);
222c5441932SPravin B Shelar 
2236c742e71SNicolas Dichtel void ip_tunnel_delete_net(struct ip_tunnel_net *itn, struct rtnl_link_ops *ops);
224c5441932SPravin B Shelar 
225c5441932SPravin B Shelar void ip_tunnel_xmit(struct sk_buff *skb, struct net_device *dev,
226bf3d6a8fSNicolas Dichtel 		    const struct iphdr *tnl_params, const u8 protocol);
227c5441932SPravin B Shelar int ip_tunnel_ioctl(struct net_device *dev, struct ip_tunnel_parm *p, int cmd);
22856328486STom Herbert int ip_tunnel_encap(struct sk_buff *skb, struct ip_tunnel *t,
22956328486STom Herbert 		    u8 *protocol, struct flowi4 *fl4);
230c5441932SPravin B Shelar int ip_tunnel_change_mtu(struct net_device *dev, int new_mtu);
231c5441932SPravin B Shelar 
232c5441932SPravin B Shelar struct rtnl_link_stats64 *ip_tunnel_get_stats64(struct net_device *dev,
233c5441932SPravin B Shelar 						struct rtnl_link_stats64 *tot);
234c5441932SPravin B Shelar struct ip_tunnel *ip_tunnel_lookup(struct ip_tunnel_net *itn,
235c5441932SPravin B Shelar 				   int link, __be16 flags,
236c5441932SPravin B Shelar 				   __be32 remote, __be32 local,
237c5441932SPravin B Shelar 				   __be32 key);
238c5441932SPravin B Shelar 
239c5441932SPravin B Shelar int ip_tunnel_rcv(struct ip_tunnel *tunnel, struct sk_buff *skb,
2402e15ea39SPravin B Shelar 		  const struct tnl_ptk_info *tpi, struct metadata_dst *tun_dst,
2412e15ea39SPravin B Shelar 		  bool log_ecn_error);
242c5441932SPravin B Shelar int ip_tunnel_changelink(struct net_device *dev, struct nlattr *tb[],
243c5441932SPravin B Shelar 			 struct ip_tunnel_parm *p);
244c5441932SPravin B Shelar int ip_tunnel_newlink(struct net_device *dev, struct nlattr *tb[],
245c5441932SPravin B Shelar 		      struct ip_tunnel_parm *p);
246c5441932SPravin B Shelar void ip_tunnel_setup(struct net_device *dev, int net_id);
247cf71d2bcSNicolas Dichtel void ip_tunnel_dst_reset_all(struct ip_tunnel *t);
24856328486STom Herbert int ip_tunnel_encap_setup(struct ip_tunnel *t,
24956328486STom Herbert 			  struct ip_tunnel_encap *ipencap);
250c5441932SPravin B Shelar 
251c5441932SPravin B Shelar /* Extract dsfield from inner protocol */
252c5441932SPravin B Shelar static inline u8 ip_tunnel_get_dsfield(const struct iphdr *iph,
253c5441932SPravin B Shelar 				       const struct sk_buff *skb)
254c5441932SPravin B Shelar {
255c5441932SPravin B Shelar 	if (skb->protocol == htons(ETH_P_IP))
256c5441932SPravin B Shelar 		return iph->tos;
257c5441932SPravin B Shelar 	else if (skb->protocol == htons(ETH_P_IPV6))
258c5441932SPravin B Shelar 		return ipv6_get_dsfield((const struct ipv6hdr *)iph);
259c5441932SPravin B Shelar 	else
260c5441932SPravin B Shelar 		return 0;
261c5441932SPravin B Shelar }
262c5441932SPravin B Shelar 
263c5441932SPravin B Shelar /* Propogate ECN bits out */
264c5441932SPravin B Shelar static inline u8 ip_tunnel_ecn_encap(u8 tos, const struct iphdr *iph,
265c5441932SPravin B Shelar 				     const struct sk_buff *skb)
266c5441932SPravin B Shelar {
267c5441932SPravin B Shelar 	u8 inner = ip_tunnel_get_dsfield(iph, skb);
268c5441932SPravin B Shelar 
269c5441932SPravin B Shelar 	return INET_ECN_encapsulate(tos, inner);
270c5441932SPravin B Shelar }
271c5441932SPravin B Shelar 
2723d7b46cdSPravin B Shelar int iptunnel_pull_header(struct sk_buff *skb, int hdr_len, __be16 inner_proto);
273aad88724SEric Dumazet int iptunnel_xmit(struct sock *sk, struct rtable *rt, struct sk_buff *skb,
2746b8847c5SJiri Benc 		  __be32 src, __be32 dst, u8 proto,
2756b8847c5SJiri Benc 		  u8 tos, u8 ttl, __be16 df, bool xnet);
2760e6fbc5bSPravin B Shelar 
2772d26f0a3SEric Dumazet struct sk_buff *iptunnel_handle_offloads(struct sk_buff *skb, bool gre_csum,
2782d26f0a3SEric Dumazet 					 int gso_type_mask);
2792d26f0a3SEric Dumazet 
2800e6fbc5bSPravin B Shelar static inline void iptunnel_xmit_stats(int err,
2810e6fbc5bSPravin B Shelar 				       struct net_device_stats *err_stats,
2828f84985fSLi RongQing 				       struct pcpu_sw_netstats __percpu *stats)
283c5441932SPravin B Shelar {
2840e6fbc5bSPravin B Shelar 	if (err > 0) {
2858f84985fSLi RongQing 		struct pcpu_sw_netstats *tstats = this_cpu_ptr(stats);
286c5441932SPravin B Shelar 
287c5441932SPravin B Shelar 		u64_stats_update_begin(&tstats->syncp);
2880e6fbc5bSPravin B Shelar 		tstats->tx_bytes += err;
289c5441932SPravin B Shelar 		tstats->tx_packets++;
290c5441932SPravin B Shelar 		u64_stats_update_end(&tstats->syncp);
2910e6fbc5bSPravin B Shelar 	} else if (err < 0) {
2920e6fbc5bSPravin B Shelar 		err_stats->tx_errors++;
2930e6fbc5bSPravin B Shelar 		err_stats->tx_aborted_errors++;
294c5441932SPravin B Shelar 	} else {
2950e6fbc5bSPravin B Shelar 		err_stats->tx_dropped++;
296c5441932SPravin B Shelar 	}
297c5441932SPravin B Shelar }
2985243b6acSJesse Gross 
299ee122c79SThomas Graf static inline void *ip_tunnel_info_opts(struct ip_tunnel_info *info, size_t n)
300ee122c79SThomas Graf {
301ee122c79SThomas Graf 	return info + 1;
302ee122c79SThomas Graf }
303ee122c79SThomas Graf 
3043093fbe7SThomas Graf static inline struct ip_tunnel_info *lwt_tun_info(struct lwtunnel_state *lwtstate)
3053093fbe7SThomas Graf {
3063093fbe7SThomas Graf 	return (struct ip_tunnel_info *)lwtstate->data;
3073093fbe7SThomas Graf }
3083093fbe7SThomas Graf 
309e7030878SThomas Graf extern struct static_key ip_tunnel_metadata_cnt;
310e7030878SThomas Graf 
311e7030878SThomas Graf /* Returns > 0 if metadata should be collected */
312e7030878SThomas Graf static inline int ip_tunnel_collect_metadata(void)
313e7030878SThomas Graf {
314e7030878SThomas Graf 	return static_key_false(&ip_tunnel_metadata_cnt);
315e7030878SThomas Graf }
316e7030878SThomas Graf 
317045a0fa0SThomas Graf void __init ip_tunnel_core_init(void);
318045a0fa0SThomas Graf 
319e7030878SThomas Graf void ip_tunnel_need_metadata(void);
320e7030878SThomas Graf void ip_tunnel_unneed_metadata(void);
321e7030878SThomas Graf 
32205283187SThomas Graf #else /* CONFIG_INET */
32305283187SThomas Graf 
32405283187SThomas Graf static inline struct ip_tunnel_info *lwt_tun_info(struct lwtunnel_state *lwtstate)
32505283187SThomas Graf {
32605283187SThomas Graf 	return NULL;
32705283187SThomas Graf }
32805283187SThomas Graf 
32905283187SThomas Graf static inline void ip_tunnel_need_metadata(void)
33005283187SThomas Graf {
33105283187SThomas Graf }
33205283187SThomas Graf 
33305283187SThomas Graf static inline void ip_tunnel_unneed_metadata(void)
33405283187SThomas Graf {
33505283187SThomas Graf }
33605283187SThomas Graf 
3375243b6acSJesse Gross #endif /* CONFIG_INET */
3385243b6acSJesse Gross 
339c5441932SPravin B Shelar #endif /* __NET_IP_TUNNELS_H */
340