xref: /openbmc/linux/net/ipv6/seg6_iptunnel.c (revision 0f9b4c3ca5fdf3e177266ef994071b1a03f07318)
12874c5fdSThomas Gleixner // SPDX-License-Identifier: GPL-2.0-or-later
26c8702c6SDavid Lebrun /*
36c8702c6SDavid Lebrun  *  SR-IPv6 implementation
46c8702c6SDavid Lebrun  *
56c8702c6SDavid Lebrun  *  Author:
66c8702c6SDavid Lebrun  *  David Lebrun <david.lebrun@uclouvain.be>
76c8702c6SDavid Lebrun  */
86c8702c6SDavid Lebrun 
96c8702c6SDavid Lebrun #include <linux/types.h>
106c8702c6SDavid Lebrun #include <linux/skbuff.h>
116c8702c6SDavid Lebrun #include <linux/net.h>
126c8702c6SDavid Lebrun #include <linux/module.h>
136c8702c6SDavid Lebrun #include <net/ip.h>
145807b22cSDavid Lebrun #include <net/ip_tunnels.h>
156c8702c6SDavid Lebrun #include <net/lwtunnel.h>
166c8702c6SDavid Lebrun #include <net/netevent.h>
176c8702c6SDavid Lebrun #include <net/netns/generic.h>
186c8702c6SDavid Lebrun #include <net/ip6_fib.h>
196c8702c6SDavid Lebrun #include <net/route.h>
206c8702c6SDavid Lebrun #include <net/seg6.h>
216c8702c6SDavid Lebrun #include <linux/seg6.h>
226c8702c6SDavid Lebrun #include <linux/seg6_iptunnel.h>
236c8702c6SDavid Lebrun #include <net/addrconf.h>
246c8702c6SDavid Lebrun #include <net/ip6_route.h>
256c8702c6SDavid Lebrun #include <net/dst_cache.h>
269baee834SDavid Lebrun #ifdef CONFIG_IPV6_SEG6_HMAC
279baee834SDavid Lebrun #include <net/seg6_hmac.h>
289baee834SDavid Lebrun #endif
297a3f5b0dSRyoga Saito #include <linux/netfilter.h>
306c8702c6SDavid Lebrun 
seg6_lwt_headroom(struct seg6_iptunnel_encap * tuninfo)3188fab21cSIoana-Ruxandra Stăncioi static size_t seg6_lwt_headroom(struct seg6_iptunnel_encap *tuninfo)
3288fab21cSIoana-Ruxandra Stăncioi {
3388fab21cSIoana-Ruxandra Stăncioi 	int head = 0;
3488fab21cSIoana-Ruxandra Stăncioi 
3588fab21cSIoana-Ruxandra Stăncioi 	switch (tuninfo->mode) {
3688fab21cSIoana-Ruxandra Stăncioi 	case SEG6_IPTUN_MODE_INLINE:
3788fab21cSIoana-Ruxandra Stăncioi 		break;
3888fab21cSIoana-Ruxandra Stăncioi 	case SEG6_IPTUN_MODE_ENCAP:
39b07c8cdbSAndrea Mayer 	case SEG6_IPTUN_MODE_ENCAP_RED:
4088fab21cSIoana-Ruxandra Stăncioi 		head = sizeof(struct ipv6hdr);
4188fab21cSIoana-Ruxandra Stăncioi 		break;
4288fab21cSIoana-Ruxandra Stăncioi 	case SEG6_IPTUN_MODE_L2ENCAP:
4313f0296bSAndrea Mayer 	case SEG6_IPTUN_MODE_L2ENCAP_RED:
4488fab21cSIoana-Ruxandra Stăncioi 		return 0;
4588fab21cSIoana-Ruxandra Stăncioi 	}
4688fab21cSIoana-Ruxandra Stăncioi 
4788fab21cSIoana-Ruxandra Stăncioi 	return ((tuninfo->srh->hdrlen + 1) << 3) + head;
4888fab21cSIoana-Ruxandra Stăncioi }
4988fab21cSIoana-Ruxandra Stăncioi 
506c8702c6SDavid Lebrun struct seg6_lwt {
516c8702c6SDavid Lebrun 	struct dst_cache cache;
52b0c9a2d9SGustavo A. R. Silva 	struct seg6_iptunnel_encap tuninfo[];
536c8702c6SDavid Lebrun };
546c8702c6SDavid Lebrun 
seg6_lwt_lwtunnel(struct lwtunnel_state * lwt)556c8702c6SDavid Lebrun static inline struct seg6_lwt *seg6_lwt_lwtunnel(struct lwtunnel_state *lwt)
566c8702c6SDavid Lebrun {
576c8702c6SDavid Lebrun 	return (struct seg6_lwt *)lwt->data;
586c8702c6SDavid Lebrun }
596c8702c6SDavid Lebrun 
606c8702c6SDavid Lebrun static inline struct seg6_iptunnel_encap *
seg6_encap_lwtunnel(struct lwtunnel_state * lwt)616c8702c6SDavid Lebrun seg6_encap_lwtunnel(struct lwtunnel_state *lwt)
626c8702c6SDavid Lebrun {
636c8702c6SDavid Lebrun 	return seg6_lwt_lwtunnel(lwt)->tuninfo;
646c8702c6SDavid Lebrun }
656c8702c6SDavid Lebrun 
666c8702c6SDavid Lebrun static const struct nla_policy seg6_iptunnel_policy[SEG6_IPTUNNEL_MAX + 1] = {
676c8702c6SDavid Lebrun 	[SEG6_IPTUNNEL_SRH]	= { .type = NLA_BINARY },
686c8702c6SDavid Lebrun };
696c8702c6SDavid Lebrun 
nla_put_srh(struct sk_buff * skb,int attrtype,struct seg6_iptunnel_encap * tuninfo)70bb4005baSWei Yongjun static int nla_put_srh(struct sk_buff *skb, int attrtype,
716c8702c6SDavid Lebrun 		       struct seg6_iptunnel_encap *tuninfo)
726c8702c6SDavid Lebrun {
736c8702c6SDavid Lebrun 	struct seg6_iptunnel_encap *data;
746c8702c6SDavid Lebrun 	struct nlattr *nla;
756c8702c6SDavid Lebrun 	int len;
766c8702c6SDavid Lebrun 
776c8702c6SDavid Lebrun 	len = SEG6_IPTUN_ENCAP_SIZE(tuninfo);
786c8702c6SDavid Lebrun 
796c8702c6SDavid Lebrun 	nla = nla_reserve(skb, attrtype, len);
806c8702c6SDavid Lebrun 	if (!nla)
816c8702c6SDavid Lebrun 		return -EMSGSIZE;
826c8702c6SDavid Lebrun 
836c8702c6SDavid Lebrun 	data = nla_data(nla);
846c8702c6SDavid Lebrun 	memcpy(data, tuninfo, len);
856c8702c6SDavid Lebrun 
866c8702c6SDavid Lebrun 	return 0;
876c8702c6SDavid Lebrun }
886c8702c6SDavid Lebrun 
set_tun_src(struct net * net,struct net_device * dev,struct in6_addr * daddr,struct in6_addr * saddr)896c8702c6SDavid Lebrun static void set_tun_src(struct net *net, struct net_device *dev,
906c8702c6SDavid Lebrun 			struct in6_addr *daddr, struct in6_addr *saddr)
916c8702c6SDavid Lebrun {
926c8702c6SDavid Lebrun 	struct seg6_pernet_data *sdata = seg6_pernet(net);
936c8702c6SDavid Lebrun 	struct in6_addr *tun_src;
946c8702c6SDavid Lebrun 
956c8702c6SDavid Lebrun 	rcu_read_lock();
966c8702c6SDavid Lebrun 
976c8702c6SDavid Lebrun 	tun_src = rcu_dereference(sdata->tun_src);
986c8702c6SDavid Lebrun 
996c8702c6SDavid Lebrun 	if (!ipv6_addr_any(tun_src)) {
1006c8702c6SDavid Lebrun 		memcpy(saddr, tun_src, sizeof(struct in6_addr));
1016c8702c6SDavid Lebrun 	} else {
1026c8702c6SDavid Lebrun 		ipv6_dev_get_saddr(net, dev, daddr, IPV6_PREFER_SRC_PUBLIC,
1036c8702c6SDavid Lebrun 				   saddr);
1046c8702c6SDavid Lebrun 	}
1056c8702c6SDavid Lebrun 
1066c8702c6SDavid Lebrun 	rcu_read_unlock();
1076c8702c6SDavid Lebrun }
1086c8702c6SDavid Lebrun 
109b5facfdbSAhmed Abdelsalam /* Compute flowlabel for outer IPv6 header */
seg6_make_flowlabel(struct net * net,struct sk_buff * skb,struct ipv6hdr * inner_hdr)110b5facfdbSAhmed Abdelsalam static __be32 seg6_make_flowlabel(struct net *net, struct sk_buff *skb,
111b5facfdbSAhmed Abdelsalam 				  struct ipv6hdr *inner_hdr)
112b5facfdbSAhmed Abdelsalam {
113b5facfdbSAhmed Abdelsalam 	int do_flowlabel = net->ipv6.sysctl.seg6_flowlabel;
114b5facfdbSAhmed Abdelsalam 	__be32 flowlabel = 0;
115b5facfdbSAhmed Abdelsalam 	u32 hash;
116b5facfdbSAhmed Abdelsalam 
117b5facfdbSAhmed Abdelsalam 	if (do_flowlabel > 0) {
118b5facfdbSAhmed Abdelsalam 		hash = skb_get_hash(skb);
1193ee593adSColin Ian King 		hash = rol32(hash, 16);
120b5facfdbSAhmed Abdelsalam 		flowlabel = (__force __be32)hash & IPV6_FLOWLABEL_MASK;
121b5facfdbSAhmed Abdelsalam 	} else if (!do_flowlabel && skb->protocol == htons(ETH_P_IPV6)) {
122b5facfdbSAhmed Abdelsalam 		flowlabel = ip6_flowlabel(inner_hdr);
123b5facfdbSAhmed Abdelsalam 	}
124b5facfdbSAhmed Abdelsalam 	return flowlabel;
125b5facfdbSAhmed Abdelsalam }
126b5facfdbSAhmed Abdelsalam 
__seg6_do_srh_encap(struct sk_buff * skb,struct ipv6_sr_hdr * osrh,int proto,struct dst_entry * cache_dst)127ab9de9c4SJustin Iurman static int __seg6_do_srh_encap(struct sk_buff *skb, struct ipv6_sr_hdr *osrh,
128ab9de9c4SJustin Iurman 			       int proto, struct dst_entry *cache_dst)
1296c8702c6SDavid Lebrun {
1308936ef76SDavid Lebrun 	struct dst_entry *dst = skb_dst(skb);
1318936ef76SDavid Lebrun 	struct net *net = dev_net(dst->dev);
1326c8702c6SDavid Lebrun 	struct ipv6hdr *hdr, *inner_hdr;
1336c8702c6SDavid Lebrun 	struct ipv6_sr_hdr *isrh;
1346c8702c6SDavid Lebrun 	int hdrlen, tot_len, err;
135b5facfdbSAhmed Abdelsalam 	__be32 flowlabel;
1366c8702c6SDavid Lebrun 
1376c8702c6SDavid Lebrun 	hdrlen = (osrh->hdrlen + 1) << 3;
1386c8702c6SDavid Lebrun 	tot_len = hdrlen + sizeof(*hdr);
1396c8702c6SDavid Lebrun 
140ab9de9c4SJustin Iurman 	err = skb_cow_head(skb, tot_len + dst_dev_overhead(cache_dst, skb));
1416c8702c6SDavid Lebrun 	if (unlikely(err))
1426c8702c6SDavid Lebrun 		return err;
1436c8702c6SDavid Lebrun 
1446c8702c6SDavid Lebrun 	inner_hdr = ipv6_hdr(skb);
1456df93462SAhmed Abdelsalam 	flowlabel = seg6_make_flowlabel(net, skb, inner_hdr);
1466c8702c6SDavid Lebrun 
1476c8702c6SDavid Lebrun 	skb_push(skb, tot_len);
1486c8702c6SDavid Lebrun 	skb_reset_network_header(skb);
1496c8702c6SDavid Lebrun 	skb_mac_header_rebuild(skb);
1506c8702c6SDavid Lebrun 	hdr = ipv6_hdr(skb);
1516c8702c6SDavid Lebrun 
1526c8702c6SDavid Lebrun 	/* inherit tc, flowlabel and hlim
1536c8702c6SDavid Lebrun 	 * hlim will be decremented in ip6_forward() afterwards and
1546c8702c6SDavid Lebrun 	 * decapsulation will overwrite inner hlim with outer hlim
1556c8702c6SDavid Lebrun 	 */
15632d99d0bSDavid Lebrun 
15732d99d0bSDavid Lebrun 	if (skb->protocol == htons(ETH_P_IPV6)) {
1586c8702c6SDavid Lebrun 		ip6_flow_hdr(hdr, ip6_tclass(ip6_flowinfo(inner_hdr)),
159b5facfdbSAhmed Abdelsalam 			     flowlabel);
1606c8702c6SDavid Lebrun 		hdr->hop_limit = inner_hdr->hop_limit;
16132d99d0bSDavid Lebrun 	} else {
162b5facfdbSAhmed Abdelsalam 		ip6_flow_hdr(hdr, 0, flowlabel);
16332d99d0bSDavid Lebrun 		hdr->hop_limit = ip6_dst_hoplimit(skb_dst(skb));
164ef489749SYohei Kanemaru 
165ef489749SYohei Kanemaru 		memset(IP6CB(skb), 0, sizeof(*IP6CB(skb)));
166ae68d933SAndrea Mayer 
167ae68d933SAndrea Mayer 		/* the control block has been erased, so we have to set the
168ae68d933SAndrea Mayer 		 * iif once again.
169ae68d933SAndrea Mayer 		 * We read the receiving interface index directly from the
170ae68d933SAndrea Mayer 		 * skb->skb_iif as it is done in the IPv4 receiving path (i.e.:
171ae68d933SAndrea Mayer 		 * ip_rcv_core(...)).
172ae68d933SAndrea Mayer 		 */
173ae68d933SAndrea Mayer 		IP6CB(skb)->iif = skb->skb_iif;
17432d99d0bSDavid Lebrun 	}
17532d99d0bSDavid Lebrun 
1766c8702c6SDavid Lebrun 	hdr->nexthdr = NEXTHDR_ROUTING;
1776c8702c6SDavid Lebrun 
1786c8702c6SDavid Lebrun 	isrh = (void *)hdr + sizeof(*hdr);
1796c8702c6SDavid Lebrun 	memcpy(isrh, osrh, hdrlen);
1806c8702c6SDavid Lebrun 
18132d99d0bSDavid Lebrun 	isrh->nexthdr = proto;
1826c8702c6SDavid Lebrun 
1836c8702c6SDavid Lebrun 	hdr->daddr = isrh->segments[isrh->first_segment];
184a957fa19SAhmed Abdelsalam 	set_tun_src(net, dst->dev, &hdr->daddr, &hdr->saddr);
1856c8702c6SDavid Lebrun 
1869baee834SDavid Lebrun #ifdef CONFIG_IPV6_SEG6_HMAC
1879baee834SDavid Lebrun 	if (sr_has_hmac(isrh)) {
1889baee834SDavid Lebrun 		err = seg6_push_hmac(net, &hdr->saddr, isrh);
1899baee834SDavid Lebrun 		if (unlikely(err))
1909baee834SDavid Lebrun 			return err;
1919baee834SDavid Lebrun 	}
1929baee834SDavid Lebrun #endif
1939baee834SDavid Lebrun 
194df8386d1SAndrea Mayer 	hdr->payload_len = htons(skb->len - sizeof(struct ipv6hdr));
195df8386d1SAndrea Mayer 
1966c8702c6SDavid Lebrun 	skb_postpush_rcsum(skb, hdr, tot_len);
1976c8702c6SDavid Lebrun 
1986c8702c6SDavid Lebrun 	return 0;
1996c8702c6SDavid Lebrun }
200ab9de9c4SJustin Iurman 
201ab9de9c4SJustin Iurman /* encapsulate an IPv6 packet within an outer IPv6 header with a given SRH */
seg6_do_srh_encap(struct sk_buff * skb,struct ipv6_sr_hdr * osrh,int proto)202ab9de9c4SJustin Iurman int seg6_do_srh_encap(struct sk_buff *skb, struct ipv6_sr_hdr *osrh, int proto)
203ab9de9c4SJustin Iurman {
204ab9de9c4SJustin Iurman 	return __seg6_do_srh_encap(skb, osrh, proto, NULL);
205ab9de9c4SJustin Iurman }
206b04c80d3SDavid Lebrun EXPORT_SYMBOL_GPL(seg6_do_srh_encap);
2076c8702c6SDavid Lebrun 
208b07c8cdbSAndrea Mayer /* encapsulate an IPv6 packet within an outer IPv6 header with reduced SRH */
seg6_do_srh_encap_red(struct sk_buff * skb,struct ipv6_sr_hdr * osrh,int proto,struct dst_entry * cache_dst)209b07c8cdbSAndrea Mayer static int seg6_do_srh_encap_red(struct sk_buff *skb,
210ab9de9c4SJustin Iurman 				 struct ipv6_sr_hdr *osrh, int proto,
211ab9de9c4SJustin Iurman 				 struct dst_entry *cache_dst)
212b07c8cdbSAndrea Mayer {
213b07c8cdbSAndrea Mayer 	__u8 first_seg = osrh->first_segment;
214b07c8cdbSAndrea Mayer 	struct dst_entry *dst = skb_dst(skb);
215b07c8cdbSAndrea Mayer 	struct net *net = dev_net(dst->dev);
216b07c8cdbSAndrea Mayer 	struct ipv6hdr *hdr, *inner_hdr;
217b07c8cdbSAndrea Mayer 	int hdrlen = ipv6_optlen(osrh);
218b07c8cdbSAndrea Mayer 	int red_tlv_offset, tlv_offset;
219b07c8cdbSAndrea Mayer 	struct ipv6_sr_hdr *isrh;
220b07c8cdbSAndrea Mayer 	bool skip_srh = false;
221b07c8cdbSAndrea Mayer 	__be32 flowlabel;
222b07c8cdbSAndrea Mayer 	int tot_len, err;
223b07c8cdbSAndrea Mayer 	int red_hdrlen;
224b07c8cdbSAndrea Mayer 	int tlvs_len;
225b07c8cdbSAndrea Mayer 
226b07c8cdbSAndrea Mayer 	if (first_seg > 0) {
227b07c8cdbSAndrea Mayer 		red_hdrlen = hdrlen - sizeof(struct in6_addr);
228b07c8cdbSAndrea Mayer 	} else {
229b07c8cdbSAndrea Mayer 		/* NOTE: if tag/flags and/or other TLVs are introduced in the
230b07c8cdbSAndrea Mayer 		 * seg6_iptunnel infrastructure, they should be considered when
231b07c8cdbSAndrea Mayer 		 * deciding to skip the SRH.
232b07c8cdbSAndrea Mayer 		 */
233b07c8cdbSAndrea Mayer 		skip_srh = !sr_has_hmac(osrh);
234b07c8cdbSAndrea Mayer 
235b07c8cdbSAndrea Mayer 		red_hdrlen = skip_srh ? 0 : hdrlen;
236b07c8cdbSAndrea Mayer 	}
237b07c8cdbSAndrea Mayer 
238b07c8cdbSAndrea Mayer 	tot_len = red_hdrlen + sizeof(struct ipv6hdr);
239b07c8cdbSAndrea Mayer 
240ab9de9c4SJustin Iurman 	err = skb_cow_head(skb, tot_len + dst_dev_overhead(cache_dst, skb));
241b07c8cdbSAndrea Mayer 	if (unlikely(err))
242b07c8cdbSAndrea Mayer 		return err;
243b07c8cdbSAndrea Mayer 
244b07c8cdbSAndrea Mayer 	inner_hdr = ipv6_hdr(skb);
245b07c8cdbSAndrea Mayer 	flowlabel = seg6_make_flowlabel(net, skb, inner_hdr);
246b07c8cdbSAndrea Mayer 
247b07c8cdbSAndrea Mayer 	skb_push(skb, tot_len);
248b07c8cdbSAndrea Mayer 	skb_reset_network_header(skb);
249b07c8cdbSAndrea Mayer 	skb_mac_header_rebuild(skb);
250b07c8cdbSAndrea Mayer 	hdr = ipv6_hdr(skb);
251b07c8cdbSAndrea Mayer 
252b07c8cdbSAndrea Mayer 	/* based on seg6_do_srh_encap() */
253b07c8cdbSAndrea Mayer 	if (skb->protocol == htons(ETH_P_IPV6)) {
254b07c8cdbSAndrea Mayer 		ip6_flow_hdr(hdr, ip6_tclass(ip6_flowinfo(inner_hdr)),
255b07c8cdbSAndrea Mayer 			     flowlabel);
256b07c8cdbSAndrea Mayer 		hdr->hop_limit = inner_hdr->hop_limit;
257b07c8cdbSAndrea Mayer 	} else {
258b07c8cdbSAndrea Mayer 		ip6_flow_hdr(hdr, 0, flowlabel);
259b07c8cdbSAndrea Mayer 		hdr->hop_limit = ip6_dst_hoplimit(skb_dst(skb));
260b07c8cdbSAndrea Mayer 
261b07c8cdbSAndrea Mayer 		memset(IP6CB(skb), 0, sizeof(*IP6CB(skb)));
262b07c8cdbSAndrea Mayer 		IP6CB(skb)->iif = skb->skb_iif;
263b07c8cdbSAndrea Mayer 	}
264b07c8cdbSAndrea Mayer 
265b07c8cdbSAndrea Mayer 	/* no matter if we have to skip the SRH or not, the first segment
266b07c8cdbSAndrea Mayer 	 * always comes in the pushed IPv6 header.
267b07c8cdbSAndrea Mayer 	 */
268b07c8cdbSAndrea Mayer 	hdr->daddr = osrh->segments[first_seg];
269b07c8cdbSAndrea Mayer 
270b07c8cdbSAndrea Mayer 	if (skip_srh) {
271b07c8cdbSAndrea Mayer 		hdr->nexthdr = proto;
272b07c8cdbSAndrea Mayer 
273b07c8cdbSAndrea Mayer 		set_tun_src(net, dst->dev, &hdr->daddr, &hdr->saddr);
274b07c8cdbSAndrea Mayer 		goto out;
275b07c8cdbSAndrea Mayer 	}
276b07c8cdbSAndrea Mayer 
277b07c8cdbSAndrea Mayer 	/* we cannot skip the SRH, slow path */
278b07c8cdbSAndrea Mayer 
279b07c8cdbSAndrea Mayer 	hdr->nexthdr = NEXTHDR_ROUTING;
280b07c8cdbSAndrea Mayer 	isrh = (void *)hdr + sizeof(struct ipv6hdr);
281b07c8cdbSAndrea Mayer 
282b07c8cdbSAndrea Mayer 	if (unlikely(!first_seg)) {
283b07c8cdbSAndrea Mayer 		/* this is a very rare case; we have only one SID but
284b07c8cdbSAndrea Mayer 		 * we cannot skip the SRH since we are carrying some
285b07c8cdbSAndrea Mayer 		 * other info.
286b07c8cdbSAndrea Mayer 		 */
287b07c8cdbSAndrea Mayer 		memcpy(isrh, osrh, hdrlen);
288b07c8cdbSAndrea Mayer 		goto srcaddr;
289b07c8cdbSAndrea Mayer 	}
290b07c8cdbSAndrea Mayer 
291b07c8cdbSAndrea Mayer 	tlv_offset = sizeof(*osrh) + (first_seg + 1) * sizeof(struct in6_addr);
292b07c8cdbSAndrea Mayer 	red_tlv_offset = tlv_offset - sizeof(struct in6_addr);
293b07c8cdbSAndrea Mayer 
294b07c8cdbSAndrea Mayer 	memcpy(isrh, osrh, red_tlv_offset);
295b07c8cdbSAndrea Mayer 
296b07c8cdbSAndrea Mayer 	tlvs_len = hdrlen - tlv_offset;
297b07c8cdbSAndrea Mayer 	if (unlikely(tlvs_len > 0)) {
298b07c8cdbSAndrea Mayer 		const void *s = (const void *)osrh + tlv_offset;
299b07c8cdbSAndrea Mayer 		void *d = (void *)isrh + red_tlv_offset;
300b07c8cdbSAndrea Mayer 
301b07c8cdbSAndrea Mayer 		memcpy(d, s, tlvs_len);
302b07c8cdbSAndrea Mayer 	}
303b07c8cdbSAndrea Mayer 
304b07c8cdbSAndrea Mayer 	--isrh->first_segment;
305b07c8cdbSAndrea Mayer 	isrh->hdrlen -= 2;
306b07c8cdbSAndrea Mayer 
307b07c8cdbSAndrea Mayer srcaddr:
308b07c8cdbSAndrea Mayer 	isrh->nexthdr = proto;
309b07c8cdbSAndrea Mayer 	set_tun_src(net, dst->dev, &hdr->daddr, &hdr->saddr);
310b07c8cdbSAndrea Mayer 
311b07c8cdbSAndrea Mayer #ifdef CONFIG_IPV6_SEG6_HMAC
312b07c8cdbSAndrea Mayer 	if (unlikely(!skip_srh && sr_has_hmac(isrh))) {
313b07c8cdbSAndrea Mayer 		err = seg6_push_hmac(net, &hdr->saddr, isrh);
314b07c8cdbSAndrea Mayer 		if (unlikely(err))
315b07c8cdbSAndrea Mayer 			return err;
316b07c8cdbSAndrea Mayer 	}
317b07c8cdbSAndrea Mayer #endif
318b07c8cdbSAndrea Mayer 
319b07c8cdbSAndrea Mayer out:
320b07c8cdbSAndrea Mayer 	hdr->payload_len = htons(skb->len - sizeof(struct ipv6hdr));
321b07c8cdbSAndrea Mayer 
322b07c8cdbSAndrea Mayer 	skb_postpush_rcsum(skb, hdr, tot_len);
323b07c8cdbSAndrea Mayer 
324b07c8cdbSAndrea Mayer 	return 0;
325b07c8cdbSAndrea Mayer }
326b07c8cdbSAndrea Mayer 
__seg6_do_srh_inline(struct sk_buff * skb,struct ipv6_sr_hdr * osrh,struct dst_entry * cache_dst)327ab9de9c4SJustin Iurman static int __seg6_do_srh_inline(struct sk_buff *skb, struct ipv6_sr_hdr *osrh,
328ab9de9c4SJustin Iurman 				struct dst_entry *cache_dst)
3296c8702c6SDavid Lebrun {
3306c8702c6SDavid Lebrun 	struct ipv6hdr *hdr, *oldhdr;
3316c8702c6SDavid Lebrun 	struct ipv6_sr_hdr *isrh;
3326c8702c6SDavid Lebrun 	int hdrlen, err;
3336c8702c6SDavid Lebrun 
3346c8702c6SDavid Lebrun 	hdrlen = (osrh->hdrlen + 1) << 3;
3356c8702c6SDavid Lebrun 
336ab9de9c4SJustin Iurman 	err = skb_cow_head(skb, hdrlen + dst_dev_overhead(cache_dst, skb));
3376c8702c6SDavid Lebrun 	if (unlikely(err))
3386c8702c6SDavid Lebrun 		return err;
3396c8702c6SDavid Lebrun 
3406c8702c6SDavid Lebrun 	oldhdr = ipv6_hdr(skb);
3416c8702c6SDavid Lebrun 
3426c8702c6SDavid Lebrun 	skb_pull(skb, sizeof(struct ipv6hdr));
3436c8702c6SDavid Lebrun 	skb_postpull_rcsum(skb, skb_network_header(skb),
3446c8702c6SDavid Lebrun 			   sizeof(struct ipv6hdr));
3456c8702c6SDavid Lebrun 
3466c8702c6SDavid Lebrun 	skb_push(skb, sizeof(struct ipv6hdr) + hdrlen);
3476c8702c6SDavid Lebrun 	skb_reset_network_header(skb);
3486c8702c6SDavid Lebrun 	skb_mac_header_rebuild(skb);
3496c8702c6SDavid Lebrun 
3506c8702c6SDavid Lebrun 	hdr = ipv6_hdr(skb);
3516c8702c6SDavid Lebrun 
3526c8702c6SDavid Lebrun 	memmove(hdr, oldhdr, sizeof(*hdr));
3536c8702c6SDavid Lebrun 
3546c8702c6SDavid Lebrun 	isrh = (void *)hdr + sizeof(*hdr);
3556c8702c6SDavid Lebrun 	memcpy(isrh, osrh, hdrlen);
3566c8702c6SDavid Lebrun 
3576c8702c6SDavid Lebrun 	isrh->nexthdr = hdr->nexthdr;
3586c8702c6SDavid Lebrun 	hdr->nexthdr = NEXTHDR_ROUTING;
3596c8702c6SDavid Lebrun 
3606c8702c6SDavid Lebrun 	isrh->segments[0] = hdr->daddr;
3616c8702c6SDavid Lebrun 	hdr->daddr = isrh->segments[isrh->first_segment];
3626c8702c6SDavid Lebrun 
3639baee834SDavid Lebrun #ifdef CONFIG_IPV6_SEG6_HMAC
3649baee834SDavid Lebrun 	if (sr_has_hmac(isrh)) {
3659baee834SDavid Lebrun 		struct net *net = dev_net(skb_dst(skb)->dev);
3669baee834SDavid Lebrun 
3679baee834SDavid Lebrun 		err = seg6_push_hmac(net, &hdr->saddr, isrh);
3689baee834SDavid Lebrun 		if (unlikely(err))
3699baee834SDavid Lebrun 			return err;
3709baee834SDavid Lebrun 	}
3719baee834SDavid Lebrun #endif
3729baee834SDavid Lebrun 
373df8386d1SAndrea Mayer 	hdr->payload_len = htons(skb->len - sizeof(struct ipv6hdr));
374df8386d1SAndrea Mayer 
3756c8702c6SDavid Lebrun 	skb_postpush_rcsum(skb, hdr, sizeof(struct ipv6hdr) + hdrlen);
3766c8702c6SDavid Lebrun 
3776c8702c6SDavid Lebrun 	return 0;
3786c8702c6SDavid Lebrun }
3796c8702c6SDavid Lebrun 
seg6_do_srh(struct sk_buff * skb,struct dst_entry * cache_dst)380ab9de9c4SJustin Iurman static int seg6_do_srh(struct sk_buff *skb, struct dst_entry *cache_dst)
3816c8702c6SDavid Lebrun {
3826c8702c6SDavid Lebrun 	struct dst_entry *dst = skb_dst(skb);
3836c8702c6SDavid Lebrun 	struct seg6_iptunnel_encap *tinfo;
38432d99d0bSDavid Lebrun 	int proto, err = 0;
3856c8702c6SDavid Lebrun 
3866c8702c6SDavid Lebrun 	tinfo = seg6_encap_lwtunnel(dst->lwtstate);
3876c8702c6SDavid Lebrun 
3886c8702c6SDavid Lebrun 	switch (tinfo->mode) {
3896c8702c6SDavid Lebrun 	case SEG6_IPTUN_MODE_INLINE:
39032d99d0bSDavid Lebrun 		if (skb->protocol != htons(ETH_P_IPV6))
39132d99d0bSDavid Lebrun 			return -EINVAL;
39232d99d0bSDavid Lebrun 
393ab9de9c4SJustin Iurman 		err = __seg6_do_srh_inline(skb, tinfo->srh, cache_dst);
39432d99d0bSDavid Lebrun 		if (err)
39532d99d0bSDavid Lebrun 			return err;
3966c8702c6SDavid Lebrun 		break;
3976c8702c6SDavid Lebrun 	case SEG6_IPTUN_MODE_ENCAP:
398b07c8cdbSAndrea Mayer 	case SEG6_IPTUN_MODE_ENCAP_RED:
3995807b22cSDavid Lebrun 		err = iptunnel_handle_offloads(skb, SKB_GSO_IPXIP6);
4005807b22cSDavid Lebrun 		if (err)
4015807b22cSDavid Lebrun 			return err;
4025807b22cSDavid Lebrun 
40332d99d0bSDavid Lebrun 		if (skb->protocol == htons(ETH_P_IPV6))
40432d99d0bSDavid Lebrun 			proto = IPPROTO_IPV6;
40532d99d0bSDavid Lebrun 		else if (skb->protocol == htons(ETH_P_IP))
40632d99d0bSDavid Lebrun 			proto = IPPROTO_IPIP;
40732d99d0bSDavid Lebrun 		else
40832d99d0bSDavid Lebrun 			return -EINVAL;
4096c8702c6SDavid Lebrun 
410b07c8cdbSAndrea Mayer 		if (tinfo->mode == SEG6_IPTUN_MODE_ENCAP)
411ab9de9c4SJustin Iurman 			err = __seg6_do_srh_encap(skb, tinfo->srh,
412ab9de9c4SJustin Iurman 						  proto, cache_dst);
413b07c8cdbSAndrea Mayer 		else
414ab9de9c4SJustin Iurman 			err = seg6_do_srh_encap_red(skb, tinfo->srh,
415ab9de9c4SJustin Iurman 						    proto, cache_dst);
416b07c8cdbSAndrea Mayer 
4176c8702c6SDavid Lebrun 		if (err)
4186c8702c6SDavid Lebrun 			return err;
4196c8702c6SDavid Lebrun 
4205807b22cSDavid Lebrun 		skb_set_inner_transport_header(skb, skb_transport_offset(skb));
4215807b22cSDavid Lebrun 		skb_set_inner_protocol(skb, skb->protocol);
42232d99d0bSDavid Lebrun 		skb->protocol = htons(ETH_P_IPV6);
42332d99d0bSDavid Lebrun 		break;
42438ee7f2dSDavid Lebrun 	case SEG6_IPTUN_MODE_L2ENCAP:
42513f0296bSAndrea Mayer 	case SEG6_IPTUN_MODE_L2ENCAP_RED:
42638ee7f2dSDavid Lebrun 		if (!skb_mac_header_was_set(skb))
42738ee7f2dSDavid Lebrun 			return -EINVAL;
42838ee7f2dSDavid Lebrun 
42938ee7f2dSDavid Lebrun 		if (pskb_expand_head(skb, skb->mac_len, 0, GFP_ATOMIC) < 0)
43038ee7f2dSDavid Lebrun 			return -ENOMEM;
43138ee7f2dSDavid Lebrun 
43238ee7f2dSDavid Lebrun 		skb_mac_header_rebuild(skb);
43338ee7f2dSDavid Lebrun 		skb_push(skb, skb->mac_len);
43438ee7f2dSDavid Lebrun 
43513f0296bSAndrea Mayer 		if (tinfo->mode == SEG6_IPTUN_MODE_L2ENCAP)
436ab9de9c4SJustin Iurman 			err = __seg6_do_srh_encap(skb, tinfo->srh,
437ab9de9c4SJustin Iurman 						  IPPROTO_ETHERNET,
438ab9de9c4SJustin Iurman 						  cache_dst);
43913f0296bSAndrea Mayer 		else
44013f0296bSAndrea Mayer 			err = seg6_do_srh_encap_red(skb, tinfo->srh,
441ab9de9c4SJustin Iurman 						    IPPROTO_ETHERNET,
442ab9de9c4SJustin Iurman 						    cache_dst);
44313f0296bSAndrea Mayer 
44438ee7f2dSDavid Lebrun 		if (err)
44538ee7f2dSDavid Lebrun 			return err;
44638ee7f2dSDavid Lebrun 
44738ee7f2dSDavid Lebrun 		skb->protocol = htons(ETH_P_IPV6);
44838ee7f2dSDavid Lebrun 		break;
44932d99d0bSDavid Lebrun 	}
45032d99d0bSDavid Lebrun 
4516c8702c6SDavid Lebrun 	skb_set_transport_header(skb, sizeof(struct ipv6hdr));
4527a3f5b0dSRyoga Saito 	nf_reset_ct(skb);
4536c8702c6SDavid Lebrun 
4546c8702c6SDavid Lebrun 	return 0;
4556c8702c6SDavid Lebrun }
4566c8702c6SDavid Lebrun 
457ab9de9c4SJustin Iurman /* insert an SRH within an IPv6 packet, just after the IPv6 header */
seg6_do_srh_inline(struct sk_buff * skb,struct ipv6_sr_hdr * osrh)458ab9de9c4SJustin Iurman int seg6_do_srh_inline(struct sk_buff *skb, struct ipv6_sr_hdr *osrh)
459ab9de9c4SJustin Iurman {
460ab9de9c4SJustin Iurman 	return __seg6_do_srh_inline(skb, osrh, NULL);
461ab9de9c4SJustin Iurman }
462ab9de9c4SJustin Iurman EXPORT_SYMBOL_GPL(seg6_do_srh_inline);
463ab9de9c4SJustin Iurman 
seg6_input_finish(struct net * net,struct sock * sk,struct sk_buff * skb)4647a3f5b0dSRyoga Saito static int seg6_input_finish(struct net *net, struct sock *sk,
4657a3f5b0dSRyoga Saito 			     struct sk_buff *skb)
4667a3f5b0dSRyoga Saito {
4677a3f5b0dSRyoga Saito 	return dst_input(skb);
4687a3f5b0dSRyoga Saito }
4697a3f5b0dSRyoga Saito 
seg6_input_core(struct net * net,struct sock * sk,struct sk_buff * skb)4707a3f5b0dSRyoga Saito static int seg6_input_core(struct net *net, struct sock *sk,
4717a3f5b0dSRyoga Saito 			   struct sk_buff *skb)
4726c8702c6SDavid Lebrun {
473af4a2209SDavid Lebrun 	struct dst_entry *orig_dst = skb_dst(skb);
474af4a2209SDavid Lebrun 	struct dst_entry *dst = NULL;
475*c441f928SJustin Iurman 	struct lwtunnel_state *lwtst;
476af4a2209SDavid Lebrun 	struct seg6_lwt *slwt;
4776c8702c6SDavid Lebrun 	int err;
4786c8702c6SDavid Lebrun 
479*c441f928SJustin Iurman 	/* We cannot dereference "orig_dst" once ip6_route_input() or
480*c441f928SJustin Iurman 	 * skb_dst_drop() is called. However, in order to detect a dst loop, we
481*c441f928SJustin Iurman 	 * need the address of its lwtstate. So, save the address of lwtstate
482*c441f928SJustin Iurman 	 * now and use it later as a comparison.
483*c441f928SJustin Iurman 	 */
484*c441f928SJustin Iurman 	lwtst = orig_dst->lwtstate;
485*c441f928SJustin Iurman 
486*c441f928SJustin Iurman 	slwt = seg6_lwt_lwtunnel(lwtst);
487af4a2209SDavid Lebrun 
488f8dd092eSEric Dumazet 	local_bh_disable();
489af4a2209SDavid Lebrun 	dst = dst_cache_get(&slwt->cache);
490ab9de9c4SJustin Iurman 	local_bh_enable();
491ab9de9c4SJustin Iurman 
492ab9de9c4SJustin Iurman 	err = seg6_do_srh(skb, dst);
493ab9de9c4SJustin Iurman 	if (unlikely(err))
494ab9de9c4SJustin Iurman 		goto drop;
495af4a2209SDavid Lebrun 
496af4a2209SDavid Lebrun 	if (!dst) {
4976c8702c6SDavid Lebrun 		ip6_route_input(skb);
498af4a2209SDavid Lebrun 		dst = skb_dst(skb);
499*c441f928SJustin Iurman 
500*c441f928SJustin Iurman 		/* cache only if we don't create a dst reference loop */
501*c441f928SJustin Iurman 		if (!dst->error && lwtst != dst->lwtstate) {
502ab9de9c4SJustin Iurman 			local_bh_disable();
503af4a2209SDavid Lebrun 			dst_cache_set_ip6(&slwt->cache, dst,
504af4a2209SDavid Lebrun 					  &ipv6_hdr(skb)->saddr);
505f8dd092eSEric Dumazet 			local_bh_enable();
506ab9de9c4SJustin Iurman 		}
5076c8702c6SDavid Lebrun 
508af3b5158SDavid Lebrun 		err = skb_cow_head(skb, LL_RESERVED_SPACE(dst->dev));
509af3b5158SDavid Lebrun 		if (unlikely(err))
510f4df8c76SAndrea Mayer 			goto drop;
511ab9de9c4SJustin Iurman 	} else {
512ab9de9c4SJustin Iurman 		skb_dst_drop(skb);
513ab9de9c4SJustin Iurman 		skb_dst_set(skb, dst);
514ab9de9c4SJustin Iurman 	}
515af3b5158SDavid Lebrun 
5167a3f5b0dSRyoga Saito 	if (static_branch_unlikely(&nf_hooks_lwtunnel_enabled))
5177a3f5b0dSRyoga Saito 		return NF_HOOK(NFPROTO_IPV6, NF_INET_LOCAL_OUT,
5187a3f5b0dSRyoga Saito 			       dev_net(skb->dev), NULL, skb, NULL,
5197a3f5b0dSRyoga Saito 			       skb_dst(skb)->dev, seg6_input_finish);
5207a3f5b0dSRyoga Saito 
5217a3f5b0dSRyoga Saito 	return seg6_input_finish(dev_net(skb->dev), NULL, skb);
522f4df8c76SAndrea Mayer drop:
523f4df8c76SAndrea Mayer 	kfree_skb(skb);
524f4df8c76SAndrea Mayer 	return err;
5256c8702c6SDavid Lebrun }
5266c8702c6SDavid Lebrun 
seg6_input_nf(struct sk_buff * skb)5277a3f5b0dSRyoga Saito static int seg6_input_nf(struct sk_buff *skb)
5287a3f5b0dSRyoga Saito {
5297a3f5b0dSRyoga Saito 	struct net_device *dev = skb_dst(skb)->dev;
5307a3f5b0dSRyoga Saito 	struct net *net = dev_net(skb->dev);
5317a3f5b0dSRyoga Saito 
5327a3f5b0dSRyoga Saito 	switch (skb->protocol) {
5337a3f5b0dSRyoga Saito 	case htons(ETH_P_IP):
5347a3f5b0dSRyoga Saito 		return NF_HOOK(NFPROTO_IPV4, NF_INET_POST_ROUTING, net, NULL,
5357a3f5b0dSRyoga Saito 			       skb, NULL, dev, seg6_input_core);
5367a3f5b0dSRyoga Saito 	case htons(ETH_P_IPV6):
5377a3f5b0dSRyoga Saito 		return NF_HOOK(NFPROTO_IPV6, NF_INET_POST_ROUTING, net, NULL,
5387a3f5b0dSRyoga Saito 			       skb, NULL, dev, seg6_input_core);
5397a3f5b0dSRyoga Saito 	}
5407a3f5b0dSRyoga Saito 
5417a3f5b0dSRyoga Saito 	return -EINVAL;
5427a3f5b0dSRyoga Saito }
5437a3f5b0dSRyoga Saito 
seg6_input(struct sk_buff * skb)5447a3f5b0dSRyoga Saito static int seg6_input(struct sk_buff *skb)
5457a3f5b0dSRyoga Saito {
5467a3f5b0dSRyoga Saito 	if (static_branch_unlikely(&nf_hooks_lwtunnel_enabled))
5477a3f5b0dSRyoga Saito 		return seg6_input_nf(skb);
5487a3f5b0dSRyoga Saito 
5497a3f5b0dSRyoga Saito 	return seg6_input_core(dev_net(skb->dev), NULL, skb);
5507a3f5b0dSRyoga Saito }
5517a3f5b0dSRyoga Saito 
seg6_output_core(struct net * net,struct sock * sk,struct sk_buff * skb)5527a3f5b0dSRyoga Saito static int seg6_output_core(struct net *net, struct sock *sk,
5537a3f5b0dSRyoga Saito 			    struct sk_buff *skb)
5546c8702c6SDavid Lebrun {
5556c8702c6SDavid Lebrun 	struct dst_entry *orig_dst = skb_dst(skb);
5566c8702c6SDavid Lebrun 	struct dst_entry *dst = NULL;
5576c8702c6SDavid Lebrun 	struct seg6_lwt *slwt;
558bf0df73aSColin Ian King 	int err;
5596c8702c6SDavid Lebrun 
5606c8702c6SDavid Lebrun 	slwt = seg6_lwt_lwtunnel(orig_dst->lwtstate);
5616c8702c6SDavid Lebrun 
562f8dd092eSEric Dumazet 	local_bh_disable();
5636c8702c6SDavid Lebrun 	dst = dst_cache_get(&slwt->cache);
564f8dd092eSEric Dumazet 	local_bh_enable();
5656c8702c6SDavid Lebrun 
566ab9de9c4SJustin Iurman 	err = seg6_do_srh(skb, dst);
567ab9de9c4SJustin Iurman 	if (unlikely(err))
568ab9de9c4SJustin Iurman 		goto drop;
569ab9de9c4SJustin Iurman 
5706c8702c6SDavid Lebrun 	if (unlikely(!dst)) {
5716c8702c6SDavid Lebrun 		struct ipv6hdr *hdr = ipv6_hdr(skb);
5726c8702c6SDavid Lebrun 		struct flowi6 fl6;
5736c8702c6SDavid Lebrun 
5741b4e5ad5SShmulik Ladkani 		memset(&fl6, 0, sizeof(fl6));
5756c8702c6SDavid Lebrun 		fl6.daddr = hdr->daddr;
5766c8702c6SDavid Lebrun 		fl6.saddr = hdr->saddr;
5776c8702c6SDavid Lebrun 		fl6.flowlabel = ip6_flowinfo(hdr);
5786c8702c6SDavid Lebrun 		fl6.flowi6_mark = skb->mark;
5796c8702c6SDavid Lebrun 		fl6.flowi6_proto = hdr->nexthdr;
5806c8702c6SDavid Lebrun 
5816c8702c6SDavid Lebrun 		dst = ip6_route_output(net, NULL, &fl6);
5826c8702c6SDavid Lebrun 		if (dst->error) {
5836c8702c6SDavid Lebrun 			err = dst->error;
5846c8702c6SDavid Lebrun 			dst_release(dst);
5856c8702c6SDavid Lebrun 			goto drop;
5866c8702c6SDavid Lebrun 		}
5876c8702c6SDavid Lebrun 
588f8dd092eSEric Dumazet 		local_bh_disable();
5896c8702c6SDavid Lebrun 		dst_cache_set_ip6(&slwt->cache, dst, &fl6.saddr);
590f8dd092eSEric Dumazet 		local_bh_enable();
5916c8702c6SDavid Lebrun 
592af3b5158SDavid Lebrun 		err = skb_cow_head(skb, LL_RESERVED_SPACE(dst->dev));
593af3b5158SDavid Lebrun 		if (unlikely(err))
594af3b5158SDavid Lebrun 			goto drop;
595ab9de9c4SJustin Iurman 	}
596ab9de9c4SJustin Iurman 
597ab9de9c4SJustin Iurman 	skb_dst_drop(skb);
598ab9de9c4SJustin Iurman 	skb_dst_set(skb, dst);
599af3b5158SDavid Lebrun 
6007a3f5b0dSRyoga Saito 	if (static_branch_unlikely(&nf_hooks_lwtunnel_enabled))
6017a3f5b0dSRyoga Saito 		return NF_HOOK(NFPROTO_IPV6, NF_INET_LOCAL_OUT, net, sk, skb,
6027a3f5b0dSRyoga Saito 			       NULL, skb_dst(skb)->dev, dst_output);
6037a3f5b0dSRyoga Saito 
6046c8702c6SDavid Lebrun 	return dst_output(net, sk, skb);
6056c8702c6SDavid Lebrun drop:
6066c8702c6SDavid Lebrun 	kfree_skb(skb);
6076c8702c6SDavid Lebrun 	return err;
6086c8702c6SDavid Lebrun }
6096c8702c6SDavid Lebrun 
seg6_output_nf(struct net * net,struct sock * sk,struct sk_buff * skb)6107a3f5b0dSRyoga Saito static int seg6_output_nf(struct net *net, struct sock *sk, struct sk_buff *skb)
6117a3f5b0dSRyoga Saito {
6127a3f5b0dSRyoga Saito 	struct net_device *dev = skb_dst(skb)->dev;
6137a3f5b0dSRyoga Saito 
6147a3f5b0dSRyoga Saito 	switch (skb->protocol) {
6157a3f5b0dSRyoga Saito 	case htons(ETH_P_IP):
6167a3f5b0dSRyoga Saito 		return NF_HOOK(NFPROTO_IPV4, NF_INET_POST_ROUTING, net, sk, skb,
6177a3f5b0dSRyoga Saito 			       NULL, dev, seg6_output_core);
6187a3f5b0dSRyoga Saito 	case htons(ETH_P_IPV6):
6197a3f5b0dSRyoga Saito 		return NF_HOOK(NFPROTO_IPV6, NF_INET_POST_ROUTING, net, sk, skb,
6207a3f5b0dSRyoga Saito 			       NULL, dev, seg6_output_core);
6217a3f5b0dSRyoga Saito 	}
6227a3f5b0dSRyoga Saito 
6237a3f5b0dSRyoga Saito 	return -EINVAL;
6247a3f5b0dSRyoga Saito }
6257a3f5b0dSRyoga Saito 
seg6_output(struct net * net,struct sock * sk,struct sk_buff * skb)6267a3f5b0dSRyoga Saito static int seg6_output(struct net *net, struct sock *sk, struct sk_buff *skb)
6277a3f5b0dSRyoga Saito {
6287a3f5b0dSRyoga Saito 	if (static_branch_unlikely(&nf_hooks_lwtunnel_enabled))
6297a3f5b0dSRyoga Saito 		return seg6_output_nf(net, sk, skb);
6307a3f5b0dSRyoga Saito 
6317a3f5b0dSRyoga Saito 	return seg6_output_core(net, sk, skb);
6327a3f5b0dSRyoga Saito }
6337a3f5b0dSRyoga Saito 
seg6_build_state(struct net * net,struct nlattr * nla,unsigned int family,const void * cfg,struct lwtunnel_state ** ts,struct netlink_ext_ack * extack)634faee6769SAlexander Aring static int seg6_build_state(struct net *net, struct nlattr *nla,
6356c8702c6SDavid Lebrun 			    unsigned int family, const void *cfg,
6369ae28727SDavid Ahern 			    struct lwtunnel_state **ts,
6379ae28727SDavid Ahern 			    struct netlink_ext_ack *extack)
6386c8702c6SDavid Lebrun {
6396c8702c6SDavid Lebrun 	struct nlattr *tb[SEG6_IPTUNNEL_MAX + 1];
6406c8702c6SDavid Lebrun 	struct seg6_iptunnel_encap *tuninfo;
6416c8702c6SDavid Lebrun 	struct lwtunnel_state *newts;
6426c8702c6SDavid Lebrun 	int tuninfo_len, min_size;
6436c8702c6SDavid Lebrun 	struct seg6_lwt *slwt;
6446c8702c6SDavid Lebrun 	int err;
6456c8702c6SDavid Lebrun 
64632d99d0bSDavid Lebrun 	if (family != AF_INET && family != AF_INET6)
64732d99d0bSDavid Lebrun 		return -EINVAL;
64832d99d0bSDavid Lebrun 
6498cb08174SJohannes Berg 	err = nla_parse_nested_deprecated(tb, SEG6_IPTUNNEL_MAX, nla,
6509ae28727SDavid Ahern 					  seg6_iptunnel_policy, extack);
6516c8702c6SDavid Lebrun 
6526c8702c6SDavid Lebrun 	if (err < 0)
6536c8702c6SDavid Lebrun 		return err;
6546c8702c6SDavid Lebrun 
6556c8702c6SDavid Lebrun 	if (!tb[SEG6_IPTUNNEL_SRH])
6566c8702c6SDavid Lebrun 		return -EINVAL;
6576c8702c6SDavid Lebrun 
6586c8702c6SDavid Lebrun 	tuninfo = nla_data(tb[SEG6_IPTUNNEL_SRH]);
6596c8702c6SDavid Lebrun 	tuninfo_len = nla_len(tb[SEG6_IPTUNNEL_SRH]);
6606c8702c6SDavid Lebrun 
6616c8702c6SDavid Lebrun 	/* tuninfo must contain at least the iptunnel encap structure,
6626c8702c6SDavid Lebrun 	 * the SRH and one segment
6636c8702c6SDavid Lebrun 	 */
6646c8702c6SDavid Lebrun 	min_size = sizeof(*tuninfo) + sizeof(struct ipv6_sr_hdr) +
6656c8702c6SDavid Lebrun 		   sizeof(struct in6_addr);
6666c8702c6SDavid Lebrun 	if (tuninfo_len < min_size)
6676c8702c6SDavid Lebrun 		return -EINVAL;
6686c8702c6SDavid Lebrun 
6696c8702c6SDavid Lebrun 	switch (tuninfo->mode) {
6706c8702c6SDavid Lebrun 	case SEG6_IPTUN_MODE_INLINE:
67132d99d0bSDavid Lebrun 		if (family != AF_INET6)
67232d99d0bSDavid Lebrun 			return -EINVAL;
67332d99d0bSDavid Lebrun 
6746c8702c6SDavid Lebrun 		break;
6756c8702c6SDavid Lebrun 	case SEG6_IPTUN_MODE_ENCAP:
6766c8702c6SDavid Lebrun 		break;
67738ee7f2dSDavid Lebrun 	case SEG6_IPTUN_MODE_L2ENCAP:
67838ee7f2dSDavid Lebrun 		break;
679b07c8cdbSAndrea Mayer 	case SEG6_IPTUN_MODE_ENCAP_RED:
680b07c8cdbSAndrea Mayer 		break;
68113f0296bSAndrea Mayer 	case SEG6_IPTUN_MODE_L2ENCAP_RED:
68213f0296bSAndrea Mayer 		break;
6836c8702c6SDavid Lebrun 	default:
6846c8702c6SDavid Lebrun 		return -EINVAL;
6856c8702c6SDavid Lebrun 	}
6866c8702c6SDavid Lebrun 
6876c8702c6SDavid Lebrun 	/* verify that SRH is consistent */
688bb986a50SAhmed Abdelsalam 	if (!seg6_validate_srh(tuninfo->srh, tuninfo_len - sizeof(*tuninfo), false))
6896c8702c6SDavid Lebrun 		return -EINVAL;
6906c8702c6SDavid Lebrun 
6916c8702c6SDavid Lebrun 	newts = lwtunnel_state_alloc(tuninfo_len + sizeof(*slwt));
6926c8702c6SDavid Lebrun 	if (!newts)
6936c8702c6SDavid Lebrun 		return -ENOMEM;
6946c8702c6SDavid Lebrun 
6956c8702c6SDavid Lebrun 	slwt = seg6_lwt_lwtunnel(newts);
6966c8702c6SDavid Lebrun 
697191f86caSDavid Lebrun 	err = dst_cache_init(&slwt->cache, GFP_ATOMIC);
6986c8702c6SDavid Lebrun 	if (err) {
6996c8702c6SDavid Lebrun 		kfree(newts);
7006c8702c6SDavid Lebrun 		return err;
7016c8702c6SDavid Lebrun 	}
7026c8702c6SDavid Lebrun 
7036c8702c6SDavid Lebrun 	memcpy(&slwt->tuninfo, tuninfo, tuninfo_len);
7046c8702c6SDavid Lebrun 
7056c8702c6SDavid Lebrun 	newts->type = LWTUNNEL_ENCAP_SEG6;
70638ee7f2dSDavid Lebrun 	newts->flags |= LWTUNNEL_STATE_INPUT_REDIRECT;
70738ee7f2dSDavid Lebrun 
70838ee7f2dSDavid Lebrun 	if (tuninfo->mode != SEG6_IPTUN_MODE_L2ENCAP)
70938ee7f2dSDavid Lebrun 		newts->flags |= LWTUNNEL_STATE_OUTPUT_REDIRECT;
71038ee7f2dSDavid Lebrun 
7116c8702c6SDavid Lebrun 	newts->headroom = seg6_lwt_headroom(tuninfo);
7126c8702c6SDavid Lebrun 
7136c8702c6SDavid Lebrun 	*ts = newts;
7146c8702c6SDavid Lebrun 
7156c8702c6SDavid Lebrun 	return 0;
7166c8702c6SDavid Lebrun }
7176c8702c6SDavid Lebrun 
seg6_destroy_state(struct lwtunnel_state * lwt)7186c8702c6SDavid Lebrun static void seg6_destroy_state(struct lwtunnel_state *lwt)
7196c8702c6SDavid Lebrun {
7206c8702c6SDavid Lebrun 	dst_cache_destroy(&seg6_lwt_lwtunnel(lwt)->cache);
7216c8702c6SDavid Lebrun }
7226c8702c6SDavid Lebrun 
seg6_fill_encap_info(struct sk_buff * skb,struct lwtunnel_state * lwtstate)7236c8702c6SDavid Lebrun static int seg6_fill_encap_info(struct sk_buff *skb,
7246c8702c6SDavid Lebrun 				struct lwtunnel_state *lwtstate)
7256c8702c6SDavid Lebrun {
7266c8702c6SDavid Lebrun 	struct seg6_iptunnel_encap *tuninfo = seg6_encap_lwtunnel(lwtstate);
7276c8702c6SDavid Lebrun 
7286c8702c6SDavid Lebrun 	if (nla_put_srh(skb, SEG6_IPTUNNEL_SRH, tuninfo))
7296c8702c6SDavid Lebrun 		return -EMSGSIZE;
7306c8702c6SDavid Lebrun 
7316c8702c6SDavid Lebrun 	return 0;
7326c8702c6SDavid Lebrun }
7336c8702c6SDavid Lebrun 
seg6_encap_nlsize(struct lwtunnel_state * lwtstate)7346c8702c6SDavid Lebrun static int seg6_encap_nlsize(struct lwtunnel_state *lwtstate)
7356c8702c6SDavid Lebrun {
7366c8702c6SDavid Lebrun 	struct seg6_iptunnel_encap *tuninfo = seg6_encap_lwtunnel(lwtstate);
7376c8702c6SDavid Lebrun 
7386c8702c6SDavid Lebrun 	return nla_total_size(SEG6_IPTUN_ENCAP_SIZE(tuninfo));
7396c8702c6SDavid Lebrun }
7406c8702c6SDavid Lebrun 
seg6_encap_cmp(struct lwtunnel_state * a,struct lwtunnel_state * b)7416c8702c6SDavid Lebrun static int seg6_encap_cmp(struct lwtunnel_state *a, struct lwtunnel_state *b)
7426c8702c6SDavid Lebrun {
7436c8702c6SDavid Lebrun 	struct seg6_iptunnel_encap *a_hdr = seg6_encap_lwtunnel(a);
7446c8702c6SDavid Lebrun 	struct seg6_iptunnel_encap *b_hdr = seg6_encap_lwtunnel(b);
7456c8702c6SDavid Lebrun 	int len = SEG6_IPTUN_ENCAP_SIZE(a_hdr);
7466c8702c6SDavid Lebrun 
7476c8702c6SDavid Lebrun 	if (len != SEG6_IPTUN_ENCAP_SIZE(b_hdr))
7486c8702c6SDavid Lebrun 		return 1;
7496c8702c6SDavid Lebrun 
7506c8702c6SDavid Lebrun 	return memcmp(a_hdr, b_hdr, len);
7516c8702c6SDavid Lebrun }
7526c8702c6SDavid Lebrun 
7536c8702c6SDavid Lebrun static const struct lwtunnel_encap_ops seg6_iptun_ops = {
7546c8702c6SDavid Lebrun 	.build_state = seg6_build_state,
7556c8702c6SDavid Lebrun 	.destroy_state = seg6_destroy_state,
7566c8702c6SDavid Lebrun 	.output = seg6_output,
7576c8702c6SDavid Lebrun 	.input = seg6_input,
7586c8702c6SDavid Lebrun 	.fill_encap = seg6_fill_encap_info,
7596c8702c6SDavid Lebrun 	.get_encap_size = seg6_encap_nlsize,
7606c8702c6SDavid Lebrun 	.cmp_encap = seg6_encap_cmp,
76188ff7334SRobert Shearman 	.owner = THIS_MODULE,
7626c8702c6SDavid Lebrun };
7636c8702c6SDavid Lebrun 
seg6_iptunnel_init(void)7646c8702c6SDavid Lebrun int __init seg6_iptunnel_init(void)
7656c8702c6SDavid Lebrun {
7666c8702c6SDavid Lebrun 	return lwtunnel_encap_add_ops(&seg6_iptun_ops, LWTUNNEL_ENCAP_SEG6);
7676c8702c6SDavid Lebrun }
7686c8702c6SDavid Lebrun 
seg6_iptunnel_exit(void)7696c8702c6SDavid Lebrun void seg6_iptunnel_exit(void)
7706c8702c6SDavid Lebrun {
7716c8702c6SDavid Lebrun 	lwtunnel_encap_del_ops(&seg6_iptun_ops, LWTUNNEL_ENCAP_SEG6);
7726c8702c6SDavid Lebrun }
773