xref: /openbmc/linux/net/ipv6/tcp_ipv6.c (revision b34e08d5)
1 /*
2  *	TCP over IPv6
3  *	Linux INET6 implementation
4  *
5  *	Authors:
6  *	Pedro Roque		<roque@di.fc.ul.pt>
7  *
8  *	Based on:
9  *	linux/net/ipv4/tcp.c
10  *	linux/net/ipv4/tcp_input.c
11  *	linux/net/ipv4/tcp_output.c
12  *
13  *	Fixes:
14  *	Hideaki YOSHIFUJI	:	sin6_scope_id support
15  *	YOSHIFUJI Hideaki @USAGI and:	Support the IPV6_V6ONLY socket option, which
16  *	Alexey Kuznetsov		allows both IPv4 and IPv6 sockets to bind
17  *					to a single port at the same time.
18  *	YOSHIFUJI Hideaki @USAGI:	convert /proc/net/tcp6 to seq_file.
19  *
20  *	This program is free software; you can redistribute it and/or
21  *      modify it under the terms of the GNU General Public License
22  *      as published by the Free Software Foundation; either version
23  *      2 of the License, or (at your option) any later version.
24  */
25 
26 #include <linux/bottom_half.h>
27 #include <linux/module.h>
28 #include <linux/errno.h>
29 #include <linux/types.h>
30 #include <linux/socket.h>
31 #include <linux/sockios.h>
32 #include <linux/net.h>
33 #include <linux/jiffies.h>
34 #include <linux/in.h>
35 #include <linux/in6.h>
36 #include <linux/netdevice.h>
37 #include <linux/init.h>
38 #include <linux/jhash.h>
39 #include <linux/ipsec.h>
40 #include <linux/times.h>
41 #include <linux/slab.h>
42 #include <linux/uaccess.h>
43 #include <linux/ipv6.h>
44 #include <linux/icmpv6.h>
45 #include <linux/random.h>
46 
47 #include <net/tcp.h>
48 #include <net/ndisc.h>
49 #include <net/inet6_hashtables.h>
50 #include <net/inet6_connection_sock.h>
51 #include <net/ipv6.h>
52 #include <net/transp_v6.h>
53 #include <net/addrconf.h>
54 #include <net/ip6_route.h>
55 #include <net/ip6_checksum.h>
56 #include <net/inet_ecn.h>
57 #include <net/protocol.h>
58 #include <net/xfrm.h>
59 #include <net/snmp.h>
60 #include <net/dsfield.h>
61 #include <net/timewait_sock.h>
62 #include <net/netdma.h>
63 #include <net/inet_common.h>
64 #include <net/secure_seq.h>
65 #include <net/tcp_memcontrol.h>
66 #include <net/busy_poll.h>
67 
68 #include <linux/proc_fs.h>
69 #include <linux/seq_file.h>
70 
71 #include <linux/crypto.h>
72 #include <linux/scatterlist.h>
73 
74 static void	tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb);
75 static void	tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
76 				      struct request_sock *req);
77 
78 static int	tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb);
79 
80 static const struct inet_connection_sock_af_ops ipv6_mapped;
81 static const struct inet_connection_sock_af_ops ipv6_specific;
82 #ifdef CONFIG_TCP_MD5SIG
83 static const struct tcp_sock_af_ops tcp_sock_ipv6_specific;
84 static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific;
85 #else
86 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
87 						   const struct in6_addr *addr)
88 {
89 	return NULL;
90 }
91 #endif
92 
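/* Cache the incoming route on the socket: take a reference on the skb's
 * dst, remember the ingress ifindex and the fib node serial number so
 * the cached route can be revalidated on later packets.
 */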
93 static void inet6_sk_rx_dst_set(struct sock *sk, const struct sk_buff *skb)
94 {
95 	struct dst_entry *dst = skb_dst(skb);
96 	const struct rt6_info *rt = (const struct rt6_info *)dst;
97 
98 	dst_hold(dst);
99 	sk->sk_rx_dst = dst;
100 	inet_sk(sk)->rx_dst_ifindex = skb->skb_iif;
101 	if (rt->rt6i_node)
102 		inet6_sk(sk)->rx_dst_cookie = rt->rt6i_node->fn_sernum;
103 }
104 
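/* Hash the socket into the TCP hash tables unless it is closed.
 * Sockets using the v4-mapped ops are hashed through the IPv4
 * tcp_prot path instead.
 */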
105 static void tcp_v6_hash(struct sock *sk)
106 {
107 	if (sk->sk_state != TCP_CLOSE) {
108 		if (inet_csk(sk)->icsk_af_ops == &ipv6_mapped) {
109 			tcp_prot.hash(sk);
110 			return;
111 		}
112 		local_bh_disable();
113 		__inet6_hash(sk, NULL);
114 		local_bh_enable();
115 	}
116 }
117 
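/* Generate the initial sequence number for a passive connection from
 * the address/port four-tuple of the incoming SYN.
 */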
118 static __u32 tcp_v6_init_sequence(const struct sk_buff *skb)
119 {
120 	return secure_tcpv6_sequence_number(ipv6_hdr(skb)->daddr.s6_addr32,
121 					    ipv6_hdr(skb)->saddr.s6_addr32,
122 					    tcp_hdr(skb)->dest,
123 					    tcp_hdr(skb)->source);
124 }
125 
126 static int tcp_v6_connect(struct sock *sk, struct sockaddr *uaddr,
127 			  int addr_len)
128 {
129 	struct sockaddr_in6 *usin = (struct sockaddr_in6 *) uaddr;
130 	struct inet_sock *inet = inet_sk(sk);
131 	struct inet_connection_sock *icsk = inet_csk(sk);
132 	struct ipv6_pinfo *np = inet6_sk(sk);
133 	struct tcp_sock *tp = tcp_sk(sk);
134 	struct in6_addr *saddr = NULL, *final_p, final;
135 	struct rt6_info *rt;
136 	struct flowi6 fl6;
137 	struct dst_entry *dst;
138 	int addr_type;
139 	int err;
140 
141 	if (addr_len < SIN6_LEN_RFC2133)
142 		return -EINVAL;
143 
144 	if (usin->sin6_family != AF_INET6)
145 		return -EAFNOSUPPORT;
146 
147 	memset(&fl6, 0, sizeof(fl6));
148 
149 	if (np->sndflow) {
150 		fl6.flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
151 		IP6_ECN_flow_init(fl6.flowlabel);
152 		if (fl6.flowlabel&IPV6_FLOWLABEL_MASK) {
153 			struct ip6_flowlabel *flowlabel;
154 			flowlabel = fl6_sock_lookup(sk, fl6.flowlabel);
155 			if (flowlabel == NULL)
156 				return -EINVAL;
157 			fl6_sock_release(flowlabel);
158 		}
159 	}
160 
161 	/*
162 	 *	connect() to INADDR_ANY means loopback (BSD'ism).
163 	 */
164 
165 	if (ipv6_addr_any(&usin->sin6_addr))
166 		usin->sin6_addr.s6_addr[15] = 0x1;
167 
168 	addr_type = ipv6_addr_type(&usin->sin6_addr);
169 
170 	if (addr_type & IPV6_ADDR_MULTICAST)
171 		return -ENETUNREACH;
172 
173 	if (addr_type&IPV6_ADDR_LINKLOCAL) {
174 		if (addr_len >= sizeof(struct sockaddr_in6) &&
175 		    usin->sin6_scope_id) {
176 			/* If interface is set while binding, indices
177 			 * must coincide.
178 			 */
179 			if (sk->sk_bound_dev_if &&
180 			    sk->sk_bound_dev_if != usin->sin6_scope_id)
181 				return -EINVAL;
182 
183 			sk->sk_bound_dev_if = usin->sin6_scope_id;
184 		}
185 
186 		/* Connecting to a link-local address requires an interface. */
187 		if (!sk->sk_bound_dev_if)
188 			return -EINVAL;
189 	}
190 
191 	if (tp->rx_opt.ts_recent_stamp &&
192 	    !ipv6_addr_equal(&sk->sk_v6_daddr, &usin->sin6_addr)) {
193 		tp->rx_opt.ts_recent = 0;
194 		tp->rx_opt.ts_recent_stamp = 0;
195 		tp->write_seq = 0;
196 	}
197 
198 	sk->sk_v6_daddr = usin->sin6_addr;
199 	np->flow_label = fl6.flowlabel;
200 
201 	/*
202 	 *	TCP over IPv4
203 	 */
204 
205 	if (addr_type == IPV6_ADDR_MAPPED) {
206 		u32 exthdrlen = icsk->icsk_ext_hdr_len;
207 		struct sockaddr_in sin;
208 
209 		SOCK_DEBUG(sk, "connect: ipv4 mapped\n");
210 
211 		if (__ipv6_only_sock(sk))
212 			return -ENETUNREACH;
213 
214 		sin.sin_family = AF_INET;
215 		sin.sin_port = usin->sin6_port;
216 		sin.sin_addr.s_addr = usin->sin6_addr.s6_addr32[3];
217 
218 		icsk->icsk_af_ops = &ipv6_mapped;
219 		sk->sk_backlog_rcv = tcp_v4_do_rcv;
220 #ifdef CONFIG_TCP_MD5SIG
221 		tp->af_specific = &tcp_sock_ipv6_mapped_specific;
222 #endif
223 
224 		err = tcp_v4_connect(sk, (struct sockaddr *)&sin, sizeof(sin));
225 
226 		if (err) {
227 			icsk->icsk_ext_hdr_len = exthdrlen;
228 			icsk->icsk_af_ops = &ipv6_specific;
229 			sk->sk_backlog_rcv = tcp_v6_do_rcv;
230 #ifdef CONFIG_TCP_MD5SIG
231 			tp->af_specific = &tcp_sock_ipv6_specific;
232 #endif
233 			goto failure;
234 		} else {
235 			ipv6_addr_set_v4mapped(inet->inet_saddr, &np->saddr);
236 			ipv6_addr_set_v4mapped(inet->inet_rcv_saddr,
237 					       &sk->sk_v6_rcv_saddr);
238 		}
239 
240 		return err;
241 	}
242 
243 	if (!ipv6_addr_any(&sk->sk_v6_rcv_saddr))
244 		saddr = &sk->sk_v6_rcv_saddr;
245 
246 	fl6.flowi6_proto = IPPROTO_TCP;
247 	fl6.daddr = sk->sk_v6_daddr;
248 	fl6.saddr = saddr ? *saddr : np->saddr;
249 	fl6.flowi6_oif = sk->sk_bound_dev_if;
250 	fl6.flowi6_mark = sk->sk_mark;
251 	fl6.fl6_dport = usin->sin6_port;
252 	fl6.fl6_sport = inet->inet_sport;
253 
254 	final_p = fl6_update_dst(&fl6, np->opt, &final);
255 
256 	security_sk_classify_flow(sk, flowi6_to_flowi(&fl6));
257 
258 	dst = ip6_dst_lookup_flow(sk, &fl6, final_p);
259 	if (IS_ERR(dst)) {
260 		err = PTR_ERR(dst);
261 		goto failure;
262 	}
263 
264 	if (saddr == NULL) {
265 		saddr = &fl6.saddr;
266 		sk->sk_v6_rcv_saddr = *saddr;
267 	}
268 
269 	/* set the source address */
270 	np->saddr = *saddr;
271 	inet->inet_rcv_saddr = LOOPBACK4_IPV6;
272 
273 	sk->sk_gso_type = SKB_GSO_TCPV6;
274 	__ip6_dst_store(sk, dst, NULL, NULL);
275 
276 	rt = (struct rt6_info *) dst;
277 	if (tcp_death_row.sysctl_tw_recycle &&
278 	    !tp->rx_opt.ts_recent_stamp &&
279 	    ipv6_addr_equal(&rt->rt6i_dst.addr, &sk->sk_v6_daddr))
280 		tcp_fetch_timewait_stamp(sk, dst);
281 
282 	icsk->icsk_ext_hdr_len = 0;
283 	if (np->opt)
284 		icsk->icsk_ext_hdr_len = (np->opt->opt_flen +
285 					  np->opt->opt_nflen);
286 
287 	tp->rx_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
288 
289 	inet->inet_dport = usin->sin6_port;
290 
291 	tcp_set_state(sk, TCP_SYN_SENT);
292 	err = inet6_hash_connect(&tcp_death_row, sk);
293 	if (err)
294 		goto late_failure;
295 
296 	if (!tp->write_seq && likely(!tp->repair))
297 		tp->write_seq = secure_tcpv6_sequence_number(np->saddr.s6_addr32,
298 							     sk->sk_v6_daddr.s6_addr32,
299 							     inet->inet_sport,
300 							     inet->inet_dport);
301 
302 	err = tcp_connect(sk);
303 	if (err)
304 		goto late_failure;
305 
306 	return 0;
307 
308 late_failure:
309 	tcp_set_state(sk, TCP_CLOSE);
310 	__sk_dst_reset(sk);
311 failure:
312 	inet->inet_dport = 0;
313 	sk->sk_route_caps = 0;
314 	return err;
315 }
316 
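/* Handle a Packet Too Big notification whose new MTU was stored in
 * tp->mtu_info: update the cached route's PMTU and, if our MSS is now
 * too large, shrink it and retransmit the affected segments.
 */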
317 static void tcp_v6_mtu_reduced(struct sock *sk)
318 {
319 	struct dst_entry *dst;
320 
321 	if ((1 << sk->sk_state) & (TCPF_LISTEN | TCPF_CLOSE))
322 		return;
323 
324 	dst = inet6_csk_update_pmtu(sk, tcp_sk(sk)->mtu_info);
325 	if (!dst)
326 		return;
327 
328 	if (inet_csk(sk)->icsk_pmtu_cookie > dst_mtu(dst)) {
329 		tcp_sync_mss(sk, dst_mtu(dst));
330 		tcp_simple_retransmit(sk);
331 	}
332 }
333 
334 static void tcp_v6_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
335 		u8 type, u8 code, int offset, __be32 info)
336 {
337 	const struct ipv6hdr *hdr = (const struct ipv6hdr *)skb->data;
338 	const struct tcphdr *th = (struct tcphdr *)(skb->data+offset);
339 	struct ipv6_pinfo *np;
340 	struct sock *sk;
341 	int err;
342 	struct tcp_sock *tp;
343 	__u32 seq;
344 	struct net *net = dev_net(skb->dev);
345 
346 	sk = inet6_lookup(net, &tcp_hashinfo, &hdr->daddr,
347 			th->dest, &hdr->saddr, th->source, skb->dev->ifindex);
348 
349 	if (sk == NULL) {
350 		ICMP6_INC_STATS_BH(net, __in6_dev_get(skb->dev),
351 				   ICMP6_MIB_INERRORS);
352 		return;
353 	}
354 
355 	if (sk->sk_state == TCP_TIME_WAIT) {
356 		inet_twsk_put(inet_twsk(sk));
357 		return;
358 	}
359 
360 	bh_lock_sock(sk);
361 	if (sock_owned_by_user(sk) && type != ICMPV6_PKT_TOOBIG)
362 		NET_INC_STATS_BH(net, LINUX_MIB_LOCKDROPPEDICMPS);
363 
364 	if (sk->sk_state == TCP_CLOSE)
365 		goto out;
366 
367 	if (ipv6_hdr(skb)->hop_limit < inet6_sk(sk)->min_hopcount) {
368 		NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
369 		goto out;
370 	}
371 
372 	tp = tcp_sk(sk);
373 	seq = ntohl(th->seq);
374 	if (sk->sk_state != TCP_LISTEN &&
375 	    !between(seq, tp->snd_una, tp->snd_nxt)) {
376 		NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
377 		goto out;
378 	}
379 
380 	np = inet6_sk(sk);
381 
382 	if (type == NDISC_REDIRECT) {
383 		struct dst_entry *dst = __sk_dst_check(sk, np->dst_cookie);
384 
385 		if (dst)
386 			dst->ops->redirect(dst, sk, skb);
387 		goto out;
388 	}
389 
390 	if (type == ICMPV6_PKT_TOOBIG) {
391 		/* We are not interested in TCP_LISTEN and open_requests
392 		 * (SYN-ACKs sent out by Linux are always < 576 bytes so
393 		 * they should go through unfragmented).
394 		 */
395 		if (sk->sk_state == TCP_LISTEN)
396 			goto out;
397 
398 		if (!ip6_sk_accept_pmtu(sk))
399 			goto out;
400 
401 		tp->mtu_info = ntohl(info);
402 		if (!sock_owned_by_user(sk))
403 			tcp_v6_mtu_reduced(sk);
404 		else if (!test_and_set_bit(TCP_MTU_REDUCED_DEFERRED,
405 					   &tp->tsq_flags))
406 			sock_hold(sk);
407 		goto out;
408 	}
409 
410 	icmpv6_err_convert(type, code, &err);
411 
412 	/* Might be for a request_sock */
413 	switch (sk->sk_state) {
414 		struct request_sock *req, **prev;
415 	case TCP_LISTEN:
416 		if (sock_owned_by_user(sk))
417 			goto out;
418 
419 		req = inet6_csk_search_req(sk, &prev, th->dest, &hdr->daddr,
420 					   &hdr->saddr, inet6_iif(skb));
421 		if (!req)
422 			goto out;
423 
424 		/* ICMPs are not backlogged, hence we cannot get
425 		 * an established socket here.
426 		 */
427 		WARN_ON(req->sk != NULL);
428 
429 		if (seq != tcp_rsk(req)->snt_isn) {
430 			NET_INC_STATS_BH(net, LINUX_MIB_OUTOFWINDOWICMPS);
431 			goto out;
432 		}
433 
434 		inet_csk_reqsk_queue_drop(sk, req, prev);
435 		NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
436 		goto out;
437 
438 	case TCP_SYN_SENT:
439 	case TCP_SYN_RECV:  /* Cannot happen.
440 			       It can, if SYNs are crossed. --ANK */
441 		if (!sock_owned_by_user(sk)) {
442 			sk->sk_err = err;
443 			sk->sk_error_report(sk);		/* Wake people up to see the error (see connect in sock.c) */
444 
445 			tcp_done(sk);
446 		} else
447 			sk->sk_err_soft = err;
448 		goto out;
449 	}
450 
451 	if (!sock_owned_by_user(sk) && np->recverr) {
452 		sk->sk_err = err;
453 		sk->sk_error_report(sk);
454 	} else
455 		sk->sk_err_soft = err;
456 
457 out:
458 	bh_unlock_sock(sk);
459 	sock_put(sk);
460 }
461 
462 
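/* Route (if no dst was passed in) and transmit a SYN-ACK for @req.
 * Returns a net_xmit error code on transmit, or -ENOMEM when routing
 * or skb allocation fails.
 */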
463 static int tcp_v6_send_synack(struct sock *sk, struct dst_entry *dst,
464 			      struct flowi6 *fl6,
465 			      struct request_sock *req,
466 			      u16 queue_mapping)
467 {
468 	struct inet_request_sock *ireq = inet_rsk(req);
469 	struct ipv6_pinfo *np = inet6_sk(sk);
470 	struct sk_buff *skb;
471 	int err = -ENOMEM;
472 
473 	/* First, grab a route. */
474 	if (!dst && (dst = inet6_csk_route_req(sk, fl6, req)) == NULL)
475 		goto done;
476 
477 	skb = tcp_make_synack(sk, dst, req, NULL);
478 
479 	if (skb) {
480 		__tcp_v6_send_check(skb, &ireq->ir_v6_loc_addr,
481 				    &ireq->ir_v6_rmt_addr);
482 
483 		fl6->daddr = ireq->ir_v6_rmt_addr;
484 		if (np->repflow && (ireq->pktopts != NULL))
485 			fl6->flowlabel = ip6_flowlabel(ipv6_hdr(ireq->pktopts));
486 
487 		skb_set_queue_mapping(skb, queue_mapping);
488 		err = ip6_xmit(sk, skb, fl6, np->opt, np->tclass);
489 		err = net_xmit_eval(err);
490 	}
491 
492 done:
493 	return err;
494 }
495 
496 static int tcp_v6_rtx_synack(struct sock *sk, struct request_sock *req)
497 {
498 	struct flowi6 fl6;
499 	int res;
500 
501 	res = tcp_v6_send_synack(sk, NULL, &fl6, req, 0);
502 	if (!res) {
503 		TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_RETRANSSEGS);
504 		NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPSYNRETRANS);
505 	}
506 	return res;
507 }
508 
509 static void tcp_v6_reqsk_destructor(struct request_sock *req)
510 {
511 	kfree_skb(inet_rsk(req)->pktopts);
512 }
513 
514 #ifdef CONFIG_TCP_MD5SIG
515 static struct tcp_md5sig_key *tcp_v6_md5_do_lookup(struct sock *sk,
516 						   const struct in6_addr *addr)
517 {
518 	return tcp_md5_do_lookup(sk, (union tcp_md5_addr *)addr, AF_INET6);
519 }
520 
521 static struct tcp_md5sig_key *tcp_v6_md5_lookup(struct sock *sk,
522 						struct sock *addr_sk)
523 {
524 	return tcp_v6_md5_do_lookup(sk, &addr_sk->sk_v6_daddr);
525 }
526 
527 static struct tcp_md5sig_key *tcp_v6_reqsk_md5_lookup(struct sock *sk,
528 						      struct request_sock *req)
529 {
530 	return tcp_v6_md5_do_lookup(sk, &inet_rsk(req)->ir_v6_rmt_addr);
531 }
532 
533 static int tcp_v6_parse_md5_keys(struct sock *sk, char __user *optval,
534 				 int optlen)
535 {
536 	struct tcp_md5sig cmd;
537 	struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *)&cmd.tcpm_addr;
538 
539 	if (optlen < sizeof(cmd))
540 		return -EINVAL;
541 
542 	if (copy_from_user(&cmd, optval, sizeof(cmd)))
543 		return -EFAULT;
544 
545 	if (sin6->sin6_family != AF_INET6)
546 		return -EINVAL;
547 
548 	if (!cmd.tcpm_keylen) {
549 		if (ipv6_addr_v4mapped(&sin6->sin6_addr))
550 			return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
551 					      AF_INET);
552 		return tcp_md5_do_del(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
553 				      AF_INET6);
554 	}
555 
556 	if (cmd.tcpm_keylen > TCP_MD5SIG_MAXKEYLEN)
557 		return -EINVAL;
558 
559 	if (ipv6_addr_v4mapped(&sin6->sin6_addr))
560 		return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr.s6_addr32[3],
561 				      AF_INET, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
562 
563 	return tcp_md5_do_add(sk, (union tcp_md5_addr *)&sin6->sin6_addr,
564 			      AF_INET6, cmd.tcpm_key, cmd.tcpm_keylen, GFP_KERNEL);
565 }
566 
567 static int tcp_v6_md5_hash_pseudoheader(struct tcp_md5sig_pool *hp,
568 					const struct in6_addr *daddr,
569 					const struct in6_addr *saddr, int nbytes)
570 {
571 	struct tcp6_pseudohdr *bp;
572 	struct scatterlist sg;
573 
574 	bp = &hp->md5_blk.ip6;
575 	/* 1. TCP pseudo-header (RFC2460) */
576 	bp->saddr = *saddr;
577 	bp->daddr = *daddr;
578 	bp->protocol = cpu_to_be32(IPPROTO_TCP);
579 	bp->len = cpu_to_be32(nbytes);
580 
581 	sg_init_one(&sg, bp, sizeof(*bp));
582 	return crypto_hash_update(&hp->md5_desc, &sg, sizeof(*bp));
583 }
584 
585 static int tcp_v6_md5_hash_hdr(char *md5_hash, struct tcp_md5sig_key *key,
586 			       const struct in6_addr *daddr, struct in6_addr *saddr,
587 			       const struct tcphdr *th)
588 {
589 	struct tcp_md5sig_pool *hp;
590 	struct hash_desc *desc;
591 
592 	hp = tcp_get_md5sig_pool();
593 	if (!hp)
594 		goto clear_hash_noput;
595 	desc = &hp->md5_desc;
596 
597 	if (crypto_hash_init(desc))
598 		goto clear_hash;
599 	if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, th->doff << 2))
600 		goto clear_hash;
601 	if (tcp_md5_hash_header(hp, th))
602 		goto clear_hash;
603 	if (tcp_md5_hash_key(hp, key))
604 		goto clear_hash;
605 	if (crypto_hash_final(desc, md5_hash))
606 		goto clear_hash;
607 
608 	tcp_put_md5sig_pool();
609 	return 0;
610 
611 clear_hash:
612 	tcp_put_md5sig_pool();
613 clear_hash_noput:
614 	memset(md5_hash, 0, 16);
615 	return 1;
616 }
617 
618 static int tcp_v6_md5_hash_skb(char *md5_hash, struct tcp_md5sig_key *key,
619 			       const struct sock *sk,
620 			       const struct request_sock *req,
621 			       const struct sk_buff *skb)
622 {
623 	const struct in6_addr *saddr, *daddr;
624 	struct tcp_md5sig_pool *hp;
625 	struct hash_desc *desc;
626 	const struct tcphdr *th = tcp_hdr(skb);
627 
628 	if (sk) {
629 		saddr = &inet6_sk(sk)->saddr;
630 		daddr = &sk->sk_v6_daddr;
631 	} else if (req) {
632 		saddr = &inet_rsk(req)->ir_v6_loc_addr;
633 		daddr = &inet_rsk(req)->ir_v6_rmt_addr;
634 	} else {
635 		const struct ipv6hdr *ip6h = ipv6_hdr(skb);
636 		saddr = &ip6h->saddr;
637 		daddr = &ip6h->daddr;
638 	}
639 
640 	hp = tcp_get_md5sig_pool();
641 	if (!hp)
642 		goto clear_hash_noput;
643 	desc = &hp->md5_desc;
644 
645 	if (crypto_hash_init(desc))
646 		goto clear_hash;
647 
648 	if (tcp_v6_md5_hash_pseudoheader(hp, daddr, saddr, skb->len))
649 		goto clear_hash;
650 	if (tcp_md5_hash_header(hp, th))
651 		goto clear_hash;
652 	if (tcp_md5_hash_skb_data(hp, skb, th->doff << 2))
653 		goto clear_hash;
654 	if (tcp_md5_hash_key(hp, key))
655 		goto clear_hash;
656 	if (crypto_hash_final(desc, md5_hash))
657 		goto clear_hash;
658 
659 	tcp_put_md5sig_pool();
660 	return 0;
661 
662 clear_hash:
663 	tcp_put_md5sig_pool();
664 clear_hash_noput:
665 	memset(md5_hash, 0, 16);
666 	return 1;
667 }
668 
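/* Verify the TCP MD5 signature option of an incoming segment against
 * the key configured for the peer address. Returns 1 (drop) when a
 * signature is missing, unexpected, or does not match; 0 otherwise.
 */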
669 static int tcp_v6_inbound_md5_hash(struct sock *sk, const struct sk_buff *skb)
670 {
671 	const __u8 *hash_location = NULL;
672 	struct tcp_md5sig_key *hash_expected;
673 	const struct ipv6hdr *ip6h = ipv6_hdr(skb);
674 	const struct tcphdr *th = tcp_hdr(skb);
675 	int genhash;
676 	u8 newhash[16];
677 
678 	hash_expected = tcp_v6_md5_do_lookup(sk, &ip6h->saddr);
679 	hash_location = tcp_parse_md5sig_option(th);
680 
681 	/* We've parsed the options - do we have a hash? */
682 	if (!hash_expected && !hash_location)
683 		return 0;
684 
685 	if (hash_expected && !hash_location) {
686 		NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5NOTFOUND);
687 		return 1;
688 	}
689 
690 	if (!hash_expected && hash_location) {
691 		NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_TCPMD5UNEXPECTED);
692 		return 1;
693 	}
694 
695 	/* check the signature */
696 	genhash = tcp_v6_md5_hash_skb(newhash,
697 				      hash_expected,
698 				      NULL, NULL, skb);
699 
700 	if (genhash || memcmp(hash_location, newhash, 16) != 0) {
701 		net_info_ratelimited("MD5 Hash %s for [%pI6c]:%u->[%pI6c]:%u\n",
702 				     genhash ? "failed" : "mismatch",
703 				     &ip6h->saddr, ntohs(th->source),
704 				     &ip6h->daddr, ntohs(th->dest));
705 		return 1;
706 	}
707 	return 0;
708 }
709 #endif
710 
711 struct request_sock_ops tcp6_request_sock_ops __read_mostly = {
712 	.family		=	AF_INET6,
713 	.obj_size	=	sizeof(struct tcp6_request_sock),
714 	.rtx_syn_ack	=	tcp_v6_rtx_synack,
715 	.send_ack	=	tcp_v6_reqsk_send_ack,
716 	.destructor	=	tcp_v6_reqsk_destructor,
717 	.send_reset	=	tcp_v6_send_reset,
718 	.syn_ack_timeout =	tcp_syn_ack_timeout,
719 };
720 
721 #ifdef CONFIG_TCP_MD5SIG
722 static const struct tcp_request_sock_ops tcp_request_sock_ipv6_ops = {
723 	.md5_lookup	=	tcp_v6_reqsk_md5_lookup,
724 	.calc_md5_hash	=	tcp_v6_md5_hash_skb,
725 };
726 #endif
727 
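/* Build and send a bare reply segment (RST when @rst is set, ACK
 * otherwise) in response to @skb, using the per-namespace control
 * socket. Addresses and ports are swapped from the incoming segment;
 * timestamp and MD5 signature options are appended when requested.
 */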
728 static void tcp_v6_send_response(struct sk_buff *skb, u32 seq, u32 ack, u32 win,
729 				 u32 tsval, u32 tsecr, int oif,
730 				 struct tcp_md5sig_key *key, int rst, u8 tclass,
731 				 u32 label)
732 {
733 	const struct tcphdr *th = tcp_hdr(skb);
734 	struct tcphdr *t1;
735 	struct sk_buff *buff;
736 	struct flowi6 fl6;
737 	struct net *net = dev_net(skb_dst(skb)->dev);
738 	struct sock *ctl_sk = net->ipv6.tcp_sk;
739 	unsigned int tot_len = sizeof(struct tcphdr);
740 	struct dst_entry *dst;
741 	__be32 *topt;
742 
743 	if (tsecr)
744 		tot_len += TCPOLEN_TSTAMP_ALIGNED;
745 #ifdef CONFIG_TCP_MD5SIG
746 	if (key)
747 		tot_len += TCPOLEN_MD5SIG_ALIGNED;
748 #endif
749 
750 	buff = alloc_skb(MAX_HEADER + sizeof(struct ipv6hdr) + tot_len,
751 			 GFP_ATOMIC);
752 	if (buff == NULL)
753 		return;
754 
755 	skb_reserve(buff, MAX_HEADER + sizeof(struct ipv6hdr) + tot_len);
756 
757 	t1 = (struct tcphdr *) skb_push(buff, tot_len);
758 	skb_reset_transport_header(buff);
759 
760 	/* Swap the source and the destination. */
761 	memset(t1, 0, sizeof(*t1));
762 	t1->dest = th->source;
763 	t1->source = th->dest;
764 	t1->doff = tot_len / 4;
765 	t1->seq = htonl(seq);
766 	t1->ack_seq = htonl(ack);
767 	t1->ack = !rst || !th->ack;
768 	t1->rst = rst;
769 	t1->window = htons(win);
770 
771 	topt = (__be32 *)(t1 + 1);
772 
773 	if (tsecr) {
774 		*topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
775 				(TCPOPT_TIMESTAMP << 8) | TCPOLEN_TIMESTAMP);
776 		*topt++ = htonl(tsval);
777 		*topt++ = htonl(tsecr);
778 	}
779 
780 #ifdef CONFIG_TCP_MD5SIG
781 	if (key) {
782 		*topt++ = htonl((TCPOPT_NOP << 24) | (TCPOPT_NOP << 16) |
783 				(TCPOPT_MD5SIG << 8) | TCPOLEN_MD5SIG);
784 		tcp_v6_md5_hash_hdr((__u8 *)topt, key,
785 				    &ipv6_hdr(skb)->saddr,
786 				    &ipv6_hdr(skb)->daddr, t1);
787 	}
788 #endif
789 
790 	memset(&fl6, 0, sizeof(fl6));
791 	fl6.daddr = ipv6_hdr(skb)->saddr;
792 	fl6.saddr = ipv6_hdr(skb)->daddr;
793 	fl6.flowlabel = label;
794 
795 	buff->ip_summed = CHECKSUM_PARTIAL;
796 	buff->csum = 0;
797 
798 	__tcp_v6_send_check(buff, &fl6.saddr, &fl6.daddr);
799 
800 	fl6.flowi6_proto = IPPROTO_TCP;
801 	if (rt6_need_strict(&fl6.daddr) && !oif)
802 		fl6.flowi6_oif = inet6_iif(skb);
803 	else
804 		fl6.flowi6_oif = oif;
805 	fl6.fl6_dport = t1->dest;
806 	fl6.fl6_sport = t1->source;
807 	security_skb_classify_flow(skb, flowi6_to_flowi(&fl6));
808 
809 	/* Pass a socket to ip6_dst_lookup even when it is for a RST;
810 	 * the underlying function will use it to retrieve the network
811 	 * namespace.
812 	 */
813 	dst = ip6_dst_lookup_flow(ctl_sk, &fl6, NULL);
814 	if (!IS_ERR(dst)) {
815 		skb_dst_set(buff, dst);
816 		ip6_xmit(ctl_sk, buff, &fl6, NULL, tclass);
817 		TCP_INC_STATS_BH(net, TCP_MIB_OUTSEGS);
818 		if (rst)
819 			TCP_INC_STATS_BH(net, TCP_MIB_OUTRSTS);
820 		return;
821 	}
822 
823 	kfree_skb(buff);
824 }
825 
826 static void tcp_v6_send_reset(struct sock *sk, struct sk_buff *skb)
827 {
828 	const struct tcphdr *th = tcp_hdr(skb);
829 	u32 seq = 0, ack_seq = 0;
830 	struct tcp_md5sig_key *key = NULL;
831 #ifdef CONFIG_TCP_MD5SIG
832 	const __u8 *hash_location = NULL;
833 	struct ipv6hdr *ipv6h = ipv6_hdr(skb);
834 	unsigned char newhash[16];
835 	int genhash;
836 	struct sock *sk1 = NULL;
837 #endif
838 	int oif;
839 
840 	if (th->rst)
841 		return;
842 
843 	if (!ipv6_unicast_destination(skb))
844 		return;
845 
846 #ifdef CONFIG_TCP_MD5SIG
847 	hash_location = tcp_parse_md5sig_option(th);
848 	if (!sk && hash_location) {
849 		/*
850 		 * The active side is lost. Try to find the listening socket
851 		 * through the source port, then find the md5 key through the
852 		 * listening socket. We do not lose security here: the
853 		 * incoming packet is checked with the md5 hash of the key we
854 		 * find, and no RST is generated if the hash doesn't match.
855 		 */
856 		sk1 = inet6_lookup_listener(dev_net(skb_dst(skb)->dev),
857 					   &tcp_hashinfo, &ipv6h->saddr,
858 					   th->source, &ipv6h->daddr,
859 					   ntohs(th->source), inet6_iif(skb));
860 		if (!sk1)
861 			return;
862 
863 		rcu_read_lock();
864 		key = tcp_v6_md5_do_lookup(sk1, &ipv6h->saddr);
865 		if (!key)
866 			goto release_sk1;
867 
868 		genhash = tcp_v6_md5_hash_skb(newhash, key, NULL, NULL, skb);
869 		if (genhash || memcmp(hash_location, newhash, 16) != 0)
870 			goto release_sk1;
871 	} else {
872 		key = sk ? tcp_v6_md5_do_lookup(sk, &ipv6h->saddr) : NULL;
873 	}
874 #endif
875 
876 	if (th->ack)
877 		seq = ntohl(th->ack_seq);
878 	else
879 		ack_seq = ntohl(th->seq) + th->syn + th->fin + skb->len -
880 			  (th->doff << 2);
881 
882 	oif = sk ? sk->sk_bound_dev_if : 0;
883 	tcp_v6_send_response(skb, seq, ack_seq, 0, 0, 0, oif, key, 1, 0, 0);
884 
885 #ifdef CONFIG_TCP_MD5SIG
886 release_sk1:
887 	if (sk1) {
888 		rcu_read_unlock();
889 		sock_put(sk1);
890 	}
891 #endif
892 }
893 
894 static void tcp_v6_send_ack(struct sk_buff *skb, u32 seq, u32 ack,
895 			    u32 win, u32 tsval, u32 tsecr, int oif,
896 			    struct tcp_md5sig_key *key, u8 tclass,
897 			    u32 label)
898 {
899 	tcp_v6_send_response(skb, seq, ack, win, tsval, tsecr, oif, key, 0, tclass,
900 			     label);
901 }
902 
903 static void tcp_v6_timewait_ack(struct sock *sk, struct sk_buff *skb)
904 {
905 	struct inet_timewait_sock *tw = inet_twsk(sk);
906 	struct tcp_timewait_sock *tcptw = tcp_twsk(sk);
907 
908 	tcp_v6_send_ack(skb, tcptw->tw_snd_nxt, tcptw->tw_rcv_nxt,
909 			tcptw->tw_rcv_wnd >> tw->tw_rcv_wscale,
910 			tcp_time_stamp + tcptw->tw_ts_offset,
911 			tcptw->tw_ts_recent, tw->tw_bound_dev_if, tcp_twsk_md5_key(tcptw),
912 			tw->tw_tclass, (tw->tw_flowlabel << 12));
913 
914 	inet_twsk_put(tw);
915 }
916 
917 static void tcp_v6_reqsk_send_ack(struct sock *sk, struct sk_buff *skb,
918 				  struct request_sock *req)
919 {
920 	tcp_v6_send_ack(skb, tcp_rsk(req)->snt_isn + 1, tcp_rsk(req)->rcv_isn + 1,
921 			req->rcv_wnd, tcp_time_stamp, req->ts_recent, sk->sk_bound_dev_if,
922 			tcp_v6_md5_do_lookup(sk, &ipv6_hdr(skb)->daddr),
923 			0, 0);
924 }
925 
926 
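/* For a segment arriving on a listening socket, look for a matching
 * pending request or an already established/timewait socket; fall back
 * to SYN cookie validation for non-SYN segments (ACKs) when
 * CONFIG_SYN_COOKIES is enabled.
 */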
927 static struct sock *tcp_v6_hnd_req(struct sock *sk, struct sk_buff *skb)
928 {
929 	struct request_sock *req, **prev;
930 	const struct tcphdr *th = tcp_hdr(skb);
931 	struct sock *nsk;
932 
933 	/* Find possible connection requests. */
934 	req = inet6_csk_search_req(sk, &prev, th->source,
935 				   &ipv6_hdr(skb)->saddr,
936 				   &ipv6_hdr(skb)->daddr, inet6_iif(skb));
937 	if (req)
938 		return tcp_check_req(sk, skb, req, prev, false);
939 
940 	nsk = __inet6_lookup_established(sock_net(sk), &tcp_hashinfo,
941 			&ipv6_hdr(skb)->saddr, th->source,
942 			&ipv6_hdr(skb)->daddr, ntohs(th->dest), inet6_iif(skb));
943 
944 	if (nsk) {
945 		if (nsk->sk_state != TCP_TIME_WAIT) {
946 			bh_lock_sock(nsk);
947 			return nsk;
948 		}
949 		inet_twsk_put(inet_twsk(nsk));
950 		return NULL;
951 	}
952 
953 #ifdef CONFIG_SYN_COOKIES
954 	if (!th->syn)
955 		sk = cookie_v6_check(sk, skb);
956 #endif
957 	return sk;
958 }
959 
960 /* FIXME: this is substantially similar to the ipv4 code.
961  * Can some kind of merge be done? -- erics
962  */
963 static int tcp_v6_conn_request(struct sock *sk, struct sk_buff *skb)
964 {
965 	struct tcp_options_received tmp_opt;
966 	struct request_sock *req;
967 	struct inet_request_sock *ireq;
968 	struct ipv6_pinfo *np = inet6_sk(sk);
969 	struct tcp_sock *tp = tcp_sk(sk);
970 	__u32 isn = TCP_SKB_CB(skb)->when;
971 	struct dst_entry *dst = NULL;
972 	struct flowi6 fl6;
973 	bool want_cookie = false;
974 
975 	if (skb->protocol == htons(ETH_P_IP))
976 		return tcp_v4_conn_request(sk, skb);
977 
978 	if (!ipv6_unicast_destination(skb))
979 		goto drop;
980 
981 	if ((sysctl_tcp_syncookies == 2 ||
982 	     inet_csk_reqsk_queue_is_full(sk)) && !isn) {
983 		want_cookie = tcp_syn_flood_action(sk, skb, "TCPv6");
984 		if (!want_cookie)
985 			goto drop;
986 	}
987 
988 	if (sk_acceptq_is_full(sk) && inet_csk_reqsk_queue_young(sk) > 1) {
989 		NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
990 		goto drop;
991 	}
992 
993 	req = inet6_reqsk_alloc(&tcp6_request_sock_ops);
994 	if (req == NULL)
995 		goto drop;
996 
997 #ifdef CONFIG_TCP_MD5SIG
998 	tcp_rsk(req)->af_specific = &tcp_request_sock_ipv6_ops;
999 #endif
1000 
1001 	tcp_clear_options(&tmp_opt);
1002 	tmp_opt.mss_clamp = IPV6_MIN_MTU - sizeof(struct tcphdr) - sizeof(struct ipv6hdr);
1003 	tmp_opt.user_mss = tp->rx_opt.user_mss;
1004 	tcp_parse_options(skb, &tmp_opt, 0, NULL);
1005 
1006 	if (want_cookie && !tmp_opt.saw_tstamp)
1007 		tcp_clear_options(&tmp_opt);
1008 
1009 	tmp_opt.tstamp_ok = tmp_opt.saw_tstamp;
1010 	tcp_openreq_init(req, &tmp_opt, skb);
1011 
1012 	ireq = inet_rsk(req);
1013 	ireq->ir_v6_rmt_addr = ipv6_hdr(skb)->saddr;
1014 	ireq->ir_v6_loc_addr = ipv6_hdr(skb)->daddr;
1015 	if (!want_cookie || tmp_opt.tstamp_ok)
1016 		TCP_ECN_create_request(req, skb, sock_net(sk));
1017 
1018 	ireq->ir_iif = sk->sk_bound_dev_if;
1019 
1020 	/* So that link-local addresses have meaning */
1021 	if (!sk->sk_bound_dev_if &&
1022 	    ipv6_addr_type(&ireq->ir_v6_rmt_addr) & IPV6_ADDR_LINKLOCAL)
1023 		ireq->ir_iif = inet6_iif(skb);
1024 
1025 	if (!isn) {
1026 		if (ipv6_opt_accepted(sk, skb) ||
1027 		    np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo ||
1028 		    np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim ||
1029 		    np->repflow) {
1030 			atomic_inc(&skb->users);
1031 			ireq->pktopts = skb;
1032 		}
1033 
1034 		if (want_cookie) {
1035 			isn = cookie_v6_init_sequence(sk, skb, &req->mss);
1036 			req->cookie_ts = tmp_opt.tstamp_ok;
1037 			goto have_isn;
1038 		}
1039 
1040 		/* VJ's idea. We save the last timestamp seen
1041 		 * from the destination in the peer table when entering
1042 		 * TIME-WAIT state, and check against it before
1043 		 * accepting a new connection request.
1044 		 *
1045 		 * If "isn" is not zero, this request hit an alive
1046 		 * timewait bucket, so all the necessary checks
1047 		 * are made in the function processing the timewait state.
1048 		 */
1049 		if (tmp_opt.saw_tstamp &&
1050 		    tcp_death_row.sysctl_tw_recycle &&
1051 		    (dst = inet6_csk_route_req(sk, &fl6, req)) != NULL) {
1052 			if (!tcp_peer_is_proven(req, dst, true)) {
1053 				NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_PAWSPASSIVEREJECTED);
1054 				goto drop_and_release;
1055 			}
1056 		}
1057 		/* Kill the following clause if you dislike this approach. */
1058 		else if (!sysctl_tcp_syncookies &&
1059 			 (sysctl_max_syn_backlog - inet_csk_reqsk_queue_len(sk) <
1060 			  (sysctl_max_syn_backlog >> 2)) &&
1061 			 !tcp_peer_is_proven(req, dst, false)) {
1062 			/* Without syncookies, the last quarter of the
1063 			 * backlog is filled with destinations
1064 			 * proven to be alive.
1065 			 * It means that we continue to communicate
1066 			 * with destinations already remembered up to
1067 			 * the moment of the synflood.
1068 			 */
1069 			LIMIT_NETDEBUG(KERN_DEBUG "TCP: drop open request from %pI6/%u\n",
1070 				       &ireq->ir_v6_rmt_addr, ntohs(tcp_hdr(skb)->source));
1071 			goto drop_and_release;
1072 		}
1073 
1074 		isn = tcp_v6_init_sequence(skb);
1075 	}
1076 have_isn:
1077 	tcp_rsk(req)->snt_isn = isn;
1078 
1079 	if (security_inet_conn_request(sk, skb, req))
1080 		goto drop_and_release;
1081 
1082 	if (tcp_v6_send_synack(sk, dst, &fl6, req,
1083 			       skb_get_queue_mapping(skb)) ||
1084 	    want_cookie)
1085 		goto drop_and_free;
1086 
1087 	tcp_rsk(req)->snt_synack = tcp_time_stamp;
1088 	tcp_rsk(req)->listener = NULL;
1089 	inet6_csk_reqsk_queue_hash_add(sk, req, TCP_TIMEOUT_INIT);
1090 	return 0;
1091 
1092 drop_and_release:
1093 	dst_release(dst);
1094 drop_and_free:
1095 	reqsk_free(req);
1096 drop:
1097 	NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1098 	return 0; /* don't send reset */
1099 }
1100 
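/* Create the child socket once the 3-way handshake completes.
 * v4-mapped requests are handed to tcp_v4_syn_recv_sock() and the
 * result converted; native IPv6 children inherit the route, the IPv6
 * options and (if configured) the MD5 key from the listener.
 */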
1101 static struct sock *tcp_v6_syn_recv_sock(struct sock *sk, struct sk_buff *skb,
1102 					 struct request_sock *req,
1103 					 struct dst_entry *dst)
1104 {
1105 	struct inet_request_sock *ireq;
1106 	struct ipv6_pinfo *newnp, *np = inet6_sk(sk);
1107 	struct tcp6_sock *newtcp6sk;
1108 	struct inet_sock *newinet;
1109 	struct tcp_sock *newtp;
1110 	struct sock *newsk;
1111 #ifdef CONFIG_TCP_MD5SIG
1112 	struct tcp_md5sig_key *key;
1113 #endif
1114 	struct flowi6 fl6;
1115 
1116 	if (skb->protocol == htons(ETH_P_IP)) {
1117 		/*
1118 		 *	v6 mapped
1119 		 */
1120 
1121 		newsk = tcp_v4_syn_recv_sock(sk, skb, req, dst);
1122 
1123 		if (newsk == NULL)
1124 			return NULL;
1125 
1126 		newtcp6sk = (struct tcp6_sock *)newsk;
1127 		inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1128 
1129 		newinet = inet_sk(newsk);
1130 		newnp = inet6_sk(newsk);
1131 		newtp = tcp_sk(newsk);
1132 
1133 		memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1134 
1135 		ipv6_addr_set_v4mapped(newinet->inet_daddr, &newsk->sk_v6_daddr);
1136 
1137 		ipv6_addr_set_v4mapped(newinet->inet_saddr, &newnp->saddr);
1138 
1139 		newsk->sk_v6_rcv_saddr = newnp->saddr;
1140 
1141 		inet_csk(newsk)->icsk_af_ops = &ipv6_mapped;
1142 		newsk->sk_backlog_rcv = tcp_v4_do_rcv;
1143 #ifdef CONFIG_TCP_MD5SIG
1144 		newtp->af_specific = &tcp_sock_ipv6_mapped_specific;
1145 #endif
1146 
1147 		newnp->ipv6_ac_list = NULL;
1148 		newnp->ipv6_fl_list = NULL;
1149 		newnp->pktoptions  = NULL;
1150 		newnp->opt	   = NULL;
1151 		newnp->mcast_oif   = inet6_iif(skb);
1152 		newnp->mcast_hops  = ipv6_hdr(skb)->hop_limit;
1153 		newnp->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(skb));
1154 		if (np->repflow)
1155 			newnp->flow_label = ip6_flowlabel(ipv6_hdr(skb));
1156 
1157 		/*
1158 		 * No need to charge this sock to the relevant IPv6 refcnt debug socks count
1159 		 * here, tcp_create_openreq_child now does this for us, see the comment in
1160 		 * that function for the gory details. -acme
1161 		 */
1162 
1163 		/* This is a tricky place. Until this moment the IPv4 TCP code
1164 		   worked with the IPv6 icsk.icsk_af_ops.
1165 		   Sync it now.
1166 		 */
1167 		tcp_sync_mss(newsk, inet_csk(newsk)->icsk_pmtu_cookie);
1168 
1169 		return newsk;
1170 	}
1171 
1172 	ireq = inet_rsk(req);
1173 
1174 	if (sk_acceptq_is_full(sk))
1175 		goto out_overflow;
1176 
1177 	if (!dst) {
1178 		dst = inet6_csk_route_req(sk, &fl6, req);
1179 		if (!dst)
1180 			goto out;
1181 	}
1182 
1183 	newsk = tcp_create_openreq_child(sk, req, skb);
1184 	if (newsk == NULL)
1185 		goto out_nonewsk;
1186 
1187 	/*
1188 	 * No need to charge this sock to the relevant IPv6 refcnt debug socks
1189 	 * count here, tcp_create_openreq_child now does this for us, see the
1190 	 * comment in that function for the gory details. -acme
1191 	 */
1192 
1193 	newsk->sk_gso_type = SKB_GSO_TCPV6;
1194 	__ip6_dst_store(newsk, dst, NULL, NULL);
1195 	inet6_sk_rx_dst_set(newsk, skb);
1196 
1197 	newtcp6sk = (struct tcp6_sock *)newsk;
1198 	inet_sk(newsk)->pinet6 = &newtcp6sk->inet6;
1199 
1200 	newtp = tcp_sk(newsk);
1201 	newinet = inet_sk(newsk);
1202 	newnp = inet6_sk(newsk);
1203 
1204 	memcpy(newnp, np, sizeof(struct ipv6_pinfo));
1205 
1206 	newsk->sk_v6_daddr = ireq->ir_v6_rmt_addr;
1207 	newnp->saddr = ireq->ir_v6_loc_addr;
1208 	newsk->sk_v6_rcv_saddr = ireq->ir_v6_loc_addr;
1209 	newsk->sk_bound_dev_if = ireq->ir_iif;
1210 
1211 	/* Now IPv6 options...
1212 
1213 	   First: no IPv4 options.
1214 	 */
1215 	newinet->inet_opt = NULL;
1216 	newnp->ipv6_ac_list = NULL;
1217 	newnp->ipv6_fl_list = NULL;
1218 
1219 	/* Clone RX bits */
1220 	newnp->rxopt.all = np->rxopt.all;
1221 
1222 	/* Clone pktoptions received with SYN */
1223 	newnp->pktoptions = NULL;
1224 	if (ireq->pktopts != NULL) {
1225 		newnp->pktoptions = skb_clone(ireq->pktopts,
1226 					      sk_gfp_atomic(sk, GFP_ATOMIC));
1227 		consume_skb(ireq->pktopts);
1228 		ireq->pktopts = NULL;
1229 		if (newnp->pktoptions)
1230 			skb_set_owner_r(newnp->pktoptions, newsk);
1231 	}
1232 	newnp->opt	  = NULL;
1233 	newnp->mcast_oif  = inet6_iif(skb);
1234 	newnp->mcast_hops = ipv6_hdr(skb)->hop_limit;
1235 	newnp->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(skb));
1236 	if (np->repflow)
1237 		newnp->flow_label = ip6_flowlabel(ipv6_hdr(skb));
1238 
1239 	/* Clone native IPv6 options from listening socket (if any)
1240 
1241 	   Yes, keeping a reference count would be much more clever,
1242 	   but we do one more thing here: reattach the optmem
1243 	   to newsk.
1244 	 */
1245 	if (np->opt)
1246 		newnp->opt = ipv6_dup_options(newsk, np->opt);
1247 
1248 	inet_csk(newsk)->icsk_ext_hdr_len = 0;
1249 	if (newnp->opt)
1250 		inet_csk(newsk)->icsk_ext_hdr_len = (newnp->opt->opt_nflen +
1251 						     newnp->opt->opt_flen);
1252 
1253 	tcp_sync_mss(newsk, dst_mtu(dst));
1254 	newtp->advmss = dst_metric_advmss(dst);
1255 	if (tcp_sk(sk)->rx_opt.user_mss &&
1256 	    tcp_sk(sk)->rx_opt.user_mss < newtp->advmss)
1257 		newtp->advmss = tcp_sk(sk)->rx_opt.user_mss;
1258 
1259 	tcp_initialize_rcv_mss(newsk);
1260 
1261 	newinet->inet_daddr = newinet->inet_saddr = LOOPBACK4_IPV6;
1262 	newinet->inet_rcv_saddr = LOOPBACK4_IPV6;
1263 
1264 #ifdef CONFIG_TCP_MD5SIG
1265 	/* Copy over the MD5 key from the original socket */
1266 	key = tcp_v6_md5_do_lookup(sk, &newsk->sk_v6_daddr);
1267 	if (key != NULL) {
1268 		/* We're using one, so create a matching key
1269 		 * on the newsk structure. If we fail to get
1270 		 * memory, then we end up not copying the key
1271 		 * across. Shucks.
1272 		 */
1273 		tcp_md5_do_add(newsk, (union tcp_md5_addr *)&newsk->sk_v6_daddr,
1274 			       AF_INET6, key->key, key->keylen,
1275 			       sk_gfp_atomic(sk, GFP_ATOMIC));
1276 	}
1277 #endif
1278 
1279 	if (__inet_inherit_port(sk, newsk) < 0) {
1280 		inet_csk_prepare_forced_close(newsk);
1281 		tcp_done(newsk);
1282 		goto out;
1283 	}
1284 	__inet6_hash(newsk, NULL);
1285 
1286 	return newsk;
1287 
1288 out_overflow:
1289 	NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENOVERFLOWS);
1290 out_nonewsk:
1291 	dst_release(dst);
1292 out:
1293 	NET_INC_STATS_BH(sock_net(sk), LINUX_MIB_LISTENDROPS);
1294 	return NULL;
1295 }
1296 
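/* Check the transport checksum of an incoming segment: verify a
 * device-supplied full checksum immediately; otherwise seed skb->csum
 * with the pseudo-header sum and fully checksum short packets
 * (<= 76 bytes) in software right away.
 */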
1297 static __sum16 tcp_v6_checksum_init(struct sk_buff *skb)
1298 {
1299 	if (skb->ip_summed == CHECKSUM_COMPLETE) {
1300 		if (!tcp_v6_check(skb->len, &ipv6_hdr(skb)->saddr,
1301 				  &ipv6_hdr(skb)->daddr, skb->csum)) {
1302 			skb->ip_summed = CHECKSUM_UNNECESSARY;
1303 			return 0;
1304 		}
1305 	}
1306 
1307 	skb->csum = ~csum_unfold(tcp_v6_check(skb->len,
1308 					      &ipv6_hdr(skb)->saddr,
1309 					      &ipv6_hdr(skb)->daddr, 0));
1310 
1311 	if (skb->len <= 76)
1312 		return __skb_checksum_complete(skb);
1313 	return 0;
1314 }
1315 
1316 /* The socket must have its spinlock held when we get
1317  * here.
1318  *
1319  * We have a potential double-lock case here, so even when
1320  * doing backlog processing we use the BH locking scheme.
1321  * This is because we cannot sleep with the original spinlock
1322  * held.
1323  */
1324 static int tcp_v6_do_rcv(struct sock *sk, struct sk_buff *skb)
1325 {
1326 	struct ipv6_pinfo *np = inet6_sk(sk);
1327 	struct tcp_sock *tp;
1328 	struct sk_buff *opt_skb = NULL;
1329 
1330 	/* Imagine: the socket is IPv6, an IPv4 packet arrives,
1331 	   goes to the IPv4 receive handler and is backlogged.
1332 	   From the backlog it always goes here. Kerboom...
1333 	   Fortunately, tcp_rcv_established and rcv_established
1334 	   handle them correctly, but that is not the case with
1335 	   tcp_v6_hnd_req and tcp_v6_send_reset().   --ANK
1336 	 */
1337 
1338 	if (skb->protocol == htons(ETH_P_IP))
1339 		return tcp_v4_do_rcv(sk, skb);
1340 
1341 #ifdef CONFIG_TCP_MD5SIG
1342 	if (tcp_v6_inbound_md5_hash(sk, skb))
1343 		goto discard;
1344 #endif
1345 
1346 	if (sk_filter(sk, skb))
1347 		goto discard;
1348 
1349 	/*
1350 	 *	socket locking is here for SMP purposes as backlog rcv
1351 	 *	is currently called with bh processing disabled.
1352 	 */
1353 
1354 	/* Do Stevens' IPV6_PKTOPTIONS.
1355 
1356 	   Yes, guys, this is the only place in our code where we
1357 	   can do this without affecting IPv4.
1358 	   The rest of the code is protocol independent,
1359 	   and I do not like the idea of uglifying IPv4.
1360 
1361 	   Actually, the whole idea behind IPV6_PKTOPTIONS
1362 	   does not look very well thought out. For now we latch the
1363 	   options received in the last packet enqueued
1364 	   by tcp. Feel free to propose a better solution.
1365 					       --ANK (980728)
1366 	 */
1367 	if (np->rxopt.all)
1368 		opt_skb = skb_clone(skb, sk_gfp_atomic(sk, GFP_ATOMIC));
1369 
1370 	if (sk->sk_state == TCP_ESTABLISHED) { /* Fast path */
1371 		struct dst_entry *dst = sk->sk_rx_dst;
1372 
1373 		sock_rps_save_rxhash(sk, skb);
1374 		if (dst) {
1375 			if (inet_sk(sk)->rx_dst_ifindex != skb->skb_iif ||
1376 			    dst->ops->check(dst, np->rx_dst_cookie) == NULL) {
1377 				dst_release(dst);
1378 				sk->sk_rx_dst = NULL;
1379 			}
1380 		}
1381 
1382 		tcp_rcv_established(sk, skb, tcp_hdr(skb), skb->len);
1383 		if (opt_skb)
1384 			goto ipv6_pktoptions;
1385 		return 0;
1386 	}
1387 
1388 	if (skb->len < tcp_hdrlen(skb) || tcp_checksum_complete(skb))
1389 		goto csum_err;
1390 
1391 	if (sk->sk_state == TCP_LISTEN) {
1392 		struct sock *nsk = tcp_v6_hnd_req(sk, skb);
1393 		if (!nsk)
1394 			goto discard;
1395 
1396 		/*
1397 		 * Queue it on the new socket if the new socket is active,
1398 		 * otherwise we just short-circuit this and continue with
1399 		 * the new socket.
1400 		 */
1401 		if (nsk != sk) {
1402 			sock_rps_save_rxhash(nsk, skb);
1403 			if (tcp_child_process(sk, nsk, skb))
1404 				goto reset;
1405 			if (opt_skb)
1406 				__kfree_skb(opt_skb);
1407 			return 0;
1408 		}
1409 	} else
1410 		sock_rps_save_rxhash(sk, skb);
1411 
1412 	if (tcp_rcv_state_process(sk, skb, tcp_hdr(skb), skb->len))
1413 		goto reset;
1414 	if (opt_skb)
1415 		goto ipv6_pktoptions;
1416 	return 0;
1417 
1418 reset:
1419 	tcp_v6_send_reset(sk, skb);
1420 discard:
1421 	if (opt_skb)
1422 		__kfree_skb(opt_skb);
1423 	kfree_skb(skb);
1424 	return 0;
1425 csum_err:
1426 	TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_CSUMERRORS);
1427 	TCP_INC_STATS_BH(sock_net(sk), TCP_MIB_INERRS);
1428 	goto discard;
1429 
1430 
1431 ipv6_pktoptions:
1432 	/* You may ask, what is this?
1433 
1434 	   1. The skb was enqueued by tcp.
1435 	   2. The skb was added to the tail of the read queue, not out of order.
1436 	   3. The socket is not in a passive state.
1437 	   4. Finally, it really contains options that the user wants to receive.
1438 	 */
1439 	tp = tcp_sk(sk);
1440 	if (TCP_SKB_CB(opt_skb)->end_seq == tp->rcv_nxt &&
1441 	    !((1 << sk->sk_state) & (TCPF_CLOSE | TCPF_LISTEN))) {
1442 		if (np->rxopt.bits.rxinfo || np->rxopt.bits.rxoinfo)
1443 			np->mcast_oif = inet6_iif(opt_skb);
1444 		if (np->rxopt.bits.rxhlim || np->rxopt.bits.rxohlim)
1445 			np->mcast_hops = ipv6_hdr(opt_skb)->hop_limit;
1446 		if (np->rxopt.bits.rxflow || np->rxopt.bits.rxtclass)
1447 			np->rcv_flowinfo = ip6_flowinfo(ipv6_hdr(opt_skb));
1448 		if (np->repflow)
1449 			np->flow_label = ip6_flowlabel(ipv6_hdr(opt_skb));
1450 		if (ipv6_opt_accepted(sk, opt_skb)) {
1451 			skb_set_owner_r(opt_skb, sk);
1452 			opt_skb = xchg(&np->pktoptions, opt_skb);
1453 		} else {
1454 			__kfree_skb(opt_skb);
1455 			opt_skb = xchg(&np->pktoptions, NULL);
1456 		}
1457 	}
1458 
1459 	kfree_skb(opt_skb);
1460 	return 0;
1461 }
1462 
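/* Main IPv6 TCP receive handler (tcpv6_protocol.handler): validate the
 * header and checksum, fill in TCP_SKB_CB, look up the socket, then
 * process the segment directly, prequeue it, or add it to the socket
 * backlog when the socket is owned by user context.
 */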
1463 static int tcp_v6_rcv(struct sk_buff *skb)
1464 {
1465 	const struct tcphdr *th;
1466 	const struct ipv6hdr *hdr;
1467 	struct sock *sk;
1468 	int ret;
1469 	struct net *net = dev_net(skb->dev);
1470 
1471 	if (skb->pkt_type != PACKET_HOST)
1472 		goto discard_it;
1473 
1474 	/*
1475 	 *	Count it even if it's bad.
1476 	 */
1477 	TCP_INC_STATS_BH(net, TCP_MIB_INSEGS);
1478 
1479 	if (!pskb_may_pull(skb, sizeof(struct tcphdr)))
1480 		goto discard_it;
1481 
1482 	th = tcp_hdr(skb);
1483 
1484 	if (th->doff < sizeof(struct tcphdr)/4)
1485 		goto bad_packet;
1486 	if (!pskb_may_pull(skb, th->doff*4))
1487 		goto discard_it;
1488 
1489 	if (!skb_csum_unnecessary(skb) && tcp_v6_checksum_init(skb))
1490 		goto csum_error;
1491 
1492 	th = tcp_hdr(skb);
1493 	hdr = ipv6_hdr(skb);
1494 	TCP_SKB_CB(skb)->seq = ntohl(th->seq);
1495 	TCP_SKB_CB(skb)->end_seq = (TCP_SKB_CB(skb)->seq + th->syn + th->fin +
1496 				    skb->len - th->doff*4);
1497 	TCP_SKB_CB(skb)->ack_seq = ntohl(th->ack_seq);
1498 	TCP_SKB_CB(skb)->when = 0;
1499 	TCP_SKB_CB(skb)->ip_dsfield = ipv6_get_dsfield(hdr);
1500 	TCP_SKB_CB(skb)->sacked = 0;
1501 
1502 	sk = __inet6_lookup_skb(&tcp_hashinfo, skb, th->source, th->dest);
1503 	if (!sk)
1504 		goto no_tcp_socket;
1505 
1506 process:
1507 	if (sk->sk_state == TCP_TIME_WAIT)
1508 		goto do_time_wait;
1509 
1510 	if (hdr->hop_limit < inet6_sk(sk)->min_hopcount) {
1511 		NET_INC_STATS_BH(net, LINUX_MIB_TCPMINTTLDROP);
1512 		goto discard_and_relse;
1513 	}
1514 
1515 	if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
1516 		goto discard_and_relse;
1517 
1518 	if (sk_filter(sk, skb))
1519 		goto discard_and_relse;
1520 
1521 	sk_mark_napi_id(sk, skb);
1522 	skb->dev = NULL;
1523 
1524 	bh_lock_sock_nested(sk);
1525 	ret = 0;
1526 	if (!sock_owned_by_user(sk)) {
1527 #ifdef CONFIG_NET_DMA
1528 		struct tcp_sock *tp = tcp_sk(sk);
1529 		if (!tp->ucopy.dma_chan && tp->ucopy.pinned_list)
1530 			tp->ucopy.dma_chan = net_dma_find_channel();
1531 		if (tp->ucopy.dma_chan)
1532 			ret = tcp_v6_do_rcv(sk, skb);
1533 		else
1534 #endif
1535 		{
1536 			if (!tcp_prequeue(sk, skb))
1537 				ret = tcp_v6_do_rcv(sk, skb);
1538 		}
1539 	} else if (unlikely(sk_add_backlog(sk, skb,
1540 					   sk->sk_rcvbuf + sk->sk_sndbuf))) {
1541 		bh_unlock_sock(sk);
1542 		NET_INC_STATS_BH(net, LINUX_MIB_TCPBACKLOGDROP);
1543 		goto discard_and_relse;
1544 	}
1545 	bh_unlock_sock(sk);
1546 
1547 	sock_put(sk);
1548 	return ret ? -1 : 0;
1549 
1550 no_tcp_socket:
1551 	if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
1552 		goto discard_it;
1553 
1554 	if (skb->len < (th->doff<<2) || tcp_checksum_complete(skb)) {
1555 csum_error:
1556 		TCP_INC_STATS_BH(net, TCP_MIB_CSUMERRORS);
1557 bad_packet:
1558 		TCP_INC_STATS_BH(net, TCP_MIB_INERRS);
1559 	} else {
1560 		tcp_v6_send_reset(NULL, skb);
1561 	}
1562 
1563 discard_it:
1564 	kfree_skb(skb);
1565 	return 0;
1566 
1567 discard_and_relse:
1568 	sock_put(sk);
1569 	goto discard_it;
1570 
1571 do_time_wait:
1572 	if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb)) {
1573 		inet_twsk_put(inet_twsk(sk));
1574 		goto discard_it;
1575 	}
1576 
1577 	if (skb->len < (th->doff<<2)) {
1578 		inet_twsk_put(inet_twsk(sk));
1579 		goto bad_packet;
1580 	}
1581 	if (tcp_checksum_complete(skb)) {
1582 		inet_twsk_put(inet_twsk(sk));
1583 		goto csum_error;
1584 	}
1585 
1586 	switch (tcp_timewait_state_process(inet_twsk(sk), skb, th)) {
1587 	case TCP_TW_SYN:
1588 	{
1589 		struct sock *sk2;
1590 
1591 		sk2 = inet6_lookup_listener(dev_net(skb->dev), &tcp_hashinfo,
1592 					    &ipv6_hdr(skb)->saddr, th->source,
1593 					    &ipv6_hdr(skb)->daddr,
1594 					    ntohs(th->dest), inet6_iif(skb));
1595 		if (sk2 != NULL) {
1596 			struct inet_timewait_sock *tw = inet_twsk(sk);
1597 			inet_twsk_deschedule(tw, &tcp_death_row);
1598 			inet_twsk_put(tw);
1599 			sk = sk2;
1600 			goto process;
1601 		}
1602 		/* Fall through to ACK */
1603 	}
1604 	case TCP_TW_ACK:
1605 		tcp_v6_timewait_ack(sk, skb);
1606 		break;
1607 	case TCP_TW_RST:
1608 		goto no_tcp_socket;
1609 	case TCP_TW_SUCCESS:
1610 		;
1611 	}
1612 	goto discard_it;
1613 }
1614 
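/* Early demux hook: look up an established socket for this packet
 * before routing, record it on the skb and, if its cached receive
 * route is still valid for this ifindex, attach that route so the
 * normal routing lookup is skipped.
 */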
1615 static void tcp_v6_early_demux(struct sk_buff *skb)
1616 {
1617 	const struct ipv6hdr *hdr;
1618 	const struct tcphdr *th;
1619 	struct sock *sk;
1620 
1621 	if (skb->pkt_type != PACKET_HOST)
1622 		return;
1623 
1624 	if (!pskb_may_pull(skb, skb_transport_offset(skb) + sizeof(struct tcphdr)))
1625 		return;
1626 
1627 	hdr = ipv6_hdr(skb);
1628 	th = tcp_hdr(skb);
1629 
1630 	if (th->doff < sizeof(struct tcphdr) / 4)
1631 		return;
1632 
1633 	sk = __inet6_lookup_established(dev_net(skb->dev), &tcp_hashinfo,
1634 					&hdr->saddr, th->source,
1635 					&hdr->daddr, ntohs(th->dest),
1636 					inet6_iif(skb));
1637 	if (sk) {
1638 		skb->sk = sk;
1639 		skb->destructor = sock_edemux;
1640 		if (sk->sk_state != TCP_TIME_WAIT) {
1641 			struct dst_entry *dst = sk->sk_rx_dst;
1642 
1643 			if (dst)
1644 				dst = dst_check(dst, inet6_sk(sk)->rx_dst_cookie);
1645 			if (dst &&
1646 			    inet_sk(sk)->rx_dst_ifindex == skb->skb_iif)
1647 				skb_dst_set_noref(skb, dst);
1648 		}
1649 	}
1650 }
1651 
1652 static struct timewait_sock_ops tcp6_timewait_sock_ops = {
1653 	.twsk_obj_size	= sizeof(struct tcp6_timewait_sock),
1654 	.twsk_unique	= tcp_twsk_unique,
1655 	.twsk_destructor = tcp_twsk_destructor,
1656 };
1657 
1658 static const struct inet_connection_sock_af_ops ipv6_specific = {
1659 	.queue_xmit	   = inet6_csk_xmit,
1660 	.send_check	   = tcp_v6_send_check,
1661 	.rebuild_header	   = inet6_sk_rebuild_header,
1662 	.sk_rx_dst_set	   = inet6_sk_rx_dst_set,
1663 	.conn_request	   = tcp_v6_conn_request,
1664 	.syn_recv_sock	   = tcp_v6_syn_recv_sock,
1665 	.net_header_len	   = sizeof(struct ipv6hdr),
1666 	.net_frag_header_len = sizeof(struct frag_hdr),
1667 	.setsockopt	   = ipv6_setsockopt,
1668 	.getsockopt	   = ipv6_getsockopt,
1669 	.addr2sockaddr	   = inet6_csk_addr2sockaddr,
1670 	.sockaddr_len	   = sizeof(struct sockaddr_in6),
1671 	.bind_conflict	   = inet6_csk_bind_conflict,
1672 #ifdef CONFIG_COMPAT
1673 	.compat_setsockopt = compat_ipv6_setsockopt,
1674 	.compat_getsockopt = compat_ipv6_getsockopt,
1675 #endif
1676 };
1677 
1678 #ifdef CONFIG_TCP_MD5SIG
1679 static const struct tcp_sock_af_ops tcp_sock_ipv6_specific = {
1680 	.md5_lookup	=	tcp_v6_md5_lookup,
1681 	.calc_md5_hash	=	tcp_v6_md5_hash_skb,
1682 	.md5_parse	=	tcp_v6_parse_md5_keys,
1683 };
1684 #endif
1685 
1686 /*
1687  *	TCP over IPv4 via INET6 API
1688  */
1689 static const struct inet_connection_sock_af_ops ipv6_mapped = {
1690 	.queue_xmit	   = ip_queue_xmit,
1691 	.send_check	   = tcp_v4_send_check,
1692 	.rebuild_header	   = inet_sk_rebuild_header,
1693 	.sk_rx_dst_set	   = inet_sk_rx_dst_set,
1694 	.conn_request	   = tcp_v6_conn_request,
1695 	.syn_recv_sock	   = tcp_v6_syn_recv_sock,
1696 	.net_header_len	   = sizeof(struct iphdr),
1697 	.setsockopt	   = ipv6_setsockopt,
1698 	.getsockopt	   = ipv6_getsockopt,
1699 	.addr2sockaddr	   = inet6_csk_addr2sockaddr,
1700 	.sockaddr_len	   = sizeof(struct sockaddr_in6),
1701 	.bind_conflict	   = inet6_csk_bind_conflict,
1702 #ifdef CONFIG_COMPAT
1703 	.compat_setsockopt = compat_ipv6_setsockopt,
1704 	.compat_getsockopt = compat_ipv6_getsockopt,
1705 #endif
1706 };
1707 
1708 #ifdef CONFIG_TCP_MD5SIG
1709 static const struct tcp_sock_af_ops tcp_sock_ipv6_mapped_specific = {
1710 	.md5_lookup	=	tcp_v4_md5_lookup,
1711 	.calc_md5_hash	=	tcp_v4_md5_hash_skb,
1712 	.md5_parse	=	tcp_v6_parse_md5_keys,
1713 };
1714 #endif
1715 
1716 /* NOTE: A lot of things are set to zero explicitly by the call to
1717  *       sk_alloc(), so they need not be done here.
1718  */
1719 static int tcp_v6_init_sock(struct sock *sk)
1720 {
1721 	struct inet_connection_sock *icsk = inet_csk(sk);
1722 
1723 	tcp_init_sock(sk);
1724 
1725 	icsk->icsk_af_ops = &ipv6_specific;
1726 
1727 #ifdef CONFIG_TCP_MD5SIG
1728 	tcp_sk(sk)->af_specific = &tcp_sock_ipv6_specific;
1729 #endif
1730 
1731 	return 0;
1732 }
1733 
1734 static void tcp_v6_destroy_sock(struct sock *sk)
1735 {
1736 	tcp_v4_destroy_sock(sk);
1737 	inet6_destroy_sock(sk);
1738 }
1739 
1740 #ifdef CONFIG_PROC_FS
1741 /* Proc filesystem TCPv6 sock list dumping. */
1742 static void get_openreq6(struct seq_file *seq,
1743 			 const struct sock *sk, struct request_sock *req, int i, kuid_t uid)
1744 {
1745 	int ttd = req->expires - jiffies;
1746 	const struct in6_addr *src = &inet_rsk(req)->ir_v6_loc_addr;
1747 	const struct in6_addr *dest = &inet_rsk(req)->ir_v6_rmt_addr;
1748 
1749 	if (ttd < 0)
1750 		ttd = 0;
1751 
1752 	seq_printf(seq,
1753 		   "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1754 		   "%02X %08X:%08X %02X:%08lX %08X %5u %8d %d %d %pK\n",
1755 		   i,
1756 		   src->s6_addr32[0], src->s6_addr32[1],
1757 		   src->s6_addr32[2], src->s6_addr32[3],
1758 		   inet_rsk(req)->ir_num,
1759 		   dest->s6_addr32[0], dest->s6_addr32[1],
1760 		   dest->s6_addr32[2], dest->s6_addr32[3],
1761 		   ntohs(inet_rsk(req)->ir_rmt_port),
1762 		   TCP_SYN_RECV,
1763 		   0, 0, /* could print option size, but that is af dependent. */
1764 		   1,   /* timers active (only the expire timer) */
1765 		   jiffies_to_clock_t(ttd),
1766 		   req->num_timeout,
1767 		   from_kuid_munged(seq_user_ns(seq), uid),
1768 		   0,  /* non standard timer */
1769 		   0, /* open_requests have no inode */
1770 		   0, req);
1771 }
1772 
1773 static void get_tcp6_sock(struct seq_file *seq, struct sock *sp, int i)
1774 {
1775 	const struct in6_addr *dest, *src;
1776 	__u16 destp, srcp;
1777 	int timer_active;
1778 	unsigned long timer_expires;
1779 	const struct inet_sock *inet = inet_sk(sp);
1780 	const struct tcp_sock *tp = tcp_sk(sp);
1781 	const struct inet_connection_sock *icsk = inet_csk(sp);
1782 
1783 	dest  = &sp->sk_v6_daddr;
1784 	src   = &sp->sk_v6_rcv_saddr;
1785 	destp = ntohs(inet->inet_dport);
1786 	srcp  = ntohs(inet->inet_sport);
1787 
1788 	if (icsk->icsk_pending == ICSK_TIME_RETRANS) {
1789 		timer_active	= 1;
1790 		timer_expires	= icsk->icsk_timeout;
1791 	} else if (icsk->icsk_pending == ICSK_TIME_PROBE0) {
1792 		timer_active	= 4;
1793 		timer_expires	= icsk->icsk_timeout;
1794 	} else if (timer_pending(&sp->sk_timer)) {
1795 		timer_active	= 2;
1796 		timer_expires	= sp->sk_timer.expires;
1797 	} else {
1798 		timer_active	= 0;
1799 		timer_expires = jiffies;
1800 	}
1801 
1802 	seq_printf(seq,
1803 		   "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1804 		   "%02X %08X:%08X %02X:%08lX %08X %5u %8d %lu %d %pK %lu %lu %u %u %d\n",
1805 		   i,
1806 		   src->s6_addr32[0], src->s6_addr32[1],
1807 		   src->s6_addr32[2], src->s6_addr32[3], srcp,
1808 		   dest->s6_addr32[0], dest->s6_addr32[1],
1809 		   dest->s6_addr32[2], dest->s6_addr32[3], destp,
1810 		   sp->sk_state,
1811 		   tp->write_seq-tp->snd_una,
1812 		   (sp->sk_state == TCP_LISTEN) ? sp->sk_ack_backlog : (tp->rcv_nxt - tp->copied_seq),
1813 		   timer_active,
1814 		   jiffies_delta_to_clock_t(timer_expires - jiffies),
1815 		   icsk->icsk_retransmits,
1816 		   from_kuid_munged(seq_user_ns(seq), sock_i_uid(sp)),
1817 		   icsk->icsk_probes_out,
1818 		   sock_i_ino(sp),
1819 		   atomic_read(&sp->sk_refcnt), sp,
1820 		   jiffies_to_clock_t(icsk->icsk_rto),
1821 		   jiffies_to_clock_t(icsk->icsk_ack.ato),
1822 		   (icsk->icsk_ack.quick << 1) | icsk->icsk_ack.pingpong,
1823 		   tp->snd_cwnd,
1824 		   tcp_in_initial_slowstart(tp) ? -1 : tp->snd_ssthresh
1825 		   );
1826 }
1827 
1828 static void get_timewait6_sock(struct seq_file *seq,
1829 			       struct inet_timewait_sock *tw, int i)
1830 {
1831 	const struct in6_addr *dest, *src;
1832 	__u16 destp, srcp;
1833 	s32 delta = tw->tw_ttd - inet_tw_time_stamp();
1834 
1835 	dest = &tw->tw_v6_daddr;
1836 	src  = &tw->tw_v6_rcv_saddr;
1837 	destp = ntohs(tw->tw_dport);
1838 	srcp  = ntohs(tw->tw_sport);
1839 
1840 	seq_printf(seq,
1841 		   "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
1842 		   "%02X %08X:%08X %02X:%08lX %08X %5d %8d %d %d %pK\n",
1843 		   i,
1844 		   src->s6_addr32[0], src->s6_addr32[1],
1845 		   src->s6_addr32[2], src->s6_addr32[3], srcp,
1846 		   dest->s6_addr32[0], dest->s6_addr32[1],
1847 		   dest->s6_addr32[2], dest->s6_addr32[3], destp,
1848 		   tw->tw_substate, 0, 0,
1849 		   3, jiffies_delta_to_clock_t(delta), 0, 0, 0, 0,
1850 		   atomic_read(&tw->tw_refcnt), tw);
1851 }
1852 
1853 static int tcp6_seq_show(struct seq_file *seq, void *v)
1854 {
1855 	struct tcp_iter_state *st;
1856 	struct sock *sk = v;
1857 
1858 	if (v == SEQ_START_TOKEN) {
1859 		seq_puts(seq,
1860 			 "  sl  "
1861 			 "local_address                         "
1862 			 "remote_address                        "
1863 			 "st tx_queue rx_queue tr tm->when retrnsmt"
1864 			 "   uid  timeout inode\n");
1865 		goto out;
1866 	}
1867 	st = seq->private;
1868 
1869 	switch (st->state) {
1870 	case TCP_SEQ_STATE_LISTENING:
1871 	case TCP_SEQ_STATE_ESTABLISHED:
1872 		if (sk->sk_state == TCP_TIME_WAIT)
1873 			get_timewait6_sock(seq, v, st->num);
1874 		else
1875 			get_tcp6_sock(seq, v, st->num);
1876 		break;
1877 	case TCP_SEQ_STATE_OPENREQ:
1878 		get_openreq6(seq, st->syn_wait_sk, v, st->num, st->uid);
1879 		break;
1880 	}
1881 out:
1882 	return 0;
1883 }
1884 
1885 static const struct file_operations tcp6_afinfo_seq_fops = {
1886 	.owner   = THIS_MODULE,
1887 	.open    = tcp_seq_open,
1888 	.read    = seq_read,
1889 	.llseek  = seq_lseek,
1890 	.release = seq_release_net
1891 };
1892 
1893 static struct tcp_seq_afinfo tcp6_seq_afinfo = {
1894 	.name		= "tcp6",
1895 	.family		= AF_INET6,
1896 	.seq_fops	= &tcp6_afinfo_seq_fops,
1897 	.seq_ops	= {
1898 		.show		= tcp6_seq_show,
1899 	},
1900 };
1901 
1902 int __net_init tcp6_proc_init(struct net *net)
1903 {
1904 	return tcp_proc_register(net, &tcp6_seq_afinfo);
1905 }
1906 
1907 void tcp6_proc_exit(struct net *net)
1908 {
1909 	tcp_proc_unregister(net, &tcp6_seq_afinfo);
1910 }
1911 #endif
1912 
1913 static void tcp_v6_clear_sk(struct sock *sk, int size)
1914 {
1915 	struct inet_sock *inet = inet_sk(sk);
1916 
1917 	/* we do not want to clear pinet6 field, because of RCU lookups */
1918 	sk_prot_clear_nulls(sk, offsetof(struct inet_sock, pinet6));
1919 
1920 	size -= offsetof(struct inet_sock, pinet6) + sizeof(inet->pinet6);
1921 	memset(&inet->pinet6 + 1, 0, size);
1922 }
1923 
1924 struct proto tcpv6_prot = {
1925 	.name			= "TCPv6",
1926 	.owner			= THIS_MODULE,
1927 	.close			= tcp_close,
1928 	.connect		= tcp_v6_connect,
1929 	.disconnect		= tcp_disconnect,
1930 	.accept			= inet_csk_accept,
1931 	.ioctl			= tcp_ioctl,
1932 	.init			= tcp_v6_init_sock,
1933 	.destroy		= tcp_v6_destroy_sock,
1934 	.shutdown		= tcp_shutdown,
1935 	.setsockopt		= tcp_setsockopt,
1936 	.getsockopt		= tcp_getsockopt,
1937 	.recvmsg		= tcp_recvmsg,
1938 	.sendmsg		= tcp_sendmsg,
1939 	.sendpage		= tcp_sendpage,
1940 	.backlog_rcv		= tcp_v6_do_rcv,
1941 	.release_cb		= tcp_release_cb,
1942 	.mtu_reduced		= tcp_v6_mtu_reduced,
1943 	.hash			= tcp_v6_hash,
1944 	.unhash			= inet_unhash,
1945 	.get_port		= inet_csk_get_port,
1946 	.enter_memory_pressure	= tcp_enter_memory_pressure,
1947 	.stream_memory_free	= tcp_stream_memory_free,
1948 	.sockets_allocated	= &tcp_sockets_allocated,
1949 	.memory_allocated	= &tcp_memory_allocated,
1950 	.memory_pressure	= &tcp_memory_pressure,
1951 	.orphan_count		= &tcp_orphan_count,
1952 	.sysctl_mem		= sysctl_tcp_mem,
1953 	.sysctl_wmem		= sysctl_tcp_wmem,
1954 	.sysctl_rmem		= sysctl_tcp_rmem,
1955 	.max_header		= MAX_TCP_HEADER,
1956 	.obj_size		= sizeof(struct tcp6_sock),
1957 	.slab_flags		= SLAB_DESTROY_BY_RCU,
1958 	.twsk_prot		= &tcp6_timewait_sock_ops,
1959 	.rsk_prot		= &tcp6_request_sock_ops,
1960 	.h.hashinfo		= &tcp_hashinfo,
1961 	.no_autobind		= true,
1962 #ifdef CONFIG_COMPAT
1963 	.compat_setsockopt	= compat_tcp_setsockopt,
1964 	.compat_getsockopt	= compat_tcp_getsockopt,
1965 #endif
1966 #ifdef CONFIG_MEMCG_KMEM
1967 	.proto_cgroup		= tcp_proto_cgroup,
1968 #endif
1969 	.clear_sk		= tcp_v6_clear_sk,
1970 };
1971 
1972 static const struct inet6_protocol tcpv6_protocol = {
1973 	.early_demux	=	tcp_v6_early_demux,
1974 	.handler	=	tcp_v6_rcv,
1975 	.err_handler	=	tcp_v6_err,
1976 	.flags		=	INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
1977 };
1978 
1979 static struct inet_protosw tcpv6_protosw = {
1980 	.type		=	SOCK_STREAM,
1981 	.protocol	=	IPPROTO_TCP,
1982 	.prot		=	&tcpv6_prot,
1983 	.ops		=	&inet6_stream_ops,
1984 	.no_check	=	0,
1985 	.flags		=	INET_PROTOSW_PERMANENT |
1986 				INET_PROTOSW_ICSK,
1987 };
1988 
1989 static int __net_init tcpv6_net_init(struct net *net)
1990 {
1991 	return inet_ctl_sock_create(&net->ipv6.tcp_sk, PF_INET6,
1992 				    SOCK_RAW, IPPROTO_TCP, net);
1993 }
1994 
1995 static void __net_exit tcpv6_net_exit(struct net *net)
1996 {
1997 	inet_ctl_sock_destroy(net->ipv6.tcp_sk);
1998 }
1999 
2000 static void __net_exit tcpv6_net_exit_batch(struct list_head *net_exit_list)
2001 {
2002 	inet_twsk_purge(&tcp_hashinfo, &tcp_death_row, AF_INET6);
2003 }
2004 
2005 static struct pernet_operations tcpv6_net_ops = {
2006 	.init	    = tcpv6_net_init,
2007 	.exit	    = tcpv6_net_exit,
2008 	.exit_batch = tcpv6_net_exit_batch,
2009 };
2010 
2011 int __init tcpv6_init(void)
2012 {
2013 	int ret;
2014 
2015 	ret = inet6_add_protocol(&tcpv6_protocol, IPPROTO_TCP);
2016 	if (ret)
2017 		goto out;
2018 
2019 	/* register inet6 protocol */
2020 	ret = inet6_register_protosw(&tcpv6_protosw);
2021 	if (ret)
2022 		goto out_tcpv6_protocol;
2023 
2024 	ret = register_pernet_subsys(&tcpv6_net_ops);
2025 	if (ret)
2026 		goto out_tcpv6_protosw;
2027 out:
2028 	return ret;
2029 
2030 out_tcpv6_protosw:
2031 	inet6_unregister_protosw(&tcpv6_protosw);
2032 out_tcpv6_protocol:
2033 	inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2034 	goto out;
2035 }
2036 
2037 void tcpv6_exit(void)
2038 {
2039 	unregister_pernet_subsys(&tcpv6_net_ops);
2040 	inet6_unregister_protosw(&tcpv6_protosw);
2041 	inet6_del_protocol(&tcpv6_protocol, IPPROTO_TCP);
2042 }
2043