xref: /openbmc/linux/net/ipv6/udp.c (revision 96de0e252cedffad61b3cb5e05662c591898e69a)
1 /*
2  *	UDP over IPv6
3  *	Linux INET6 implementation
4  *
5  *	Authors:
6  *	Pedro Roque		<roque@di.fc.ul.pt>
7  *
8  *	Based on linux/ipv4/udp.c
9  *
10  *	$Id: udp.c,v 1.65 2002/02/01 22:01:04 davem Exp $
11  *
12  *	Fixes:
13  *	Hideaki YOSHIFUJI	:	sin6_scope_id support
14  *	YOSHIFUJI Hideaki @USAGI and:	Support IPV6_V6ONLY socket option, which
15  *	Alexey Kuznetsov		allow both IPv4 and IPv6 sockets to bind
16  *					a single port at the same time.
17  *      Kazunori MIYAZAWA @USAGI:       change process style to use ip6_append_data
18  *      YOSHIFUJI Hideaki @USAGI:	convert /proc/net/udp6 to seq_file.
19  *
20  *	This program is free software; you can redistribute it and/or
21  *      modify it under the terms of the GNU General Public License
22  *      as published by the Free Software Foundation; either version
23  *      2 of the License, or (at your option) any later version.
24  */
25 
26 #include <linux/errno.h>
27 #include <linux/types.h>
28 #include <linux/socket.h>
29 #include <linux/sockios.h>
30 #include <linux/net.h>
31 #include <linux/in6.h>
32 #include <linux/netdevice.h>
33 #include <linux/if_arp.h>
34 #include <linux/ipv6.h>
35 #include <linux/icmpv6.h>
36 #include <linux/init.h>
37 #include <linux/skbuff.h>
38 #include <asm/uaccess.h>
39 
40 #include <net/ndisc.h>
41 #include <net/protocol.h>
42 #include <net/transp_v6.h>
43 #include <net/ip6_route.h>
44 #include <net/raw.h>
45 #include <net/tcp_states.h>
46 #include <net/ip6_checksum.h>
47 #include <net/xfrm.h>
48 
49 #include <linux/proc_fs.h>
50 #include <linux/seq_file.h>
51 #include "udp_impl.h"
52 
/*
 * UDP MIB counter object for this file, instantiated through
 * DEFINE_SNMP_STAT with element type struct udp_mib.
 * NOTE(review): presumably the object updated by the UDP6_INC_STATS_*
 * macros used below -- confirm against their definition.
 */
DEFINE_SNMP_STAT(struct udp_mib, udp_stats_in6) __read_mostly;
54 
55 static inline int udp_v6_get_port(struct sock *sk, unsigned short snum)
56 {
57 	return udp_get_port(sk, snum, ipv6_rcv_saddr_equal);
58 }
59 
60 static struct sock *__udp6_lib_lookup(struct in6_addr *saddr, __be16 sport,
61 				      struct in6_addr *daddr, __be16 dport,
62 				      int dif, struct hlist_head udptable[])
63 {
64 	struct sock *sk, *result = NULL;
65 	struct hlist_node *node;
66 	unsigned short hnum = ntohs(dport);
67 	int badness = -1;
68 
69 	read_lock(&udp_hash_lock);
70 	sk_for_each(sk, node, &udptable[hnum & (UDP_HTABLE_SIZE - 1)]) {
71 		struct inet_sock *inet = inet_sk(sk);
72 
73 		if (sk->sk_hash == hnum && sk->sk_family == PF_INET6) {
74 			struct ipv6_pinfo *np = inet6_sk(sk);
75 			int score = 0;
76 			if (inet->dport) {
77 				if (inet->dport != sport)
78 					continue;
79 				score++;
80 			}
81 			if (!ipv6_addr_any(&np->rcv_saddr)) {
82 				if (!ipv6_addr_equal(&np->rcv_saddr, daddr))
83 					continue;
84 				score++;
85 			}
86 			if (!ipv6_addr_any(&np->daddr)) {
87 				if (!ipv6_addr_equal(&np->daddr, saddr))
88 					continue;
89 				score++;
90 			}
91 			if (sk->sk_bound_dev_if) {
92 				if (sk->sk_bound_dev_if != dif)
93 					continue;
94 				score++;
95 			}
96 			if (score == 4) {
97 				result = sk;
98 				break;
99 			} else if (score > badness) {
100 				result = sk;
101 				badness = score;
102 			}
103 		}
104 	}
105 	if (result)
106 		sock_hold(result);
107 	read_unlock(&udp_hash_lock);
108 	return result;
109 }
110 
111 /*
112  * 	This should be easy, if there is something there we
113  * 	return it, otherwise we block.
114  */
115 
116 int udpv6_recvmsg(struct kiocb *iocb, struct sock *sk,
117 		  struct msghdr *msg, size_t len,
118 		  int noblock, int flags, int *addr_len)
119 {
120 	struct ipv6_pinfo *np = inet6_sk(sk);
121 	struct inet_sock *inet = inet_sk(sk);
122 	struct sk_buff *skb;
123 	unsigned int ulen, copied;
124 	int err;
125 	int is_udplite = IS_UDPLITE(sk);
126 
127 	if (addr_len)
128 		*addr_len=sizeof(struct sockaddr_in6);
129 
130 	if (flags & MSG_ERRQUEUE)
131 		return ipv6_recv_error(sk, msg, len);
132 
133 try_again:
134 	skb = skb_recv_datagram(sk, flags, noblock, &err);
135 	if (!skb)
136 		goto out;
137 
138 	ulen = skb->len - sizeof(struct udphdr);
139 	copied = len;
140 	if (copied > ulen)
141 		copied = ulen;
142 	else if (copied < ulen)
143 		msg->msg_flags |= MSG_TRUNC;
144 
145 	/*
146 	 * If checksum is needed at all, try to do it while copying the
147 	 * data.  If the data is truncated, or if we only want a partial
148 	 * coverage checksum (UDP-Lite), do it before the copy.
149 	 */
150 
151 	if (copied < ulen || UDP_SKB_CB(skb)->partial_cov) {
152 		if (udp_lib_checksum_complete(skb))
153 			goto csum_copy_err;
154 	}
155 
156 	if (skb_csum_unnecessary(skb))
157 		err = skb_copy_datagram_iovec(skb, sizeof(struct udphdr),
158 					      msg->msg_iov, copied       );
159 	else {
160 		err = skb_copy_and_csum_datagram_iovec(skb, sizeof(struct udphdr), msg->msg_iov);
161 		if (err == -EINVAL)
162 			goto csum_copy_err;
163 	}
164 	if (err)
165 		goto out_free;
166 
167 	sock_recv_timestamp(msg, sk, skb);
168 
169 	/* Copy the address. */
170 	if (msg->msg_name) {
171 		struct sockaddr_in6 *sin6;
172 
173 		sin6 = (struct sockaddr_in6 *) msg->msg_name;
174 		sin6->sin6_family = AF_INET6;
175 		sin6->sin6_port = udp_hdr(skb)->source;
176 		sin6->sin6_flowinfo = 0;
177 		sin6->sin6_scope_id = 0;
178 
179 		if (skb->protocol == htons(ETH_P_IP))
180 			ipv6_addr_set(&sin6->sin6_addr, 0, 0,
181 				      htonl(0xffff), ip_hdr(skb)->saddr);
182 		else {
183 			ipv6_addr_copy(&sin6->sin6_addr,
184 				       &ipv6_hdr(skb)->saddr);
185 			if (ipv6_addr_type(&sin6->sin6_addr) & IPV6_ADDR_LINKLOCAL)
186 				sin6->sin6_scope_id = IP6CB(skb)->iif;
187 		}
188 
189 	}
190 	if (skb->protocol == htons(ETH_P_IP)) {
191 		if (inet->cmsg_flags)
192 			ip_cmsg_recv(msg, skb);
193 	} else {
194 		if (np->rxopt.all)
195 			datagram_recv_ctl(sk, msg, skb);
196 	}
197 
198 	err = copied;
199 	if (flags & MSG_TRUNC)
200 		err = ulen;
201 
202 out_free:
203 	skb_free_datagram(sk, skb);
204 out:
205 	return err;
206 
207 csum_copy_err:
208 	skb_kill_datagram(sk, skb, flags);
209 
210 	if (flags & MSG_DONTWAIT) {
211 		UDP6_INC_STATS_USER(UDP_MIB_INERRORS, is_udplite);
212 		return -EAGAIN;
213 	}
214 	goto try_again;
215 }
216 
217 void __udp6_lib_err(struct sk_buff *skb, struct inet6_skb_parm *opt,
218 		    int type, int code, int offset, __be32 info,
219 		    struct hlist_head udptable[]                    )
220 {
221 	struct ipv6_pinfo *np;
222 	struct ipv6hdr *hdr = (struct ipv6hdr*)skb->data;
223 	struct in6_addr *saddr = &hdr->saddr;
224 	struct in6_addr *daddr = &hdr->daddr;
225 	struct udphdr *uh = (struct udphdr*)(skb->data+offset);
226 	struct sock *sk;
227 	int err;
228 
229 	sk = __udp6_lib_lookup(daddr, uh->dest,
230 			       saddr, uh->source, inet6_iif(skb), udptable);
231 	if (sk == NULL)
232 		return;
233 
234 	np = inet6_sk(sk);
235 
236 	if (!icmpv6_err_convert(type, code, &err) && !np->recverr)
237 		goto out;
238 
239 	if (sk->sk_state != TCP_ESTABLISHED && !np->recverr)
240 		goto out;
241 
242 	if (np->recverr)
243 		ipv6_icmp_error(sk, skb, err, uh->dest, ntohl(info), (u8 *)(uh+1));
244 
245 	sk->sk_err = err;
246 	sk->sk_error_report(sk);
247 out:
248 	sock_put(sk);
249 }
250 
251 static __inline__ void udpv6_err(struct sk_buff *skb,
252 				 struct inet6_skb_parm *opt, int type,
253 				 int code, int offset, __be32 info     )
254 {
255 	return __udp6_lib_err(skb, opt, type, code, offset, info, udp_hash);
256 }
257 
258 int udpv6_queue_rcv_skb(struct sock * sk, struct sk_buff *skb)
259 {
260 	struct udp_sock *up = udp_sk(sk);
261 	int rc;
262 
263 	if (!xfrm6_policy_check(sk, XFRM_POLICY_IN, skb))
264 		goto drop;
265 
266 	/*
267 	 * UDP-Lite specific tests, ignored on UDP sockets (see net/ipv4/udp.c).
268 	 */
269 	if ((up->pcflag & UDPLITE_RECV_CC)  &&  UDP_SKB_CB(skb)->partial_cov) {
270 
271 		if (up->pcrlen == 0) {          /* full coverage was set  */
272 			LIMIT_NETDEBUG(KERN_WARNING "UDPLITE6: partial coverage"
273 				" %d while full coverage %d requested\n",
274 				UDP_SKB_CB(skb)->cscov, skb->len);
275 			goto drop;
276 		}
277 		if (UDP_SKB_CB(skb)->cscov  <  up->pcrlen) {
278 			LIMIT_NETDEBUG(KERN_WARNING "UDPLITE6: coverage %d "
279 						    "too small, need min %d\n",
280 				       UDP_SKB_CB(skb)->cscov, up->pcrlen);
281 			goto drop;
282 		}
283 	}
284 
285 	if (sk->sk_filter) {
286 		if (udp_lib_checksum_complete(skb))
287 			goto drop;
288 	}
289 
290 	if ((rc = sock_queue_rcv_skb(sk,skb)) < 0) {
291 		/* Note that an ENOMEM error is charged twice */
292 		if (rc == -ENOMEM)
293 			UDP6_INC_STATS_BH(UDP_MIB_RCVBUFERRORS, up->pcflag);
294 		goto drop;
295 	}
296 	UDP6_INC_STATS_BH(UDP_MIB_INDATAGRAMS, up->pcflag);
297 	return 0;
298 drop:
299 	UDP6_INC_STATS_BH(UDP_MIB_INERRORS, up->pcflag);
300 	kfree_skb(skb);
301 	return -1;
302 }
303 
304 static struct sock *udp_v6_mcast_next(struct sock *sk,
305 				      __be16 loc_port, struct in6_addr *loc_addr,
306 				      __be16 rmt_port, struct in6_addr *rmt_addr,
307 				      int dif)
308 {
309 	struct hlist_node *node;
310 	struct sock *s = sk;
311 	unsigned short num = ntohs(loc_port);
312 
313 	sk_for_each_from(s, node) {
314 		struct inet_sock *inet = inet_sk(s);
315 
316 		if (s->sk_hash == num && s->sk_family == PF_INET6) {
317 			struct ipv6_pinfo *np = inet6_sk(s);
318 			if (inet->dport) {
319 				if (inet->dport != rmt_port)
320 					continue;
321 			}
322 			if (!ipv6_addr_any(&np->daddr) &&
323 			    !ipv6_addr_equal(&np->daddr, rmt_addr))
324 				continue;
325 
326 			if (s->sk_bound_dev_if && s->sk_bound_dev_if != dif)
327 				continue;
328 
329 			if (!ipv6_addr_any(&np->rcv_saddr)) {
330 				if (!ipv6_addr_equal(&np->rcv_saddr, loc_addr))
331 					continue;
332 			}
333 			if (!inet6_mc_check(s, loc_addr, rmt_addr))
334 				continue;
335 			return s;
336 		}
337 	}
338 	return NULL;
339 }
340 
341 /*
342  * Note: called only from the BH handler context,
343  * so we don't need to lock the hashes.
344  */
345 static int __udp6_lib_mcast_deliver(struct sk_buff *skb, struct in6_addr *saddr,
346 			   struct in6_addr *daddr, struct hlist_head udptable[])
347 {
348 	struct sock *sk, *sk2;
349 	const struct udphdr *uh = udp_hdr(skb);
350 	int dif;
351 
352 	read_lock(&udp_hash_lock);
353 	sk = sk_head(&udptable[ntohs(uh->dest) & (UDP_HTABLE_SIZE - 1)]);
354 	dif = inet6_iif(skb);
355 	sk = udp_v6_mcast_next(sk, uh->dest, daddr, uh->source, saddr, dif);
356 	if (!sk) {
357 		kfree_skb(skb);
358 		goto out;
359 	}
360 
361 	sk2 = sk;
362 	while ((sk2 = udp_v6_mcast_next(sk_next(sk2), uh->dest, daddr,
363 					uh->source, saddr, dif))) {
364 		struct sk_buff *buff = skb_clone(skb, GFP_ATOMIC);
365 		if (buff)
366 			udpv6_queue_rcv_skb(sk2, buff);
367 	}
368 	udpv6_queue_rcv_skb(sk, skb);
369 out:
370 	read_unlock(&udp_hash_lock);
371 	return 0;
372 }
373 
374 static inline int udp6_csum_init(struct sk_buff *skb, struct udphdr *uh,
375 				 int proto)
376 {
377 	int err;
378 
379 	UDP_SKB_CB(skb)->partial_cov = 0;
380 	UDP_SKB_CB(skb)->cscov = skb->len;
381 
382 	if (proto == IPPROTO_UDPLITE) {
383 		err = udplite_checksum_init(skb, uh);
384 		if (err)
385 			return err;
386 	}
387 
388 	if (uh->check == 0) {
389 		/* RFC 2460 section 8.1 says that we SHOULD log
390 		   this error. Well, it is reasonable.
391 		 */
392 		LIMIT_NETDEBUG(KERN_INFO "IPv6: udp checksum is 0\n");
393 		return 1;
394 	}
395 	if (skb->ip_summed == CHECKSUM_COMPLETE &&
396 	    !csum_ipv6_magic(&ipv6_hdr(skb)->saddr, &ipv6_hdr(skb)->daddr,
397 			     skb->len, proto, skb->csum))
398 		skb->ip_summed = CHECKSUM_UNNECESSARY;
399 
400 	if (!skb_csum_unnecessary(skb))
401 		skb->csum = ~csum_unfold(csum_ipv6_magic(&ipv6_hdr(skb)->saddr,
402 							 &ipv6_hdr(skb)->daddr,
403 							 skb->len, proto, 0));
404 
405 	return 0;
406 }
407 
408 int __udp6_lib_rcv(struct sk_buff *skb, struct hlist_head udptable[],
409 		   int proto)
410 {
411 	struct sock *sk;
412 	struct udphdr *uh;
413 	struct net_device *dev = skb->dev;
414 	struct in6_addr *saddr, *daddr;
415 	u32 ulen = 0;
416 
417 	if (!pskb_may_pull(skb, sizeof(struct udphdr)))
418 		goto short_packet;
419 
420 	saddr = &ipv6_hdr(skb)->saddr;
421 	daddr = &ipv6_hdr(skb)->daddr;
422 	uh = udp_hdr(skb);
423 
424 	ulen = ntohs(uh->len);
425 	if (ulen > skb->len)
426 		goto short_packet;
427 
428 	if (proto == IPPROTO_UDP) {
429 		/* UDP validates ulen. */
430 
431 		/* Check for jumbo payload */
432 		if (ulen == 0)
433 			ulen = skb->len;
434 
435 		if (ulen < sizeof(*uh))
436 			goto short_packet;
437 
438 		if (ulen < skb->len) {
439 			if (pskb_trim_rcsum(skb, ulen))
440 				goto short_packet;
441 			saddr = &ipv6_hdr(skb)->saddr;
442 			daddr = &ipv6_hdr(skb)->daddr;
443 			uh = udp_hdr(skb);
444 		}
445 	}
446 
447 	if (udp6_csum_init(skb, uh, proto))
448 		goto discard;
449 
450 	/*
451 	 *	Multicast receive code
452 	 */
453 	if (ipv6_addr_is_multicast(daddr))
454 		return __udp6_lib_mcast_deliver(skb, saddr, daddr, udptable);
455 
456 	/* Unicast */
457 
458 	/*
459 	 * check socket cache ... must talk to Alan about his plans
460 	 * for sock caches... i'll skip this for now.
461 	 */
462 	sk = __udp6_lib_lookup(saddr, uh->source,
463 			       daddr, uh->dest, inet6_iif(skb), udptable);
464 
465 	if (sk == NULL) {
466 		if (!xfrm6_policy_check(NULL, XFRM_POLICY_IN, skb))
467 			goto discard;
468 
469 		if (udp_lib_checksum_complete(skb))
470 			goto discard;
471 		UDP6_INC_STATS_BH(UDP_MIB_NOPORTS, proto == IPPROTO_UDPLITE);
472 
473 		icmpv6_send(skb, ICMPV6_DEST_UNREACH, ICMPV6_PORT_UNREACH, 0, dev);
474 
475 		kfree_skb(skb);
476 		return 0;
477 	}
478 
479 	/* deliver */
480 
481 	udpv6_queue_rcv_skb(sk, skb);
482 	sock_put(sk);
483 	return 0;
484 
485 short_packet:
486 	LIMIT_NETDEBUG(KERN_DEBUG "UDP%sv6: short packet: %d/%u\n",
487 		       proto == IPPROTO_UDPLITE ? "-Lite" : "",
488 		       ulen, skb->len);
489 
490 discard:
491 	UDP6_INC_STATS_BH(UDP_MIB_INERRORS, proto == IPPROTO_UDPLITE);
492 	kfree_skb(skb);
493 	return 0;
494 }
495 
496 static __inline__ int udpv6_rcv(struct sk_buff *skb)
497 {
498 	return __udp6_lib_rcv(skb, udp_hash, IPPROTO_UDP);
499 }
500 
501 /*
502  * Throw away all pending data and cancel the corking. Socket is locked.
503  */
504 static void udp_v6_flush_pending_frames(struct sock *sk)
505 {
506 	struct udp_sock *up = udp_sk(sk);
507 
508 	if (up->pending) {
509 		up->len = 0;
510 		up->pending = 0;
511 		ip6_flush_pending_frames(sk);
512 	}
513 }
514 
515 /*
516  *	Sending
517  */
518 
519 static int udp_v6_push_pending_frames(struct sock *sk)
520 {
521 	struct sk_buff *skb;
522 	struct udphdr *uh;
523 	struct udp_sock  *up = udp_sk(sk);
524 	struct inet_sock *inet = inet_sk(sk);
525 	struct flowi *fl = &inet->cork.fl;
526 	int err = 0;
527 	__wsum csum = 0;
528 
529 	/* Grab the skbuff where UDP header space exists. */
530 	if ((skb = skb_peek(&sk->sk_write_queue)) == NULL)
531 		goto out;
532 
533 	/*
534 	 * Create a UDP header
535 	 */
536 	uh = udp_hdr(skb);
537 	uh->source = fl->fl_ip_sport;
538 	uh->dest = fl->fl_ip_dport;
539 	uh->len = htons(up->len);
540 	uh->check = 0;
541 
542 	if (up->pcflag)
543 		csum = udplite_csum_outgoing(sk, skb);
544 	 else
545 		csum = udp_csum_outgoing(sk, skb);
546 
547 	/* add protocol-dependent pseudo-header */
548 	uh->check = csum_ipv6_magic(&fl->fl6_src, &fl->fl6_dst,
549 				    up->len, fl->proto, csum   );
550 	if (uh->check == 0)
551 		uh->check = CSUM_MANGLED_0;
552 
553 	err = ip6_push_pending_frames(sk);
554 out:
555 	up->len = 0;
556 	up->pending = 0;
557 	if (!err)
558 		UDP6_INC_STATS_USER(UDP_MIB_OUTDATAGRAMS, up->pcflag);
559 	return err;
560 }
561 
562 int udpv6_sendmsg(struct kiocb *iocb, struct sock *sk,
563 		  struct msghdr *msg, size_t len)
564 {
565 	struct ipv6_txoptions opt_space;
566 	struct udp_sock *up = udp_sk(sk);
567 	struct inet_sock *inet = inet_sk(sk);
568 	struct ipv6_pinfo *np = inet6_sk(sk);
569 	struct sockaddr_in6 *sin6 = (struct sockaddr_in6 *) msg->msg_name;
570 	struct in6_addr *daddr, *final_p = NULL, final;
571 	struct ipv6_txoptions *opt = NULL;
572 	struct ip6_flowlabel *flowlabel = NULL;
573 	struct flowi fl;
574 	struct dst_entry *dst;
575 	int addr_len = msg->msg_namelen;
576 	int ulen = len;
577 	int hlimit = -1;
578 	int tclass = -1;
579 	int corkreq = up->corkflag || msg->msg_flags&MSG_MORE;
580 	int err;
581 	int connected = 0;
582 	int is_udplite = up->pcflag;
583 	int (*getfrag)(void *, char *, int, int, int, struct sk_buff *);
584 
585 	/* destination address check */
586 	if (sin6) {
587 		if (addr_len < offsetof(struct sockaddr, sa_data))
588 			return -EINVAL;
589 
590 		switch (sin6->sin6_family) {
591 		case AF_INET6:
592 			if (addr_len < SIN6_LEN_RFC2133)
593 				return -EINVAL;
594 			daddr = &sin6->sin6_addr;
595 			break;
596 		case AF_INET:
597 			goto do_udp_sendmsg;
598 		case AF_UNSPEC:
599 			msg->msg_name = sin6 = NULL;
600 			msg->msg_namelen = addr_len = 0;
601 			daddr = NULL;
602 			break;
603 		default:
604 			return -EINVAL;
605 		}
606 	} else if (!up->pending) {
607 		if (sk->sk_state != TCP_ESTABLISHED)
608 			return -EDESTADDRREQ;
609 		daddr = &np->daddr;
610 	} else
611 		daddr = NULL;
612 
613 	if (daddr) {
614 		if (ipv6_addr_v4mapped(daddr)) {
615 			struct sockaddr_in sin;
616 			sin.sin_family = AF_INET;
617 			sin.sin_port = sin6 ? sin6->sin6_port : inet->dport;
618 			sin.sin_addr.s_addr = daddr->s6_addr32[3];
619 			msg->msg_name = &sin;
620 			msg->msg_namelen = sizeof(sin);
621 do_udp_sendmsg:
622 			if (__ipv6_only_sock(sk))
623 				return -ENETUNREACH;
624 			return udp_sendmsg(iocb, sk, msg, len);
625 		}
626 	}
627 
628 	if (up->pending == AF_INET)
629 		return udp_sendmsg(iocb, sk, msg, len);
630 
631 	/* Rough check on arithmetic overflow,
632 	   better check is made in ip6_append_data().
633 	   */
634 	if (len > INT_MAX - sizeof(struct udphdr))
635 		return -EMSGSIZE;
636 
637 	if (up->pending) {
638 		/*
639 		 * There are pending frames.
640 		 * The socket lock must be held while it's corked.
641 		 */
642 		lock_sock(sk);
643 		if (likely(up->pending)) {
644 			if (unlikely(up->pending != AF_INET6)) {
645 				release_sock(sk);
646 				return -EAFNOSUPPORT;
647 			}
648 			dst = NULL;
649 			goto do_append_data;
650 		}
651 		release_sock(sk);
652 	}
653 	ulen += sizeof(struct udphdr);
654 
655 	memset(&fl, 0, sizeof(fl));
656 
657 	if (sin6) {
658 		if (sin6->sin6_port == 0)
659 			return -EINVAL;
660 
661 		fl.fl_ip_dport = sin6->sin6_port;
662 		daddr = &sin6->sin6_addr;
663 
664 		if (np->sndflow) {
665 			fl.fl6_flowlabel = sin6->sin6_flowinfo&IPV6_FLOWINFO_MASK;
666 			if (fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) {
667 				flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
668 				if (flowlabel == NULL)
669 					return -EINVAL;
670 				daddr = &flowlabel->dst;
671 			}
672 		}
673 
674 		/*
675 		 * Otherwise it will be difficult to maintain
676 		 * sk->sk_dst_cache.
677 		 */
678 		if (sk->sk_state == TCP_ESTABLISHED &&
679 		    ipv6_addr_equal(daddr, &np->daddr))
680 			daddr = &np->daddr;
681 
682 		if (addr_len >= sizeof(struct sockaddr_in6) &&
683 		    sin6->sin6_scope_id &&
684 		    ipv6_addr_type(daddr)&IPV6_ADDR_LINKLOCAL)
685 			fl.oif = sin6->sin6_scope_id;
686 	} else {
687 		if (sk->sk_state != TCP_ESTABLISHED)
688 			return -EDESTADDRREQ;
689 
690 		fl.fl_ip_dport = inet->dport;
691 		daddr = &np->daddr;
692 		fl.fl6_flowlabel = np->flow_label;
693 		connected = 1;
694 	}
695 
696 	if (!fl.oif)
697 		fl.oif = sk->sk_bound_dev_if;
698 
699 	if (msg->msg_controllen) {
700 		opt = &opt_space;
701 		memset(opt, 0, sizeof(struct ipv6_txoptions));
702 		opt->tot_len = sizeof(*opt);
703 
704 		err = datagram_send_ctl(msg, &fl, opt, &hlimit, &tclass);
705 		if (err < 0) {
706 			fl6_sock_release(flowlabel);
707 			return err;
708 		}
709 		if ((fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) && !flowlabel) {
710 			flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
711 			if (flowlabel == NULL)
712 				return -EINVAL;
713 		}
714 		if (!(opt->opt_nflen|opt->opt_flen))
715 			opt = NULL;
716 		connected = 0;
717 	}
718 	if (opt == NULL)
719 		opt = np->opt;
720 	if (flowlabel)
721 		opt = fl6_merge_options(&opt_space, flowlabel, opt);
722 	opt = ipv6_fixup_options(&opt_space, opt);
723 
724 	fl.proto = sk->sk_protocol;
725 	ipv6_addr_copy(&fl.fl6_dst, daddr);
726 	if (ipv6_addr_any(&fl.fl6_src) && !ipv6_addr_any(&np->saddr))
727 		ipv6_addr_copy(&fl.fl6_src, &np->saddr);
728 	fl.fl_ip_sport = inet->sport;
729 
730 	/* merge ip6_build_xmit from ip6_output */
731 	if (opt && opt->srcrt) {
732 		struct rt0_hdr *rt0 = (struct rt0_hdr *) opt->srcrt;
733 		ipv6_addr_copy(&final, &fl.fl6_dst);
734 		ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
735 		final_p = &final;
736 		connected = 0;
737 	}
738 
739 	if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst)) {
740 		fl.oif = np->mcast_oif;
741 		connected = 0;
742 	}
743 
744 	security_sk_classify_flow(sk, &fl);
745 
746 	err = ip6_sk_dst_lookup(sk, &dst, &fl);
747 	if (err)
748 		goto out;
749 	if (final_p)
750 		ipv6_addr_copy(&fl.fl6_dst, final_p);
751 
752 	if ((err = __xfrm_lookup(&dst, &fl, sk, 1)) < 0) {
753 		if (err == -EREMOTE)
754 			err = ip6_dst_blackhole(sk, &dst, &fl);
755 		if (err < 0)
756 			goto out;
757 	}
758 
759 	if (hlimit < 0) {
760 		if (ipv6_addr_is_multicast(&fl.fl6_dst))
761 			hlimit = np->mcast_hops;
762 		else
763 			hlimit = np->hop_limit;
764 		if (hlimit < 0)
765 			hlimit = dst_metric(dst, RTAX_HOPLIMIT);
766 		if (hlimit < 0)
767 			hlimit = ipv6_get_hoplimit(dst->dev);
768 	}
769 
770 	if (tclass < 0) {
771 		tclass = np->tclass;
772 		if (tclass < 0)
773 			tclass = 0;
774 	}
775 
776 	if (msg->msg_flags&MSG_CONFIRM)
777 		goto do_confirm;
778 back_from_confirm:
779 
780 	lock_sock(sk);
781 	if (unlikely(up->pending)) {
782 		/* The socket is already corked while preparing it. */
783 		/* ... which is an evident application bug. --ANK */
784 		release_sock(sk);
785 
786 		LIMIT_NETDEBUG(KERN_DEBUG "udp cork app bug 2\n");
787 		err = -EINVAL;
788 		goto out;
789 	}
790 
791 	up->pending = AF_INET6;
792 
793 do_append_data:
794 	up->len += ulen;
795 	getfrag  =  is_udplite ?  udplite_getfrag : ip_generic_getfrag;
796 	err = ip6_append_data(sk, getfrag, msg->msg_iov, ulen,
797 		sizeof(struct udphdr), hlimit, tclass, opt, &fl,
798 		(struct rt6_info*)dst,
799 		corkreq ? msg->msg_flags|MSG_MORE : msg->msg_flags);
800 	if (err)
801 		udp_v6_flush_pending_frames(sk);
802 	else if (!corkreq)
803 		err = udp_v6_push_pending_frames(sk);
804 	else if (unlikely(skb_queue_empty(&sk->sk_write_queue)))
805 		up->pending = 0;
806 
807 	if (dst) {
808 		if (connected) {
809 			ip6_dst_store(sk, dst,
810 				      ipv6_addr_equal(&fl.fl6_dst, &np->daddr) ?
811 				      &np->daddr : NULL,
812 #ifdef CONFIG_IPV6_SUBTREES
813 				      ipv6_addr_equal(&fl.fl6_src, &np->saddr) ?
814 				      &np->saddr :
815 #endif
816 				      NULL);
817 		} else {
818 			dst_release(dst);
819 		}
820 	}
821 
822 	if (err > 0)
823 		err = np->recverr ? net_xmit_errno(err) : 0;
824 	release_sock(sk);
825 out:
826 	fl6_sock_release(flowlabel);
827 	if (!err)
828 		return len;
829 	/*
830 	 * ENOBUFS = no kernel mem, SOCK_NOSPACE = no sndbuf space.  Reporting
831 	 * ENOBUFS might not be good (it's not tunable per se), but otherwise
832 	 * we don't have a good statistic (IpOutDiscards but it can be too many
833 	 * things).  We could add another new stat but at least for now that
834 	 * seems like overkill.
835 	 */
836 	if (err == -ENOBUFS || test_bit(SOCK_NOSPACE, &sk->sk_socket->flags)) {
837 		UDP6_INC_STATS_USER(UDP_MIB_SNDBUFERRORS, is_udplite);
838 	}
839 	return err;
840 
841 do_confirm:
842 	dst_confirm(dst);
843 	if (!(msg->msg_flags&MSG_PROBE) || len)
844 		goto back_from_confirm;
845 	err = 0;
846 	goto out;
847 }
848 
/*
 * destroy hook for UDPv6 sockets (see udpv6_prot): drops any corked,
 * not-yet-sent data under the socket lock and then runs
 * inet6_destroy_sock().  Always returns 0.
 */
int udpv6_destroy_sock(struct sock *sk)
{
	/* Flushing pending frames requires the socket lock. */
	lock_sock(sk);
	udp_v6_flush_pending_frames(sk);
	release_sock(sk);

	inet6_destroy_sock(sk);
	return 0;
}
859 
860 /*
861  *	Socket option code for UDP
862  */
863 int udpv6_setsockopt(struct sock *sk, int level, int optname,
864 		     char __user *optval, int optlen)
865 {
866 	if (level == SOL_UDP  ||  level == SOL_UDPLITE)
867 		return udp_lib_setsockopt(sk, level, optname, optval, optlen,
868 					  udp_v6_push_pending_frames);
869 	return ipv6_setsockopt(sk, level, optname, optval, optlen);
870 }
871 
#ifdef CONFIG_COMPAT
/*
 * Compat variant of udpv6_setsockopt(): identical for SOL_UDP and
 * SOL_UDPLITE, other levels go to compat_ipv6_setsockopt().
 */
int compat_udpv6_setsockopt(struct sock *sk, int level, int optname,
			    char __user *optval, int optlen)
{
	if (level != SOL_UDP && level != SOL_UDPLITE)
		return compat_ipv6_setsockopt(sk, level, optname, optval,
					      optlen);

	return udp_lib_setsockopt(sk, level, optname, optval, optlen,
				  udp_v6_push_pending_frames);
}
#endif
882 
883 int udpv6_getsockopt(struct sock *sk, int level, int optname,
884 		     char __user *optval, int __user *optlen)
885 {
886 	if (level == SOL_UDP  ||  level == SOL_UDPLITE)
887 		return udp_lib_getsockopt(sk, level, optname, optval, optlen);
888 	return ipv6_getsockopt(sk, level, optname, optval, optlen);
889 }
890 
#ifdef CONFIG_COMPAT
/*
 * Compat variant of udpv6_getsockopt(): identical for SOL_UDP and
 * SOL_UDPLITE, other levels go to compat_ipv6_getsockopt().
 */
int compat_udpv6_getsockopt(struct sock *sk, int level, int optname,
			    char __user *optval, int __user *optlen)
{
	if (level != SOL_UDP && level != SOL_UDPLITE)
		return compat_ipv6_getsockopt(sk, level, optname, optval,
					      optlen);

	return udp_lib_getsockopt(sk, level, optname, optval, optlen);
}
#endif
900 
901 static struct inet6_protocol udpv6_protocol = {
902 	.handler	=	udpv6_rcv,
903 	.err_handler	=	udpv6_err,
904 	.flags		=	INET6_PROTO_NOPOLICY|INET6_PROTO_FINAL,
905 };
906 
907 /* ------------------------------------------------------------------------ */
908 #ifdef CONFIG_PROC_FS
909 
910 static void udp6_sock_seq_show(struct seq_file *seq, struct sock *sp, int bucket)
911 {
912 	struct inet_sock *inet = inet_sk(sp);
913 	struct ipv6_pinfo *np = inet6_sk(sp);
914 	struct in6_addr *dest, *src;
915 	__u16 destp, srcp;
916 
917 	dest  = &np->daddr;
918 	src   = &np->rcv_saddr;
919 	destp = ntohs(inet->dport);
920 	srcp  = ntohs(inet->sport);
921 	seq_printf(seq,
922 		   "%4d: %08X%08X%08X%08X:%04X %08X%08X%08X%08X:%04X "
923 		   "%02X %08X:%08X %02X:%08lX %08X %5d %8d %lu %d %p\n",
924 		   bucket,
925 		   src->s6_addr32[0], src->s6_addr32[1],
926 		   src->s6_addr32[2], src->s6_addr32[3], srcp,
927 		   dest->s6_addr32[0], dest->s6_addr32[1],
928 		   dest->s6_addr32[2], dest->s6_addr32[3], destp,
929 		   sp->sk_state,
930 		   atomic_read(&sp->sk_wmem_alloc),
931 		   atomic_read(&sp->sk_rmem_alloc),
932 		   0, 0L, 0,
933 		   sock_i_uid(sp), 0,
934 		   sock_i_ino(sp),
935 		   atomic_read(&sp->sk_refcnt), sp);
936 }
937 
938 int udp6_seq_show(struct seq_file *seq, void *v)
939 {
940 	if (v == SEQ_START_TOKEN)
941 		seq_printf(seq,
942 			   "  sl  "
943 			   "local_address                         "
944 			   "remote_address                        "
945 			   "st tx_queue rx_queue tr tm->when retrnsmt"
946 			   "   uid  timeout inode\n");
947 	else
948 		udp6_sock_seq_show(seq, v, ((struct udp_iter_state *)seq->private)->bucket);
949 	return 0;
950 }
951 
952 static struct file_operations udp6_seq_fops;
953 static struct udp_seq_afinfo udp6_seq_afinfo = {
954 	.owner		= THIS_MODULE,
955 	.name		= "udp6",
956 	.family		= AF_INET6,
957 	.hashtable	= udp_hash,
958 	.seq_show	= udp6_seq_show,
959 	.seq_fops	= &udp6_seq_fops,
960 };
961 
962 int __init udp6_proc_init(void)
963 {
964 	return udp_proc_register(&udp6_seq_afinfo);
965 }
966 
967 void udp6_proc_exit(void) {
968 	udp_proc_unregister(&udp6_seq_afinfo);
969 }
970 #endif /* CONFIG_PROC_FS */
971 
972 /* ------------------------------------------------------------------------ */
973 
974 struct proto udpv6_prot = {
975 	.name		   = "UDPv6",
976 	.owner		   = THIS_MODULE,
977 	.close		   = udp_lib_close,
978 	.connect	   = ip6_datagram_connect,
979 	.disconnect	   = udp_disconnect,
980 	.ioctl		   = udp_ioctl,
981 	.destroy	   = udpv6_destroy_sock,
982 	.setsockopt	   = udpv6_setsockopt,
983 	.getsockopt	   = udpv6_getsockopt,
984 	.sendmsg	   = udpv6_sendmsg,
985 	.recvmsg	   = udpv6_recvmsg,
986 	.backlog_rcv	   = udpv6_queue_rcv_skb,
987 	.hash		   = udp_lib_hash,
988 	.unhash		   = udp_lib_unhash,
989 	.get_port	   = udp_v6_get_port,
990 	.obj_size	   = sizeof(struct udp6_sock),
991 #ifdef CONFIG_COMPAT
992 	.compat_setsockopt = compat_udpv6_setsockopt,
993 	.compat_getsockopt = compat_udpv6_getsockopt,
994 #endif
995 };
996 
997 static struct inet_protosw udpv6_protosw = {
998 	.type =      SOCK_DGRAM,
999 	.protocol =  IPPROTO_UDP,
1000 	.prot =      &udpv6_prot,
1001 	.ops =       &inet6_dgram_ops,
1002 	.capability =-1,
1003 	.no_check =  UDP_CSUM_DEFAULT,
1004 	.flags =     INET_PROTOSW_PERMANENT,
1005 };
1006 
1007 
1008 void __init udpv6_init(void)
1009 {
1010 	if (inet6_add_protocol(&udpv6_protocol, IPPROTO_UDP) < 0)
1011 		printk(KERN_ERR "udpv6_init: Could not register protocol\n");
1012 	inet6_register_protosw(&udpv6_protosw);
1013 }
1014