xref: /openbmc/linux/net/ipv6/icmp.c (revision 9b5b5cff)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  *	Internet Control Message Protocol (ICMPv6)
31da177e4SLinus Torvalds  *	Linux INET6 implementation
41da177e4SLinus Torvalds  *
51da177e4SLinus Torvalds  *	Authors:
61da177e4SLinus Torvalds  *	Pedro Roque		<roque@di.fc.ul.pt>
71da177e4SLinus Torvalds  *
81da177e4SLinus Torvalds  *	$Id: icmp.c,v 1.38 2002/02/08 03:57:19 davem Exp $
91da177e4SLinus Torvalds  *
101da177e4SLinus Torvalds  *	Based on net/ipv4/icmp.c
111da177e4SLinus Torvalds  *
121da177e4SLinus Torvalds  *	RFC 1885
131da177e4SLinus Torvalds  *
141da177e4SLinus Torvalds  *	This program is free software; you can redistribute it and/or
151da177e4SLinus Torvalds  *      modify it under the terms of the GNU General Public License
161da177e4SLinus Torvalds  *      as published by the Free Software Foundation; either version
171da177e4SLinus Torvalds  *      2 of the License, or (at your option) any later version.
181da177e4SLinus Torvalds  */
191da177e4SLinus Torvalds 
201da177e4SLinus Torvalds /*
211da177e4SLinus Torvalds  *	Changes:
221da177e4SLinus Torvalds  *
231da177e4SLinus Torvalds  *	Andi Kleen		:	exception handling
241da177e4SLinus Torvalds  *	Andi Kleen			add rate limits. never reply to a icmp.
251da177e4SLinus Torvalds  *					add more length checks and other fixes.
261da177e4SLinus Torvalds  *	yoshfuji		:	ensure to sent parameter problem for
271da177e4SLinus Torvalds  *					fragments.
281da177e4SLinus Torvalds  *	YOSHIFUJI Hideaki @USAGI:	added sysctl for icmp rate limit.
291da177e4SLinus Torvalds  *	Randy Dunlap and
301da177e4SLinus Torvalds  *	YOSHIFUJI Hideaki @USAGI:	Per-interface statistics support
311da177e4SLinus Torvalds  *	Kazunori MIYAZAWA @USAGI:       change output process to use ip6_append_data
321da177e4SLinus Torvalds  */
331da177e4SLinus Torvalds 
341da177e4SLinus Torvalds #include <linux/module.h>
351da177e4SLinus Torvalds #include <linux/errno.h>
361da177e4SLinus Torvalds #include <linux/types.h>
371da177e4SLinus Torvalds #include <linux/socket.h>
381da177e4SLinus Torvalds #include <linux/in.h>
391da177e4SLinus Torvalds #include <linux/kernel.h>
401da177e4SLinus Torvalds #include <linux/sched.h>
411da177e4SLinus Torvalds #include <linux/sockios.h>
421da177e4SLinus Torvalds #include <linux/net.h>
431da177e4SLinus Torvalds #include <linux/skbuff.h>
441da177e4SLinus Torvalds #include <linux/init.h>
451da177e4SLinus Torvalds 
461da177e4SLinus Torvalds #ifdef CONFIG_SYSCTL
471da177e4SLinus Torvalds #include <linux/sysctl.h>
481da177e4SLinus Torvalds #endif
491da177e4SLinus Torvalds 
501da177e4SLinus Torvalds #include <linux/inet.h>
511da177e4SLinus Torvalds #include <linux/netdevice.h>
521da177e4SLinus Torvalds #include <linux/icmpv6.h>
531da177e4SLinus Torvalds 
541da177e4SLinus Torvalds #include <net/ip.h>
551da177e4SLinus Torvalds #include <net/sock.h>
561da177e4SLinus Torvalds 
571da177e4SLinus Torvalds #include <net/ipv6.h>
581da177e4SLinus Torvalds #include <net/ip6_checksum.h>
591da177e4SLinus Torvalds #include <net/protocol.h>
601da177e4SLinus Torvalds #include <net/raw.h>
611da177e4SLinus Torvalds #include <net/rawv6.h>
621da177e4SLinus Torvalds #include <net/transp_v6.h>
631da177e4SLinus Torvalds #include <net/ip6_route.h>
641da177e4SLinus Torvalds #include <net/addrconf.h>
651da177e4SLinus Torvalds #include <net/icmp.h>
661da177e4SLinus Torvalds 
671da177e4SLinus Torvalds #include <asm/uaccess.h>
681da177e4SLinus Torvalds #include <asm/system.h>
691da177e4SLinus Torvalds 
70ba89966cSEric Dumazet DEFINE_SNMP_STAT(struct icmpv6_mib, icmpv6_statistics) __read_mostly;
711da177e4SLinus Torvalds 
721da177e4SLinus Torvalds /*
731da177e4SLinus Torvalds  *	The ICMP socket(s). This is the most convenient way to flow control
741da177e4SLinus Torvalds  *	our ICMP output as well as maintain a clean interface throughout
751da177e4SLinus Torvalds  *	all layers. All Socketless IP sends will soon be gone.
761da177e4SLinus Torvalds  *
771da177e4SLinus Torvalds  *	On SMP we have one ICMP socket per-cpu.
781da177e4SLinus Torvalds  */
791da177e4SLinus Torvalds static DEFINE_PER_CPU(struct socket *, __icmpv6_socket) = NULL;
801da177e4SLinus Torvalds #define icmpv6_socket	__get_cpu_var(__icmpv6_socket)
811da177e4SLinus Torvalds 
821da177e4SLinus Torvalds static int icmpv6_rcv(struct sk_buff **pskb, unsigned int *nhoffp);
831da177e4SLinus Torvalds 
841da177e4SLinus Torvalds static struct inet6_protocol icmpv6_protocol = {
851da177e4SLinus Torvalds 	.handler	=	icmpv6_rcv,
861da177e4SLinus Torvalds 	.flags		=	INET6_PROTO_FINAL,
871da177e4SLinus Torvalds };
881da177e4SLinus Torvalds 
891da177e4SLinus Torvalds static __inline__ int icmpv6_xmit_lock(void)
901da177e4SLinus Torvalds {
911da177e4SLinus Torvalds 	local_bh_disable();
921da177e4SLinus Torvalds 
931da177e4SLinus Torvalds 	if (unlikely(!spin_trylock(&icmpv6_socket->sk->sk_lock.slock))) {
941da177e4SLinus Torvalds 		/* This can happen if the output path (f.e. SIT or
951da177e4SLinus Torvalds 		 * ip6ip6 tunnel) signals dst_link_failure() for an
961da177e4SLinus Torvalds 		 * outgoing ICMP6 packet.
971da177e4SLinus Torvalds 		 */
981da177e4SLinus Torvalds 		local_bh_enable();
991da177e4SLinus Torvalds 		return 1;
1001da177e4SLinus Torvalds 	}
1011da177e4SLinus Torvalds 	return 0;
1021da177e4SLinus Torvalds }
1031da177e4SLinus Torvalds 
1041da177e4SLinus Torvalds static __inline__ void icmpv6_xmit_unlock(void)
1051da177e4SLinus Torvalds {
1061da177e4SLinus Torvalds 	spin_unlock_bh(&icmpv6_socket->sk->sk_lock.slock);
1071da177e4SLinus Torvalds }
1081da177e4SLinus Torvalds 
1091da177e4SLinus Torvalds /*
1101da177e4SLinus Torvalds  * Slightly more convenient version of icmpv6_send.
1111da177e4SLinus Torvalds  */
1121da177e4SLinus Torvalds void icmpv6_param_prob(struct sk_buff *skb, int code, int pos)
1131da177e4SLinus Torvalds {
1141da177e4SLinus Torvalds 	icmpv6_send(skb, ICMPV6_PARAMPROB, code, pos, skb->dev);
1151da177e4SLinus Torvalds 	kfree_skb(skb);
1161da177e4SLinus Torvalds }
1171da177e4SLinus Torvalds 
1181da177e4SLinus Torvalds /*
1191da177e4SLinus Torvalds  * Figure out, may we reply to this packet with icmp error.
1201da177e4SLinus Torvalds  *
1211da177e4SLinus Torvalds  * We do not reply, if:
1221da177e4SLinus Torvalds  *	- it was icmp error message.
1231da177e4SLinus Torvalds  *	- it is truncated, so that it is known, that protocol is ICMPV6
1241da177e4SLinus Torvalds  *	  (i.e. in the middle of some exthdr)
1251da177e4SLinus Torvalds  *
1261da177e4SLinus Torvalds  *	--ANK (980726)
1271da177e4SLinus Torvalds  */
1281da177e4SLinus Torvalds 
1291da177e4SLinus Torvalds static int is_ineligible(struct sk_buff *skb)
1301da177e4SLinus Torvalds {
1311da177e4SLinus Torvalds 	int ptr = (u8*)(skb->nh.ipv6h+1) - skb->data;
1321da177e4SLinus Torvalds 	int len = skb->len - ptr;
1331da177e4SLinus Torvalds 	__u8 nexthdr = skb->nh.ipv6h->nexthdr;
1341da177e4SLinus Torvalds 
1351da177e4SLinus Torvalds 	if (len < 0)
1361da177e4SLinus Torvalds 		return 1;
1371da177e4SLinus Torvalds 
1380d3d077cSHerbert Xu 	ptr = ipv6_skip_exthdr(skb, ptr, &nexthdr);
1391da177e4SLinus Torvalds 	if (ptr < 0)
1401da177e4SLinus Torvalds 		return 0;
1411da177e4SLinus Torvalds 	if (nexthdr == IPPROTO_ICMPV6) {
1421da177e4SLinus Torvalds 		u8 _type, *tp;
1431da177e4SLinus Torvalds 		tp = skb_header_pointer(skb,
1441da177e4SLinus Torvalds 			ptr+offsetof(struct icmp6hdr, icmp6_type),
1451da177e4SLinus Torvalds 			sizeof(_type), &_type);
1461da177e4SLinus Torvalds 		if (tp == NULL ||
1471da177e4SLinus Torvalds 		    !(*tp & ICMPV6_INFOMSG_MASK))
1481da177e4SLinus Torvalds 			return 1;
1491da177e4SLinus Torvalds 	}
1501da177e4SLinus Torvalds 	return 0;
1511da177e4SLinus Torvalds }
1521da177e4SLinus Torvalds 
1531da177e4SLinus Torvalds static int sysctl_icmpv6_time = 1*HZ;
1541da177e4SLinus Torvalds 
1551da177e4SLinus Torvalds /*
1561da177e4SLinus Torvalds  * Check the ICMP output rate limit
1571da177e4SLinus Torvalds  */
1581da177e4SLinus Torvalds static inline int icmpv6_xrlim_allow(struct sock *sk, int type,
1591da177e4SLinus Torvalds 				     struct flowi *fl)
1601da177e4SLinus Torvalds {
1611da177e4SLinus Torvalds 	struct dst_entry *dst;
1621da177e4SLinus Torvalds 	int res = 0;
1631da177e4SLinus Torvalds 
1641da177e4SLinus Torvalds 	/* Informational messages are not limited. */
1651da177e4SLinus Torvalds 	if (type & ICMPV6_INFOMSG_MASK)
1661da177e4SLinus Torvalds 		return 1;
1671da177e4SLinus Torvalds 
1681da177e4SLinus Torvalds 	/* Do not limit pmtu discovery, it would break it. */
1691da177e4SLinus Torvalds 	if (type == ICMPV6_PKT_TOOBIG)
1701da177e4SLinus Torvalds 		return 1;
1711da177e4SLinus Torvalds 
1721da177e4SLinus Torvalds 	/*
1731da177e4SLinus Torvalds 	 * Look up the output route.
1741da177e4SLinus Torvalds 	 * XXX: perhaps the expire for routing entries cloned by
1751da177e4SLinus Torvalds 	 * this lookup should be more aggressive (not longer than timeout).
1761da177e4SLinus Torvalds 	 */
1771da177e4SLinus Torvalds 	dst = ip6_route_output(sk, fl);
1781da177e4SLinus Torvalds 	if (dst->error) {
1791da177e4SLinus Torvalds 		IP6_INC_STATS(IPSTATS_MIB_OUTNOROUTES);
1801da177e4SLinus Torvalds 	} else if (dst->dev && (dst->dev->flags&IFF_LOOPBACK)) {
1811da177e4SLinus Torvalds 		res = 1;
1821da177e4SLinus Torvalds 	} else {
1831da177e4SLinus Torvalds 		struct rt6_info *rt = (struct rt6_info *)dst;
1841da177e4SLinus Torvalds 		int tmo = sysctl_icmpv6_time;
1851da177e4SLinus Torvalds 
1861da177e4SLinus Torvalds 		/* Give more bandwidth to wider prefixes. */
1871da177e4SLinus Torvalds 		if (rt->rt6i_dst.plen < 128)
1881da177e4SLinus Torvalds 			tmo >>= ((128 - rt->rt6i_dst.plen)>>5);
1891da177e4SLinus Torvalds 
1901da177e4SLinus Torvalds 		res = xrlim_allow(dst, tmo);
1911da177e4SLinus Torvalds 	}
1921da177e4SLinus Torvalds 	dst_release(dst);
1931da177e4SLinus Torvalds 	return res;
1941da177e4SLinus Torvalds }
1951da177e4SLinus Torvalds 
1961da177e4SLinus Torvalds /*
1971da177e4SLinus Torvalds  *	an inline helper for the "simple" if statement below
1981da177e4SLinus Torvalds  *	checks if parameter problem report is caused by an
1991da177e4SLinus Torvalds  *	unrecognized IPv6 option that has the Option Type
2001da177e4SLinus Torvalds  *	highest-order two bits set to 10
2011da177e4SLinus Torvalds  */
2021da177e4SLinus Torvalds 
2031da177e4SLinus Torvalds static __inline__ int opt_unrec(struct sk_buff *skb, __u32 offset)
2041da177e4SLinus Torvalds {
2051da177e4SLinus Torvalds 	u8 _optval, *op;
2061da177e4SLinus Torvalds 
2071da177e4SLinus Torvalds 	offset += skb->nh.raw - skb->data;
2081da177e4SLinus Torvalds 	op = skb_header_pointer(skb, offset, sizeof(_optval), &_optval);
2091da177e4SLinus Torvalds 	if (op == NULL)
2101da177e4SLinus Torvalds 		return 1;
2111da177e4SLinus Torvalds 	return (*op & 0xC0) == 0x80;
2121da177e4SLinus Torvalds }
2131da177e4SLinus Torvalds 
2141da177e4SLinus Torvalds static int icmpv6_push_pending_frames(struct sock *sk, struct flowi *fl, struct icmp6hdr *thdr, int len)
2151da177e4SLinus Torvalds {
2161da177e4SLinus Torvalds 	struct sk_buff *skb;
2171da177e4SLinus Torvalds 	struct icmp6hdr *icmp6h;
2181da177e4SLinus Torvalds 	int err = 0;
2191da177e4SLinus Torvalds 
2201da177e4SLinus Torvalds 	if ((skb = skb_peek(&sk->sk_write_queue)) == NULL)
2211da177e4SLinus Torvalds 		goto out;
2221da177e4SLinus Torvalds 
2231da177e4SLinus Torvalds 	icmp6h = (struct icmp6hdr*) skb->h.raw;
2241da177e4SLinus Torvalds 	memcpy(icmp6h, thdr, sizeof(struct icmp6hdr));
2251da177e4SLinus Torvalds 	icmp6h->icmp6_cksum = 0;
2261da177e4SLinus Torvalds 
2271da177e4SLinus Torvalds 	if (skb_queue_len(&sk->sk_write_queue) == 1) {
2281da177e4SLinus Torvalds 		skb->csum = csum_partial((char *)icmp6h,
2291da177e4SLinus Torvalds 					sizeof(struct icmp6hdr), skb->csum);
2301da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
2311da177e4SLinus Torvalds 						      &fl->fl6_dst,
2321da177e4SLinus Torvalds 						      len, fl->proto,
2331da177e4SLinus Torvalds 						      skb->csum);
2341da177e4SLinus Torvalds 	} else {
2351da177e4SLinus Torvalds 		u32 tmp_csum = 0;
2361da177e4SLinus Torvalds 
2371da177e4SLinus Torvalds 		skb_queue_walk(&sk->sk_write_queue, skb) {
2381da177e4SLinus Torvalds 			tmp_csum = csum_add(tmp_csum, skb->csum);
2391da177e4SLinus Torvalds 		}
2401da177e4SLinus Torvalds 
2411da177e4SLinus Torvalds 		tmp_csum = csum_partial((char *)icmp6h,
2421da177e4SLinus Torvalds 					sizeof(struct icmp6hdr), tmp_csum);
2431da177e4SLinus Torvalds 		tmp_csum = csum_ipv6_magic(&fl->fl6_src,
2441da177e4SLinus Torvalds 					   &fl->fl6_dst,
2451da177e4SLinus Torvalds 					   len, fl->proto, tmp_csum);
2461da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = tmp_csum;
2471da177e4SLinus Torvalds 	}
2481da177e4SLinus Torvalds 	if (icmp6h->icmp6_cksum == 0)
2491da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = -1;
2501da177e4SLinus Torvalds 	ip6_push_pending_frames(sk);
2511da177e4SLinus Torvalds out:
2521da177e4SLinus Torvalds 	return err;
2531da177e4SLinus Torvalds }
2541da177e4SLinus Torvalds 
/* Cookie handed to icmpv6_getfrag() through ip6_append_data(). */
struct icmpv6_msg {
	struct sk_buff	*skb;		/* packet whose bytes are copied out */
	int		offset;		/* base offset into skb for the copy */
};
2591da177e4SLinus Torvalds 
2601da177e4SLinus Torvalds static int icmpv6_getfrag(void *from, char *to, int offset, int len, int odd, struct sk_buff *skb)
2611da177e4SLinus Torvalds {
2621da177e4SLinus Torvalds 	struct icmpv6_msg *msg = (struct icmpv6_msg *) from;
2631da177e4SLinus Torvalds 	struct sk_buff *org_skb = msg->skb;
2641da177e4SLinus Torvalds 	__u32 csum = 0;
2651da177e4SLinus Torvalds 
2661da177e4SLinus Torvalds 	csum = skb_copy_and_csum_bits(org_skb, msg->offset + offset,
2671da177e4SLinus Torvalds 				      to, len, csum);
2681da177e4SLinus Torvalds 	skb->csum = csum_block_add(skb->csum, csum, odd);
2691da177e4SLinus Torvalds 	return 0;
2701da177e4SLinus Torvalds }
2711da177e4SLinus Torvalds 
2721da177e4SLinus Torvalds /*
2731da177e4SLinus Torvalds  *	Send an ICMP message in response to a packet in error
2741da177e4SLinus Torvalds  */
2751da177e4SLinus Torvalds void icmpv6_send(struct sk_buff *skb, int type, int code, __u32 info,
2761da177e4SLinus Torvalds 		 struct net_device *dev)
2771da177e4SLinus Torvalds {
2781da177e4SLinus Torvalds 	struct inet6_dev *idev = NULL;
2791da177e4SLinus Torvalds 	struct ipv6hdr *hdr = skb->nh.ipv6h;
28084427d53SYOSHIFUJI Hideaki 	struct sock *sk;
28184427d53SYOSHIFUJI Hideaki 	struct ipv6_pinfo *np;
2821da177e4SLinus Torvalds 	struct in6_addr *saddr = NULL;
2831da177e4SLinus Torvalds 	struct dst_entry *dst;
2841da177e4SLinus Torvalds 	struct icmp6hdr tmp_hdr;
2851da177e4SLinus Torvalds 	struct flowi fl;
2861da177e4SLinus Torvalds 	struct icmpv6_msg msg;
2871da177e4SLinus Torvalds 	int iif = 0;
2881da177e4SLinus Torvalds 	int addr_type = 0;
2891da177e4SLinus Torvalds 	int len;
29041a1f8eaSYOSHIFUJI Hideaki 	int hlimit, tclass;
2911da177e4SLinus Torvalds 	int err = 0;
2921da177e4SLinus Torvalds 
2931da177e4SLinus Torvalds 	if ((u8*)hdr < skb->head || (u8*)(hdr+1) > skb->tail)
2941da177e4SLinus Torvalds 		return;
2951da177e4SLinus Torvalds 
2961da177e4SLinus Torvalds 	/*
2971da177e4SLinus Torvalds 	 *	Make sure we respect the rules
2981da177e4SLinus Torvalds 	 *	i.e. RFC 1885 2.4(e)
2991da177e4SLinus Torvalds 	 *	Rule (e.1) is enforced by not using icmpv6_send
3001da177e4SLinus Torvalds 	 *	in any code that processes icmp errors.
3011da177e4SLinus Torvalds 	 */
3021da177e4SLinus Torvalds 	addr_type = ipv6_addr_type(&hdr->daddr);
3031da177e4SLinus Torvalds 
3041da177e4SLinus Torvalds 	if (ipv6_chk_addr(&hdr->daddr, skb->dev, 0))
3051da177e4SLinus Torvalds 		saddr = &hdr->daddr;
3061da177e4SLinus Torvalds 
3071da177e4SLinus Torvalds 	/*
3081da177e4SLinus Torvalds 	 *	Dest addr check
3091da177e4SLinus Torvalds 	 */
3101da177e4SLinus Torvalds 
3111da177e4SLinus Torvalds 	if ((addr_type & IPV6_ADDR_MULTICAST || skb->pkt_type != PACKET_HOST)) {
3121da177e4SLinus Torvalds 		if (type != ICMPV6_PKT_TOOBIG &&
3131da177e4SLinus Torvalds 		    !(type == ICMPV6_PARAMPROB &&
3141da177e4SLinus Torvalds 		      code == ICMPV6_UNK_OPTION &&
3151da177e4SLinus Torvalds 		      (opt_unrec(skb, info))))
3161da177e4SLinus Torvalds 			return;
3171da177e4SLinus Torvalds 
3181da177e4SLinus Torvalds 		saddr = NULL;
3191da177e4SLinus Torvalds 	}
3201da177e4SLinus Torvalds 
3211da177e4SLinus Torvalds 	addr_type = ipv6_addr_type(&hdr->saddr);
3221da177e4SLinus Torvalds 
3231da177e4SLinus Torvalds 	/*
3241da177e4SLinus Torvalds 	 *	Source addr check
3251da177e4SLinus Torvalds 	 */
3261da177e4SLinus Torvalds 
3271da177e4SLinus Torvalds 	if (addr_type & IPV6_ADDR_LINKLOCAL)
3281da177e4SLinus Torvalds 		iif = skb->dev->ifindex;
3291da177e4SLinus Torvalds 
3301da177e4SLinus Torvalds 	/*
3311da177e4SLinus Torvalds 	 *	Must not send if we know that source is Anycast also.
3321da177e4SLinus Torvalds 	 *	for now we don't know that.
3331da177e4SLinus Torvalds 	 */
3341da177e4SLinus Torvalds 	if ((addr_type == IPV6_ADDR_ANY) || (addr_type & IPV6_ADDR_MULTICAST)) {
33564ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: addr_any/mcast source\n");
3361da177e4SLinus Torvalds 		return;
3371da177e4SLinus Torvalds 	}
3381da177e4SLinus Torvalds 
3391da177e4SLinus Torvalds 	/*
3401da177e4SLinus Torvalds 	 *	Never answer to a ICMP packet.
3411da177e4SLinus Torvalds 	 */
3421da177e4SLinus Torvalds 	if (is_ineligible(skb)) {
34364ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: no reply to icmp error\n");
3441da177e4SLinus Torvalds 		return;
3451da177e4SLinus Torvalds 	}
3461da177e4SLinus Torvalds 
3471da177e4SLinus Torvalds 	memset(&fl, 0, sizeof(fl));
3481da177e4SLinus Torvalds 	fl.proto = IPPROTO_ICMPV6;
3491da177e4SLinus Torvalds 	ipv6_addr_copy(&fl.fl6_dst, &hdr->saddr);
3501da177e4SLinus Torvalds 	if (saddr)
3511da177e4SLinus Torvalds 		ipv6_addr_copy(&fl.fl6_src, saddr);
3521da177e4SLinus Torvalds 	fl.oif = iif;
3531da177e4SLinus Torvalds 	fl.fl_icmp_type = type;
3541da177e4SLinus Torvalds 	fl.fl_icmp_code = code;
3551da177e4SLinus Torvalds 
3561da177e4SLinus Torvalds 	if (icmpv6_xmit_lock())
3571da177e4SLinus Torvalds 		return;
3581da177e4SLinus Torvalds 
35984427d53SYOSHIFUJI Hideaki 	sk = icmpv6_socket->sk;
36084427d53SYOSHIFUJI Hideaki 	np = inet6_sk(sk);
36184427d53SYOSHIFUJI Hideaki 
3621da177e4SLinus Torvalds 	if (!icmpv6_xrlim_allow(sk, type, &fl))
3631da177e4SLinus Torvalds 		goto out;
3641da177e4SLinus Torvalds 
3651da177e4SLinus Torvalds 	tmp_hdr.icmp6_type = type;
3661da177e4SLinus Torvalds 	tmp_hdr.icmp6_code = code;
3671da177e4SLinus Torvalds 	tmp_hdr.icmp6_cksum = 0;
3681da177e4SLinus Torvalds 	tmp_hdr.icmp6_pointer = htonl(info);
3691da177e4SLinus Torvalds 
3701da177e4SLinus Torvalds 	if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
3711da177e4SLinus Torvalds 		fl.oif = np->mcast_oif;
3721da177e4SLinus Torvalds 
3731da177e4SLinus Torvalds 	err = ip6_dst_lookup(sk, &dst, &fl);
3741da177e4SLinus Torvalds 	if (err)
3751da177e4SLinus Torvalds 		goto out;
3761da177e4SLinus Torvalds 	if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
377e104411bSPatrick McHardy 		goto out;
3781da177e4SLinus Torvalds 
3791da177e4SLinus Torvalds 	if (ipv6_addr_is_multicast(&fl.fl6_dst))
3801da177e4SLinus Torvalds 		hlimit = np->mcast_hops;
3811da177e4SLinus Torvalds 	else
3821da177e4SLinus Torvalds 		hlimit = np->hop_limit;
3831da177e4SLinus Torvalds 	if (hlimit < 0)
3841da177e4SLinus Torvalds 		hlimit = dst_metric(dst, RTAX_HOPLIMIT);
3851da177e4SLinus Torvalds 	if (hlimit < 0)
3861da177e4SLinus Torvalds 		hlimit = ipv6_get_hoplimit(dst->dev);
3871da177e4SLinus Torvalds 
38841a1f8eaSYOSHIFUJI Hideaki 	tclass = np->cork.tclass;
38941a1f8eaSYOSHIFUJI Hideaki 	if (tclass < 0)
39041a1f8eaSYOSHIFUJI Hideaki 		tclass = 0;
39141a1f8eaSYOSHIFUJI Hideaki 
3921da177e4SLinus Torvalds 	msg.skb = skb;
3931da177e4SLinus Torvalds 	msg.offset = skb->nh.raw - skb->data;
3941da177e4SLinus Torvalds 
3951da177e4SLinus Torvalds 	len = skb->len - msg.offset;
3961da177e4SLinus Torvalds 	len = min_t(unsigned int, len, IPV6_MIN_MTU - sizeof(struct ipv6hdr) -sizeof(struct icmp6hdr));
3971da177e4SLinus Torvalds 	if (len < 0) {
39864ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmp: len problem\n");
3991da177e4SLinus Torvalds 		goto out_dst_release;
4001da177e4SLinus Torvalds 	}
4011da177e4SLinus Torvalds 
4021da177e4SLinus Torvalds 	idev = in6_dev_get(skb->dev);
4031da177e4SLinus Torvalds 
4041da177e4SLinus Torvalds 	err = ip6_append_data(sk, icmpv6_getfrag, &msg,
4051da177e4SLinus Torvalds 			      len + sizeof(struct icmp6hdr),
4061da177e4SLinus Torvalds 			      sizeof(struct icmp6hdr),
40741a1f8eaSYOSHIFUJI Hideaki 			      hlimit, tclass, NULL, &fl, (struct rt6_info*)dst,
4081da177e4SLinus Torvalds 			      MSG_DONTWAIT);
4091da177e4SLinus Torvalds 	if (err) {
4101da177e4SLinus Torvalds 		ip6_flush_pending_frames(sk);
4111da177e4SLinus Torvalds 		goto out_put;
4121da177e4SLinus Torvalds 	}
4131da177e4SLinus Torvalds 	err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, len + sizeof(struct icmp6hdr));
4141da177e4SLinus Torvalds 
4151da177e4SLinus Torvalds 	if (type >= ICMPV6_DEST_UNREACH && type <= ICMPV6_PARAMPROB)
4161da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_OUTDESTUNREACHS, type - ICMPV6_DEST_UNREACH);
4171da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTMSGS);
4181da177e4SLinus Torvalds 
4191da177e4SLinus Torvalds out_put:
4201da177e4SLinus Torvalds 	if (likely(idev != NULL))
4211da177e4SLinus Torvalds 		in6_dev_put(idev);
4221da177e4SLinus Torvalds out_dst_release:
4231da177e4SLinus Torvalds 	dst_release(dst);
4241da177e4SLinus Torvalds out:
4251da177e4SLinus Torvalds 	icmpv6_xmit_unlock();
4261da177e4SLinus Torvalds }
4271da177e4SLinus Torvalds 
4281da177e4SLinus Torvalds static void icmpv6_echo_reply(struct sk_buff *skb)
4291da177e4SLinus Torvalds {
43084427d53SYOSHIFUJI Hideaki 	struct sock *sk;
4311da177e4SLinus Torvalds 	struct inet6_dev *idev;
43284427d53SYOSHIFUJI Hideaki 	struct ipv6_pinfo *np;
4331da177e4SLinus Torvalds 	struct in6_addr *saddr = NULL;
4341da177e4SLinus Torvalds 	struct icmp6hdr *icmph = (struct icmp6hdr *) skb->h.raw;
4351da177e4SLinus Torvalds 	struct icmp6hdr tmp_hdr;
4361da177e4SLinus Torvalds 	struct flowi fl;
4371da177e4SLinus Torvalds 	struct icmpv6_msg msg;
4381da177e4SLinus Torvalds 	struct dst_entry *dst;
4391da177e4SLinus Torvalds 	int err = 0;
4401da177e4SLinus Torvalds 	int hlimit;
44141a1f8eaSYOSHIFUJI Hideaki 	int tclass;
4421da177e4SLinus Torvalds 
4431da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->daddr;
4441da177e4SLinus Torvalds 
4451da177e4SLinus Torvalds 	if (!ipv6_unicast_destination(skb))
4461da177e4SLinus Torvalds 		saddr = NULL;
4471da177e4SLinus Torvalds 
4481da177e4SLinus Torvalds 	memcpy(&tmp_hdr, icmph, sizeof(tmp_hdr));
4491da177e4SLinus Torvalds 	tmp_hdr.icmp6_type = ICMPV6_ECHO_REPLY;
4501da177e4SLinus Torvalds 
4511da177e4SLinus Torvalds 	memset(&fl, 0, sizeof(fl));
4521da177e4SLinus Torvalds 	fl.proto = IPPROTO_ICMPV6;
4531da177e4SLinus Torvalds 	ipv6_addr_copy(&fl.fl6_dst, &skb->nh.ipv6h->saddr);
4541da177e4SLinus Torvalds 	if (saddr)
4551da177e4SLinus Torvalds 		ipv6_addr_copy(&fl.fl6_src, saddr);
4561da177e4SLinus Torvalds 	fl.oif = skb->dev->ifindex;
4571da177e4SLinus Torvalds 	fl.fl_icmp_type = ICMPV6_ECHO_REPLY;
4581da177e4SLinus Torvalds 
4591da177e4SLinus Torvalds 	if (icmpv6_xmit_lock())
4601da177e4SLinus Torvalds 		return;
4611da177e4SLinus Torvalds 
46284427d53SYOSHIFUJI Hideaki 	sk = icmpv6_socket->sk;
46384427d53SYOSHIFUJI Hideaki 	np = inet6_sk(sk);
46484427d53SYOSHIFUJI Hideaki 
4651da177e4SLinus Torvalds 	if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
4661da177e4SLinus Torvalds 		fl.oif = np->mcast_oif;
4671da177e4SLinus Torvalds 
4681da177e4SLinus Torvalds 	err = ip6_dst_lookup(sk, &dst, &fl);
4691da177e4SLinus Torvalds 	if (err)
4701da177e4SLinus Torvalds 		goto out;
4711da177e4SLinus Torvalds 	if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
472e104411bSPatrick McHardy 		goto out;
4731da177e4SLinus Torvalds 
4741da177e4SLinus Torvalds 	if (ipv6_addr_is_multicast(&fl.fl6_dst))
4751da177e4SLinus Torvalds 		hlimit = np->mcast_hops;
4761da177e4SLinus Torvalds 	else
4771da177e4SLinus Torvalds 		hlimit = np->hop_limit;
4781da177e4SLinus Torvalds 	if (hlimit < 0)
4791da177e4SLinus Torvalds 		hlimit = dst_metric(dst, RTAX_HOPLIMIT);
4801da177e4SLinus Torvalds 	if (hlimit < 0)
4811da177e4SLinus Torvalds 		hlimit = ipv6_get_hoplimit(dst->dev);
4821da177e4SLinus Torvalds 
48341a1f8eaSYOSHIFUJI Hideaki 	tclass = np->cork.tclass;
48441a1f8eaSYOSHIFUJI Hideaki 	if (tclass < 0)
48541a1f8eaSYOSHIFUJI Hideaki 		tclass = 0;
48641a1f8eaSYOSHIFUJI Hideaki 
4871da177e4SLinus Torvalds 	idev = in6_dev_get(skb->dev);
4881da177e4SLinus Torvalds 
4891da177e4SLinus Torvalds 	msg.skb = skb;
4901da177e4SLinus Torvalds 	msg.offset = 0;
4911da177e4SLinus Torvalds 
4921da177e4SLinus Torvalds 	err = ip6_append_data(sk, icmpv6_getfrag, &msg, skb->len + sizeof(struct icmp6hdr),
49341a1f8eaSYOSHIFUJI Hideaki 				sizeof(struct icmp6hdr), hlimit, tclass, NULL, &fl,
4941da177e4SLinus Torvalds 				(struct rt6_info*)dst, MSG_DONTWAIT);
4951da177e4SLinus Torvalds 
4961da177e4SLinus Torvalds 	if (err) {
4971da177e4SLinus Torvalds 		ip6_flush_pending_frames(sk);
4981da177e4SLinus Torvalds 		goto out_put;
4991da177e4SLinus Torvalds 	}
5001da177e4SLinus Torvalds 	err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, skb->len + sizeof(struct icmp6hdr));
5011da177e4SLinus Torvalds 
5021da177e4SLinus Torvalds         ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTECHOREPLIES);
5031da177e4SLinus Torvalds         ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTMSGS);
5041da177e4SLinus Torvalds 
5051da177e4SLinus Torvalds out_put:
5061da177e4SLinus Torvalds 	if (likely(idev != NULL))
5071da177e4SLinus Torvalds 		in6_dev_put(idev);
5081da177e4SLinus Torvalds 	dst_release(dst);
5091da177e4SLinus Torvalds out:
5101da177e4SLinus Torvalds 	icmpv6_xmit_unlock();
5111da177e4SLinus Torvalds }
5121da177e4SLinus Torvalds 
5131da177e4SLinus Torvalds static void icmpv6_notify(struct sk_buff *skb, int type, int code, u32 info)
5141da177e4SLinus Torvalds {
5151da177e4SLinus Torvalds 	struct in6_addr *saddr, *daddr;
5161da177e4SLinus Torvalds 	struct inet6_protocol *ipprot;
5171da177e4SLinus Torvalds 	struct sock *sk;
5181da177e4SLinus Torvalds 	int inner_offset;
5191da177e4SLinus Torvalds 	int hash;
5201da177e4SLinus Torvalds 	u8 nexthdr;
5211da177e4SLinus Torvalds 
5221da177e4SLinus Torvalds 	if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
5231da177e4SLinus Torvalds 		return;
5241da177e4SLinus Torvalds 
5251da177e4SLinus Torvalds 	nexthdr = ((struct ipv6hdr *)skb->data)->nexthdr;
5261da177e4SLinus Torvalds 	if (ipv6_ext_hdr(nexthdr)) {
5271da177e4SLinus Torvalds 		/* now skip over extension headers */
5280d3d077cSHerbert Xu 		inner_offset = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &nexthdr);
5291da177e4SLinus Torvalds 		if (inner_offset<0)
5301da177e4SLinus Torvalds 			return;
5311da177e4SLinus Torvalds 	} else {
5321da177e4SLinus Torvalds 		inner_offset = sizeof(struct ipv6hdr);
5331da177e4SLinus Torvalds 	}
5341da177e4SLinus Torvalds 
5351da177e4SLinus Torvalds 	/* Checkin header including 8 bytes of inner protocol header. */
5361da177e4SLinus Torvalds 	if (!pskb_may_pull(skb, inner_offset+8))
5371da177e4SLinus Torvalds 		return;
5381da177e4SLinus Torvalds 
5391da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->saddr;
5401da177e4SLinus Torvalds 	daddr = &skb->nh.ipv6h->daddr;
5411da177e4SLinus Torvalds 
5421da177e4SLinus Torvalds 	/* BUGGG_FUTURE: we should try to parse exthdrs in this packet.
5431da177e4SLinus Torvalds 	   Without this we will not able f.e. to make source routed
5441da177e4SLinus Torvalds 	   pmtu discovery.
5451da177e4SLinus Torvalds 	   Corresponding argument (opt) to notifiers is already added.
5461da177e4SLinus Torvalds 	   --ANK (980726)
5471da177e4SLinus Torvalds 	 */
5481da177e4SLinus Torvalds 
5491da177e4SLinus Torvalds 	hash = nexthdr & (MAX_INET_PROTOS - 1);
5501da177e4SLinus Torvalds 
5511da177e4SLinus Torvalds 	rcu_read_lock();
5521da177e4SLinus Torvalds 	ipprot = rcu_dereference(inet6_protos[hash]);
5531da177e4SLinus Torvalds 	if (ipprot && ipprot->err_handler)
5541da177e4SLinus Torvalds 		ipprot->err_handler(skb, NULL, type, code, inner_offset, info);
5551da177e4SLinus Torvalds 	rcu_read_unlock();
5561da177e4SLinus Torvalds 
5571da177e4SLinus Torvalds 	read_lock(&raw_v6_lock);
5581da177e4SLinus Torvalds 	if ((sk = sk_head(&raw_v6_htable[hash])) != NULL) {
5590bd1b59bSAndrew McDonald 		while((sk = __raw_v6_lookup(sk, nexthdr, daddr, saddr,
5602dac4b96SYOSHIFUJI Hideaki 					    IP6CB(skb)->iif))) {
5611da177e4SLinus Torvalds 			rawv6_err(sk, skb, NULL, type, code, inner_offset, info);
5621da177e4SLinus Torvalds 			sk = sk_next(sk);
5631da177e4SLinus Torvalds 		}
5641da177e4SLinus Torvalds 	}
5651da177e4SLinus Torvalds 	read_unlock(&raw_v6_lock);
5661da177e4SLinus Torvalds }
5671da177e4SLinus Torvalds 
5681da177e4SLinus Torvalds /*
5691da177e4SLinus Torvalds  *	Handle icmp messages
5701da177e4SLinus Torvalds  */
5711da177e4SLinus Torvalds 
5721da177e4SLinus Torvalds static int icmpv6_rcv(struct sk_buff **pskb, unsigned int *nhoffp)
5731da177e4SLinus Torvalds {
5741da177e4SLinus Torvalds 	struct sk_buff *skb = *pskb;
5751da177e4SLinus Torvalds 	struct net_device *dev = skb->dev;
5761da177e4SLinus Torvalds 	struct inet6_dev *idev = __in6_dev_get(dev);
5771da177e4SLinus Torvalds 	struct in6_addr *saddr, *daddr;
5781da177e4SLinus Torvalds 	struct ipv6hdr *orig_hdr;
5791da177e4SLinus Torvalds 	struct icmp6hdr *hdr;
5801da177e4SLinus Torvalds 	int type;
5811da177e4SLinus Torvalds 
5821da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INMSGS);
5831da177e4SLinus Torvalds 
5841da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->saddr;
5851da177e4SLinus Torvalds 	daddr = &skb->nh.ipv6h->daddr;
5861da177e4SLinus Torvalds 
5871da177e4SLinus Torvalds 	/* Perform checksum. */
588fb286bb2SHerbert Xu 	switch (skb->ip_summed) {
589fb286bb2SHerbert Xu 	case CHECKSUM_HW:
590fb286bb2SHerbert Xu 		if (!csum_ipv6_magic(saddr, daddr, skb->len, IPPROTO_ICMPV6,
591fb286bb2SHerbert Xu 				     skb->csum))
592fb286bb2SHerbert Xu 			break;
593fb286bb2SHerbert Xu 		/* fall through */
594fb286bb2SHerbert Xu 	case CHECKSUM_NONE:
595fb286bb2SHerbert Xu 		skb->csum = ~csum_ipv6_magic(saddr, daddr, skb->len,
596fb286bb2SHerbert Xu 					     IPPROTO_ICMPV6, 0);
597fb286bb2SHerbert Xu 		if (__skb_checksum_complete(skb)) {
59864ce2073SPatrick McHardy 			LIMIT_NETDEBUG(KERN_DEBUG "ICMPv6 checksum failed [%04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x > %04x:%04x:%04x:%04x:%04x:%04x:%04x:%04x]\n",
59964ce2073SPatrick McHardy 				       NIP6(*saddr), NIP6(*daddr));
6001da177e4SLinus Torvalds 			goto discard_it;
6011da177e4SLinus Torvalds 		}
6021da177e4SLinus Torvalds 	}
6031da177e4SLinus Torvalds 
6041da177e4SLinus Torvalds 	if (!pskb_pull(skb, sizeof(struct icmp6hdr)))
6051da177e4SLinus Torvalds 		goto discard_it;
6061da177e4SLinus Torvalds 
6071da177e4SLinus Torvalds 	hdr = (struct icmp6hdr *) skb->h.raw;
6081da177e4SLinus Torvalds 
6091da177e4SLinus Torvalds 	type = hdr->icmp6_type;
6101da177e4SLinus Torvalds 
6111da177e4SLinus Torvalds 	if (type >= ICMPV6_DEST_UNREACH && type <= ICMPV6_PARAMPROB)
6121da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_INDESTUNREACHS, type - ICMPV6_DEST_UNREACH);
6131da177e4SLinus Torvalds 	else if (type >= ICMPV6_ECHO_REQUEST && type <= NDISC_REDIRECT)
6141da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_INECHOS, type - ICMPV6_ECHO_REQUEST);
6151da177e4SLinus Torvalds 
6161da177e4SLinus Torvalds 	switch (type) {
6171da177e4SLinus Torvalds 	case ICMPV6_ECHO_REQUEST:
6181da177e4SLinus Torvalds 		icmpv6_echo_reply(skb);
6191da177e4SLinus Torvalds 		break;
6201da177e4SLinus Torvalds 
6211da177e4SLinus Torvalds 	case ICMPV6_ECHO_REPLY:
6221da177e4SLinus Torvalds 		/* we couldn't care less */
6231da177e4SLinus Torvalds 		break;
6241da177e4SLinus Torvalds 
6251da177e4SLinus Torvalds 	case ICMPV6_PKT_TOOBIG:
6261da177e4SLinus Torvalds 		/* BUGGG_FUTURE: if packet contains rthdr, we cannot update
6271da177e4SLinus Torvalds 		   standard destination cache. Seems, only "advanced"
6281da177e4SLinus Torvalds 		   destination cache will allow to solve this problem
6291da177e4SLinus Torvalds 		   --ANK (980726)
6301da177e4SLinus Torvalds 		 */
6311da177e4SLinus Torvalds 		if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
6321da177e4SLinus Torvalds 			goto discard_it;
6331da177e4SLinus Torvalds 		hdr = (struct icmp6hdr *) skb->h.raw;
6341da177e4SLinus Torvalds 		orig_hdr = (struct ipv6hdr *) (hdr + 1);
6351da177e4SLinus Torvalds 		rt6_pmtu_discovery(&orig_hdr->daddr, &orig_hdr->saddr, dev,
6361da177e4SLinus Torvalds 				   ntohl(hdr->icmp6_mtu));
6371da177e4SLinus Torvalds 
6381da177e4SLinus Torvalds 		/*
6391da177e4SLinus Torvalds 		 *	Drop through to notify
6401da177e4SLinus Torvalds 		 */
6411da177e4SLinus Torvalds 
6421da177e4SLinus Torvalds 	case ICMPV6_DEST_UNREACH:
6431da177e4SLinus Torvalds 	case ICMPV6_TIME_EXCEED:
6441da177e4SLinus Torvalds 	case ICMPV6_PARAMPROB:
6451da177e4SLinus Torvalds 		icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
6461da177e4SLinus Torvalds 		break;
6471da177e4SLinus Torvalds 
6481da177e4SLinus Torvalds 	case NDISC_ROUTER_SOLICITATION:
6491da177e4SLinus Torvalds 	case NDISC_ROUTER_ADVERTISEMENT:
6501da177e4SLinus Torvalds 	case NDISC_NEIGHBOUR_SOLICITATION:
6511da177e4SLinus Torvalds 	case NDISC_NEIGHBOUR_ADVERTISEMENT:
6521da177e4SLinus Torvalds 	case NDISC_REDIRECT:
6531da177e4SLinus Torvalds 		ndisc_rcv(skb);
6541da177e4SLinus Torvalds 		break;
6551da177e4SLinus Torvalds 
6561da177e4SLinus Torvalds 	case ICMPV6_MGM_QUERY:
6571da177e4SLinus Torvalds 		igmp6_event_query(skb);
6581da177e4SLinus Torvalds 		break;
6591da177e4SLinus Torvalds 
6601da177e4SLinus Torvalds 	case ICMPV6_MGM_REPORT:
6611da177e4SLinus Torvalds 		igmp6_event_report(skb);
6621da177e4SLinus Torvalds 		break;
6631da177e4SLinus Torvalds 
6641da177e4SLinus Torvalds 	case ICMPV6_MGM_REDUCTION:
6651da177e4SLinus Torvalds 	case ICMPV6_NI_QUERY:
6661da177e4SLinus Torvalds 	case ICMPV6_NI_REPLY:
6671da177e4SLinus Torvalds 	case ICMPV6_MLD2_REPORT:
6681da177e4SLinus Torvalds 	case ICMPV6_DHAAD_REQUEST:
6691da177e4SLinus Torvalds 	case ICMPV6_DHAAD_REPLY:
6701da177e4SLinus Torvalds 	case ICMPV6_MOBILE_PREFIX_SOL:
6711da177e4SLinus Torvalds 	case ICMPV6_MOBILE_PREFIX_ADV:
6721da177e4SLinus Torvalds 		break;
6731da177e4SLinus Torvalds 
6741da177e4SLinus Torvalds 	default:
67564ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6: msg of unknown type\n");
6761da177e4SLinus Torvalds 
6771da177e4SLinus Torvalds 		/* informational */
6781da177e4SLinus Torvalds 		if (type & ICMPV6_INFOMSG_MASK)
6791da177e4SLinus Torvalds 			break;
6801da177e4SLinus Torvalds 
6811da177e4SLinus Torvalds 		/*
6821da177e4SLinus Torvalds 		 * error of unknown type.
6831da177e4SLinus Torvalds 		 * must pass to upper level
6841da177e4SLinus Torvalds 		 */
6851da177e4SLinus Torvalds 
6861da177e4SLinus Torvalds 		icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
6871da177e4SLinus Torvalds 	};
6881da177e4SLinus Torvalds 	kfree_skb(skb);
6891da177e4SLinus Torvalds 	return 0;
6901da177e4SLinus Torvalds 
6911da177e4SLinus Torvalds discard_it:
6921da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INERRORS);
6931da177e4SLinus Torvalds 	kfree_skb(skb);
6941da177e4SLinus Torvalds 	return 0;
6951da177e4SLinus Torvalds }
6961da177e4SLinus Torvalds 
6971da177e4SLinus Torvalds int __init icmpv6_init(struct net_proto_family *ops)
6981da177e4SLinus Torvalds {
6991da177e4SLinus Torvalds 	struct sock *sk;
7001da177e4SLinus Torvalds 	int err, i, j;
7011da177e4SLinus Torvalds 
702670c02c2SJohn Hawkes 	for_each_cpu(i) {
7031da177e4SLinus Torvalds 		err = sock_create_kern(PF_INET6, SOCK_RAW, IPPROTO_ICMPV6,
7041da177e4SLinus Torvalds 				       &per_cpu(__icmpv6_socket, i));
7051da177e4SLinus Torvalds 		if (err < 0) {
7061da177e4SLinus Torvalds 			printk(KERN_ERR
7071da177e4SLinus Torvalds 			       "Failed to initialize the ICMP6 control socket "
7081da177e4SLinus Torvalds 			       "(err %d).\n",
7091da177e4SLinus Torvalds 			       err);
7101da177e4SLinus Torvalds 			goto fail;
7111da177e4SLinus Torvalds 		}
7121da177e4SLinus Torvalds 
7131da177e4SLinus Torvalds 		sk = per_cpu(__icmpv6_socket, i)->sk;
7141da177e4SLinus Torvalds 		sk->sk_allocation = GFP_ATOMIC;
7151da177e4SLinus Torvalds 
7161da177e4SLinus Torvalds 		/* Enough space for 2 64K ICMP packets, including
7171da177e4SLinus Torvalds 		 * sk_buff struct overhead.
7181da177e4SLinus Torvalds 		 */
7191da177e4SLinus Torvalds 		sk->sk_sndbuf =
7201da177e4SLinus Torvalds 			(2 * ((64 * 1024) + sizeof(struct sk_buff)));
7211da177e4SLinus Torvalds 
7221da177e4SLinus Torvalds 		sk->sk_prot->unhash(sk);
7231da177e4SLinus Torvalds 	}
7241da177e4SLinus Torvalds 
7251da177e4SLinus Torvalds 
7261da177e4SLinus Torvalds 	if (inet6_add_protocol(&icmpv6_protocol, IPPROTO_ICMPV6) < 0) {
7271da177e4SLinus Torvalds 		printk(KERN_ERR "Failed to register ICMP6 protocol\n");
7281da177e4SLinus Torvalds 		err = -EAGAIN;
7291da177e4SLinus Torvalds 		goto fail;
7301da177e4SLinus Torvalds 	}
7311da177e4SLinus Torvalds 
7321da177e4SLinus Torvalds 	return 0;
7331da177e4SLinus Torvalds 
7341da177e4SLinus Torvalds  fail:
7351da177e4SLinus Torvalds 	for (j = 0; j < i; j++) {
7361da177e4SLinus Torvalds 		if (!cpu_possible(j))
7371da177e4SLinus Torvalds 			continue;
7381da177e4SLinus Torvalds 		sock_release(per_cpu(__icmpv6_socket, j));
7391da177e4SLinus Torvalds 	}
7401da177e4SLinus Torvalds 
7411da177e4SLinus Torvalds 	return err;
7421da177e4SLinus Torvalds }
7431da177e4SLinus Torvalds 
7441da177e4SLinus Torvalds void icmpv6_cleanup(void)
7451da177e4SLinus Torvalds {
7461da177e4SLinus Torvalds 	int i;
7471da177e4SLinus Torvalds 
748670c02c2SJohn Hawkes 	for_each_cpu(i) {
7491da177e4SLinus Torvalds 		sock_release(per_cpu(__icmpv6_socket, i));
7501da177e4SLinus Torvalds 	}
7511da177e4SLinus Torvalds 	inet6_del_protocol(&icmpv6_protocol, IPPROTO_ICMPV6);
7521da177e4SLinus Torvalds }
7531da177e4SLinus Torvalds 
/*
 *	errno / fatal-flag pairs for ICMPv6 Destination Unreachable,
 *	indexed by the ICMPv6 code (see icmpv6_err_convert()).
 */
static const struct icmp6_err {
	int err;	/* positive errno value */
	int fatal;	/* value icmpv6_err_convert() returns for this code */
} tab_unreach[] = {
	{ .err = ENETUNREACH,	.fatal = 0 },	/* NOROUTE */
	{ .err = EACCES,	.fatal = 1 },	/* ADM_PROHIBITED */
	{ .err = EHOSTUNREACH,	.fatal = 0 },	/* Was NOT_NEIGHBOUR, now reserved */
	{ .err = EHOSTUNREACH,	.fatal = 0 },	/* ADDR_UNREACH */
	{ .err = ECONNREFUSED,	.fatal = 1 },	/* PORT_UNREACH */
};
7791da177e4SLinus Torvalds 
7801da177e4SLinus Torvalds int icmpv6_err_convert(int type, int code, int *err)
7811da177e4SLinus Torvalds {
7821da177e4SLinus Torvalds 	int fatal = 0;
7831da177e4SLinus Torvalds 
7841da177e4SLinus Torvalds 	*err = EPROTO;
7851da177e4SLinus Torvalds 
7861da177e4SLinus Torvalds 	switch (type) {
7871da177e4SLinus Torvalds 	case ICMPV6_DEST_UNREACH:
7881da177e4SLinus Torvalds 		fatal = 1;
7891da177e4SLinus Torvalds 		if (code <= ICMPV6_PORT_UNREACH) {
7901da177e4SLinus Torvalds 			*err  = tab_unreach[code].err;
7911da177e4SLinus Torvalds 			fatal = tab_unreach[code].fatal;
7921da177e4SLinus Torvalds 		}
7931da177e4SLinus Torvalds 		break;
7941da177e4SLinus Torvalds 
7951da177e4SLinus Torvalds 	case ICMPV6_PKT_TOOBIG:
7961da177e4SLinus Torvalds 		*err = EMSGSIZE;
7971da177e4SLinus Torvalds 		break;
7981da177e4SLinus Torvalds 
7991da177e4SLinus Torvalds 	case ICMPV6_PARAMPROB:
8001da177e4SLinus Torvalds 		*err = EPROTO;
8011da177e4SLinus Torvalds 		fatal = 1;
8021da177e4SLinus Torvalds 		break;
8031da177e4SLinus Torvalds 
8041da177e4SLinus Torvalds 	case ICMPV6_TIME_EXCEED:
8051da177e4SLinus Torvalds 		*err = EHOSTUNREACH;
8061da177e4SLinus Torvalds 		break;
8071da177e4SLinus Torvalds 	};
8081da177e4SLinus Torvalds 
8091da177e4SLinus Torvalds 	return fatal;
8101da177e4SLinus Torvalds }
8111da177e4SLinus Torvalds 
#ifdef CONFIG_SYSCTL
/*
 *	sysctl table for ICMPv6.  The single "ratelimit" entry exposes
 *	sysctl_icmpv6_time as an int (mode 0644) through proc_dointvec.
 */
ctl_table ipv6_icmp_table[] = {
	{
		.ctl_name	= NET_IPV6_ICMP_RATELIMIT,
		.procname	= "ratelimit",
		.mode		= 0644,
		.data		= &sysctl_icmpv6_time,
		.maxlen		= sizeof(int),
		.proc_handler	= proc_dointvec,
	},
	/* entry with ctl_name 0 closes the table */
	{ .ctl_name = 0 },
};
#endif /* CONFIG_SYSCTL */
8251da177e4SLinus Torvalds 
826