xref: /openbmc/linux/net/ipv6/icmp.c (revision 84fa7933)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  *	Internet Control Message Protocol (ICMPv6)
31da177e4SLinus Torvalds  *	Linux INET6 implementation
41da177e4SLinus Torvalds  *
51da177e4SLinus Torvalds  *	Authors:
61da177e4SLinus Torvalds  *	Pedro Roque		<roque@di.fc.ul.pt>
71da177e4SLinus Torvalds  *
81da177e4SLinus Torvalds  *	$Id: icmp.c,v 1.38 2002/02/08 03:57:19 davem Exp $
91da177e4SLinus Torvalds  *
101da177e4SLinus Torvalds  *	Based on net/ipv4/icmp.c
111da177e4SLinus Torvalds  *
121da177e4SLinus Torvalds  *	RFC 1885
131da177e4SLinus Torvalds  *
141da177e4SLinus Torvalds  *	This program is free software; you can redistribute it and/or
151da177e4SLinus Torvalds  *      modify it under the terms of the GNU General Public License
161da177e4SLinus Torvalds  *      as published by the Free Software Foundation; either version
171da177e4SLinus Torvalds  *      2 of the License, or (at your option) any later version.
181da177e4SLinus Torvalds  */
191da177e4SLinus Torvalds 
201da177e4SLinus Torvalds /*
211da177e4SLinus Torvalds  *	Changes:
221da177e4SLinus Torvalds  *
231da177e4SLinus Torvalds  *	Andi Kleen		:	exception handling
241da177e4SLinus Torvalds  *	Andi Kleen			add rate limits. never reply to a icmp.
251da177e4SLinus Torvalds  *					add more length checks and other fixes.
261da177e4SLinus Torvalds  *	yoshfuji		:	ensure to sent parameter problem for
271da177e4SLinus Torvalds  *					fragments.
281da177e4SLinus Torvalds  *	YOSHIFUJI Hideaki @USAGI:	added sysctl for icmp rate limit.
291da177e4SLinus Torvalds  *	Randy Dunlap and
301da177e4SLinus Torvalds  *	YOSHIFUJI Hideaki @USAGI:	Per-interface statistics support
311da177e4SLinus Torvalds  *	Kazunori MIYAZAWA @USAGI:       change output process to use ip6_append_data
321da177e4SLinus Torvalds  */
331da177e4SLinus Torvalds 
341da177e4SLinus Torvalds #include <linux/module.h>
351da177e4SLinus Torvalds #include <linux/errno.h>
361da177e4SLinus Torvalds #include <linux/types.h>
371da177e4SLinus Torvalds #include <linux/socket.h>
381da177e4SLinus Torvalds #include <linux/in.h>
391da177e4SLinus Torvalds #include <linux/kernel.h>
401da177e4SLinus Torvalds #include <linux/sched.h>
411da177e4SLinus Torvalds #include <linux/sockios.h>
421da177e4SLinus Torvalds #include <linux/net.h>
431da177e4SLinus Torvalds #include <linux/skbuff.h>
441da177e4SLinus Torvalds #include <linux/init.h>
45763ecff1SYasuyuki Kozakai #include <linux/netfilter.h>
461da177e4SLinus Torvalds 
471da177e4SLinus Torvalds #ifdef CONFIG_SYSCTL
481da177e4SLinus Torvalds #include <linux/sysctl.h>
491da177e4SLinus Torvalds #endif
501da177e4SLinus Torvalds 
511da177e4SLinus Torvalds #include <linux/inet.h>
521da177e4SLinus Torvalds #include <linux/netdevice.h>
531da177e4SLinus Torvalds #include <linux/icmpv6.h>
541da177e4SLinus Torvalds 
551da177e4SLinus Torvalds #include <net/ip.h>
561da177e4SLinus Torvalds #include <net/sock.h>
571da177e4SLinus Torvalds 
581da177e4SLinus Torvalds #include <net/ipv6.h>
591da177e4SLinus Torvalds #include <net/ip6_checksum.h>
601da177e4SLinus Torvalds #include <net/protocol.h>
611da177e4SLinus Torvalds #include <net/raw.h>
621da177e4SLinus Torvalds #include <net/rawv6.h>
631da177e4SLinus Torvalds #include <net/transp_v6.h>
641da177e4SLinus Torvalds #include <net/ip6_route.h>
651da177e4SLinus Torvalds #include <net/addrconf.h>
661da177e4SLinus Torvalds #include <net/icmp.h>
671da177e4SLinus Torvalds 
681da177e4SLinus Torvalds #include <asm/uaccess.h>
691da177e4SLinus Torvalds #include <asm/system.h>
701da177e4SLinus Torvalds 
71ba89966cSEric Dumazet DEFINE_SNMP_STAT(struct icmpv6_mib, icmpv6_statistics) __read_mostly;
721da177e4SLinus Torvalds 
731da177e4SLinus Torvalds /*
741da177e4SLinus Torvalds  *	The ICMP socket(s). This is the most convenient way to flow control
751da177e4SLinus Torvalds  *	our ICMP output as well as maintain a clean interface throughout
761da177e4SLinus Torvalds  *	all layers. All Socketless IP sends will soon be gone.
771da177e4SLinus Torvalds  *
781da177e4SLinus Torvalds  *	On SMP we have one ICMP socket per-cpu.
791da177e4SLinus Torvalds  */
801da177e4SLinus Torvalds static DEFINE_PER_CPU(struct socket *, __icmpv6_socket) = NULL;
811da177e4SLinus Torvalds #define icmpv6_socket	__get_cpu_var(__icmpv6_socket)
821da177e4SLinus Torvalds 
83951dbc8aSPatrick McHardy static int icmpv6_rcv(struct sk_buff **pskb);
841da177e4SLinus Torvalds 
851da177e4SLinus Torvalds static struct inet6_protocol icmpv6_protocol = {
861da177e4SLinus Torvalds 	.handler	=	icmpv6_rcv,
871da177e4SLinus Torvalds 	.flags		=	INET6_PROTO_FINAL,
881da177e4SLinus Torvalds };
891da177e4SLinus Torvalds 
901da177e4SLinus Torvalds static __inline__ int icmpv6_xmit_lock(void)
911da177e4SLinus Torvalds {
921da177e4SLinus Torvalds 	local_bh_disable();
931da177e4SLinus Torvalds 
941da177e4SLinus Torvalds 	if (unlikely(!spin_trylock(&icmpv6_socket->sk->sk_lock.slock))) {
951da177e4SLinus Torvalds 		/* This can happen if the output path (f.e. SIT or
961da177e4SLinus Torvalds 		 * ip6ip6 tunnel) signals dst_link_failure() for an
971da177e4SLinus Torvalds 		 * outgoing ICMP6 packet.
981da177e4SLinus Torvalds 		 */
991da177e4SLinus Torvalds 		local_bh_enable();
1001da177e4SLinus Torvalds 		return 1;
1011da177e4SLinus Torvalds 	}
1021da177e4SLinus Torvalds 	return 0;
1031da177e4SLinus Torvalds }
1041da177e4SLinus Torvalds 
1051da177e4SLinus Torvalds static __inline__ void icmpv6_xmit_unlock(void)
1061da177e4SLinus Torvalds {
1071da177e4SLinus Torvalds 	spin_unlock_bh(&icmpv6_socket->sk->sk_lock.slock);
1081da177e4SLinus Torvalds }
1091da177e4SLinus Torvalds 
1101da177e4SLinus Torvalds /*
1111da177e4SLinus Torvalds  * Slightly more convenient version of icmpv6_send.
1121da177e4SLinus Torvalds  */
1131da177e4SLinus Torvalds void icmpv6_param_prob(struct sk_buff *skb, int code, int pos)
1141da177e4SLinus Torvalds {
1151da177e4SLinus Torvalds 	icmpv6_send(skb, ICMPV6_PARAMPROB, code, pos, skb->dev);
1161da177e4SLinus Torvalds 	kfree_skb(skb);
1171da177e4SLinus Torvalds }
1181da177e4SLinus Torvalds 
1191da177e4SLinus Torvalds /*
1201da177e4SLinus Torvalds  * Figure out, may we reply to this packet with icmp error.
1211da177e4SLinus Torvalds  *
1221da177e4SLinus Torvalds  * We do not reply, if:
1231da177e4SLinus Torvalds  *	- it was icmp error message.
1241da177e4SLinus Torvalds  *	- it is truncated, so that it is known, that protocol is ICMPV6
1251da177e4SLinus Torvalds  *	  (i.e. in the middle of some exthdr)
1261da177e4SLinus Torvalds  *
1271da177e4SLinus Torvalds  *	--ANK (980726)
1281da177e4SLinus Torvalds  */
1291da177e4SLinus Torvalds 
1301da177e4SLinus Torvalds static int is_ineligible(struct sk_buff *skb)
1311da177e4SLinus Torvalds {
1321da177e4SLinus Torvalds 	int ptr = (u8*)(skb->nh.ipv6h+1) - skb->data;
1331da177e4SLinus Torvalds 	int len = skb->len - ptr;
1341da177e4SLinus Torvalds 	__u8 nexthdr = skb->nh.ipv6h->nexthdr;
1351da177e4SLinus Torvalds 
1361da177e4SLinus Torvalds 	if (len < 0)
1371da177e4SLinus Torvalds 		return 1;
1381da177e4SLinus Torvalds 
1390d3d077cSHerbert Xu 	ptr = ipv6_skip_exthdr(skb, ptr, &nexthdr);
1401da177e4SLinus Torvalds 	if (ptr < 0)
1411da177e4SLinus Torvalds 		return 0;
1421da177e4SLinus Torvalds 	if (nexthdr == IPPROTO_ICMPV6) {
1431da177e4SLinus Torvalds 		u8 _type, *tp;
1441da177e4SLinus Torvalds 		tp = skb_header_pointer(skb,
1451da177e4SLinus Torvalds 			ptr+offsetof(struct icmp6hdr, icmp6_type),
1461da177e4SLinus Torvalds 			sizeof(_type), &_type);
1471da177e4SLinus Torvalds 		if (tp == NULL ||
1481da177e4SLinus Torvalds 		    !(*tp & ICMPV6_INFOMSG_MASK))
1491da177e4SLinus Torvalds 			return 1;
1501da177e4SLinus Torvalds 	}
1511da177e4SLinus Torvalds 	return 0;
1521da177e4SLinus Torvalds }
1531da177e4SLinus Torvalds 
1541da177e4SLinus Torvalds static int sysctl_icmpv6_time = 1*HZ;
1551da177e4SLinus Torvalds 
1561da177e4SLinus Torvalds /*
1571da177e4SLinus Torvalds  * Check the ICMP output rate limit
1581da177e4SLinus Torvalds  */
1591da177e4SLinus Torvalds static inline int icmpv6_xrlim_allow(struct sock *sk, int type,
1601da177e4SLinus Torvalds 				     struct flowi *fl)
1611da177e4SLinus Torvalds {
1621da177e4SLinus Torvalds 	struct dst_entry *dst;
1631da177e4SLinus Torvalds 	int res = 0;
1641da177e4SLinus Torvalds 
1651da177e4SLinus Torvalds 	/* Informational messages are not limited. */
1661da177e4SLinus Torvalds 	if (type & ICMPV6_INFOMSG_MASK)
1671da177e4SLinus Torvalds 		return 1;
1681da177e4SLinus Torvalds 
1691da177e4SLinus Torvalds 	/* Do not limit pmtu discovery, it would break it. */
1701da177e4SLinus Torvalds 	if (type == ICMPV6_PKT_TOOBIG)
1711da177e4SLinus Torvalds 		return 1;
1721da177e4SLinus Torvalds 
1731da177e4SLinus Torvalds 	/*
1741da177e4SLinus Torvalds 	 * Look up the output route.
1751da177e4SLinus Torvalds 	 * XXX: perhaps the expire for routing entries cloned by
1761da177e4SLinus Torvalds 	 * this lookup should be more aggressive (not longer than timeout).
1771da177e4SLinus Torvalds 	 */
1781da177e4SLinus Torvalds 	dst = ip6_route_output(sk, fl);
1791da177e4SLinus Torvalds 	if (dst->error) {
1801da177e4SLinus Torvalds 		IP6_INC_STATS(IPSTATS_MIB_OUTNOROUTES);
1811da177e4SLinus Torvalds 	} else if (dst->dev && (dst->dev->flags&IFF_LOOPBACK)) {
1821da177e4SLinus Torvalds 		res = 1;
1831da177e4SLinus Torvalds 	} else {
1841da177e4SLinus Torvalds 		struct rt6_info *rt = (struct rt6_info *)dst;
1851da177e4SLinus Torvalds 		int tmo = sysctl_icmpv6_time;
1861da177e4SLinus Torvalds 
1871da177e4SLinus Torvalds 		/* Give more bandwidth to wider prefixes. */
1881da177e4SLinus Torvalds 		if (rt->rt6i_dst.plen < 128)
1891da177e4SLinus Torvalds 			tmo >>= ((128 - rt->rt6i_dst.plen)>>5);
1901da177e4SLinus Torvalds 
1911da177e4SLinus Torvalds 		res = xrlim_allow(dst, tmo);
1921da177e4SLinus Torvalds 	}
1931da177e4SLinus Torvalds 	dst_release(dst);
1941da177e4SLinus Torvalds 	return res;
1951da177e4SLinus Torvalds }
1961da177e4SLinus Torvalds 
1971da177e4SLinus Torvalds /*
1981da177e4SLinus Torvalds  *	an inline helper for the "simple" if statement below
1991da177e4SLinus Torvalds  *	checks if parameter problem report is caused by an
2001da177e4SLinus Torvalds  *	unrecognized IPv6 option that has the Option Type
2011da177e4SLinus Torvalds  *	highest-order two bits set to 10
2021da177e4SLinus Torvalds  */
2031da177e4SLinus Torvalds 
2041da177e4SLinus Torvalds static __inline__ int opt_unrec(struct sk_buff *skb, __u32 offset)
2051da177e4SLinus Torvalds {
2061da177e4SLinus Torvalds 	u8 _optval, *op;
2071da177e4SLinus Torvalds 
2081da177e4SLinus Torvalds 	offset += skb->nh.raw - skb->data;
2091da177e4SLinus Torvalds 	op = skb_header_pointer(skb, offset, sizeof(_optval), &_optval);
2101da177e4SLinus Torvalds 	if (op == NULL)
2111da177e4SLinus Torvalds 		return 1;
2121da177e4SLinus Torvalds 	return (*op & 0xC0) == 0x80;
2131da177e4SLinus Torvalds }
2141da177e4SLinus Torvalds 
2151da177e4SLinus Torvalds static int icmpv6_push_pending_frames(struct sock *sk, struct flowi *fl, struct icmp6hdr *thdr, int len)
2161da177e4SLinus Torvalds {
2171da177e4SLinus Torvalds 	struct sk_buff *skb;
2181da177e4SLinus Torvalds 	struct icmp6hdr *icmp6h;
2191da177e4SLinus Torvalds 	int err = 0;
2201da177e4SLinus Torvalds 
2211da177e4SLinus Torvalds 	if ((skb = skb_peek(&sk->sk_write_queue)) == NULL)
2221da177e4SLinus Torvalds 		goto out;
2231da177e4SLinus Torvalds 
2241da177e4SLinus Torvalds 	icmp6h = (struct icmp6hdr*) skb->h.raw;
2251da177e4SLinus Torvalds 	memcpy(icmp6h, thdr, sizeof(struct icmp6hdr));
2261da177e4SLinus Torvalds 	icmp6h->icmp6_cksum = 0;
2271da177e4SLinus Torvalds 
2281da177e4SLinus Torvalds 	if (skb_queue_len(&sk->sk_write_queue) == 1) {
2291da177e4SLinus Torvalds 		skb->csum = csum_partial((char *)icmp6h,
2301da177e4SLinus Torvalds 					sizeof(struct icmp6hdr), skb->csum);
2311da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
2321da177e4SLinus Torvalds 						      &fl->fl6_dst,
2331da177e4SLinus Torvalds 						      len, fl->proto,
2341da177e4SLinus Torvalds 						      skb->csum);
2351da177e4SLinus Torvalds 	} else {
2361da177e4SLinus Torvalds 		u32 tmp_csum = 0;
2371da177e4SLinus Torvalds 
2381da177e4SLinus Torvalds 		skb_queue_walk(&sk->sk_write_queue, skb) {
2391da177e4SLinus Torvalds 			tmp_csum = csum_add(tmp_csum, skb->csum);
2401da177e4SLinus Torvalds 		}
2411da177e4SLinus Torvalds 
2421da177e4SLinus Torvalds 		tmp_csum = csum_partial((char *)icmp6h,
2431da177e4SLinus Torvalds 					sizeof(struct icmp6hdr), tmp_csum);
2441da177e4SLinus Torvalds 		tmp_csum = csum_ipv6_magic(&fl->fl6_src,
2451da177e4SLinus Torvalds 					   &fl->fl6_dst,
2461da177e4SLinus Torvalds 					   len, fl->proto, tmp_csum);
2471da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = tmp_csum;
2481da177e4SLinus Torvalds 	}
2491da177e4SLinus Torvalds 	if (icmp6h->icmp6_cksum == 0)
2501da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = -1;
2511da177e4SLinus Torvalds 	ip6_push_pending_frames(sk);
2521da177e4SLinus Torvalds out:
2531da177e4SLinus Torvalds 	return err;
2541da177e4SLinus Torvalds }
2551da177e4SLinus Torvalds 
/* Cookie handed to icmpv6_getfrag() through ip6_append_data(). */
struct icmpv6_msg {
	struct sk_buff	*skb;		/* packet the payload is copied from */
	int		offset;		/* base offset into that packet */
	uint8_t		type;		/* ICMPv6 type of the outgoing message */
};
2611da177e4SLinus Torvalds 
2621da177e4SLinus Torvalds static int icmpv6_getfrag(void *from, char *to, int offset, int len, int odd, struct sk_buff *skb)
2631da177e4SLinus Torvalds {
2641da177e4SLinus Torvalds 	struct icmpv6_msg *msg = (struct icmpv6_msg *) from;
2651da177e4SLinus Torvalds 	struct sk_buff *org_skb = msg->skb;
2661da177e4SLinus Torvalds 	__u32 csum = 0;
2671da177e4SLinus Torvalds 
2681da177e4SLinus Torvalds 	csum = skb_copy_and_csum_bits(org_skb, msg->offset + offset,
2691da177e4SLinus Torvalds 				      to, len, csum);
2701da177e4SLinus Torvalds 	skb->csum = csum_block_add(skb->csum, csum, odd);
271763ecff1SYasuyuki Kozakai 	if (!(msg->type & ICMPV6_INFOMSG_MASK))
272763ecff1SYasuyuki Kozakai 		nf_ct_attach(skb, org_skb);
2731da177e4SLinus Torvalds 	return 0;
2741da177e4SLinus Torvalds }
2751da177e4SLinus Torvalds 
2761da177e4SLinus Torvalds /*
2771da177e4SLinus Torvalds  *	Send an ICMP message in response to a packet in error
2781da177e4SLinus Torvalds  */
2791da177e4SLinus Torvalds void icmpv6_send(struct sk_buff *skb, int type, int code, __u32 info,
2801da177e4SLinus Torvalds 		 struct net_device *dev)
2811da177e4SLinus Torvalds {
2821da177e4SLinus Torvalds 	struct inet6_dev *idev = NULL;
2831da177e4SLinus Torvalds 	struct ipv6hdr *hdr = skb->nh.ipv6h;
28484427d53SYOSHIFUJI Hideaki 	struct sock *sk;
28584427d53SYOSHIFUJI Hideaki 	struct ipv6_pinfo *np;
2861da177e4SLinus Torvalds 	struct in6_addr *saddr = NULL;
2871da177e4SLinus Torvalds 	struct dst_entry *dst;
2881da177e4SLinus Torvalds 	struct icmp6hdr tmp_hdr;
2891da177e4SLinus Torvalds 	struct flowi fl;
2901da177e4SLinus Torvalds 	struct icmpv6_msg msg;
2911da177e4SLinus Torvalds 	int iif = 0;
2921da177e4SLinus Torvalds 	int addr_type = 0;
2931da177e4SLinus Torvalds 	int len;
29441a1f8eaSYOSHIFUJI Hideaki 	int hlimit, tclass;
2951da177e4SLinus Torvalds 	int err = 0;
2961da177e4SLinus Torvalds 
2971da177e4SLinus Torvalds 	if ((u8*)hdr < skb->head || (u8*)(hdr+1) > skb->tail)
2981da177e4SLinus Torvalds 		return;
2991da177e4SLinus Torvalds 
3001da177e4SLinus Torvalds 	/*
3011da177e4SLinus Torvalds 	 *	Make sure we respect the rules
3021da177e4SLinus Torvalds 	 *	i.e. RFC 1885 2.4(e)
3031da177e4SLinus Torvalds 	 *	Rule (e.1) is enforced by not using icmpv6_send
3041da177e4SLinus Torvalds 	 *	in any code that processes icmp errors.
3051da177e4SLinus Torvalds 	 */
3061da177e4SLinus Torvalds 	addr_type = ipv6_addr_type(&hdr->daddr);
3071da177e4SLinus Torvalds 
3081da177e4SLinus Torvalds 	if (ipv6_chk_addr(&hdr->daddr, skb->dev, 0))
3091da177e4SLinus Torvalds 		saddr = &hdr->daddr;
3101da177e4SLinus Torvalds 
3111da177e4SLinus Torvalds 	/*
3121da177e4SLinus Torvalds 	 *	Dest addr check
3131da177e4SLinus Torvalds 	 */
3141da177e4SLinus Torvalds 
3151da177e4SLinus Torvalds 	if ((addr_type & IPV6_ADDR_MULTICAST || skb->pkt_type != PACKET_HOST)) {
3161da177e4SLinus Torvalds 		if (type != ICMPV6_PKT_TOOBIG &&
3171da177e4SLinus Torvalds 		    !(type == ICMPV6_PARAMPROB &&
3181da177e4SLinus Torvalds 		      code == ICMPV6_UNK_OPTION &&
3191da177e4SLinus Torvalds 		      (opt_unrec(skb, info))))
3201da177e4SLinus Torvalds 			return;
3211da177e4SLinus Torvalds 
3221da177e4SLinus Torvalds 		saddr = NULL;
3231da177e4SLinus Torvalds 	}
3241da177e4SLinus Torvalds 
3251da177e4SLinus Torvalds 	addr_type = ipv6_addr_type(&hdr->saddr);
3261da177e4SLinus Torvalds 
3271da177e4SLinus Torvalds 	/*
3281da177e4SLinus Torvalds 	 *	Source addr check
3291da177e4SLinus Torvalds 	 */
3301da177e4SLinus Torvalds 
3311da177e4SLinus Torvalds 	if (addr_type & IPV6_ADDR_LINKLOCAL)
3321da177e4SLinus Torvalds 		iif = skb->dev->ifindex;
3331da177e4SLinus Torvalds 
3341da177e4SLinus Torvalds 	/*
3358de3351eSYOSHIFUJI Hideaki 	 *	Must not send error if the source does not uniquely
3368de3351eSYOSHIFUJI Hideaki 	 *	identify a single node (RFC2463 Section 2.4).
3378de3351eSYOSHIFUJI Hideaki 	 *	We check unspecified / multicast addresses here,
3388de3351eSYOSHIFUJI Hideaki 	 *	and anycast addresses will be checked later.
3391da177e4SLinus Torvalds 	 */
3401da177e4SLinus Torvalds 	if ((addr_type == IPV6_ADDR_ANY) || (addr_type & IPV6_ADDR_MULTICAST)) {
34164ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: addr_any/mcast source\n");
3421da177e4SLinus Torvalds 		return;
3431da177e4SLinus Torvalds 	}
3441da177e4SLinus Torvalds 
3451da177e4SLinus Torvalds 	/*
3461da177e4SLinus Torvalds 	 *	Never answer to a ICMP packet.
3471da177e4SLinus Torvalds 	 */
3481da177e4SLinus Torvalds 	if (is_ineligible(skb)) {
34964ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: no reply to icmp error\n");
3501da177e4SLinus Torvalds 		return;
3511da177e4SLinus Torvalds 	}
3521da177e4SLinus Torvalds 
3531da177e4SLinus Torvalds 	memset(&fl, 0, sizeof(fl));
3541da177e4SLinus Torvalds 	fl.proto = IPPROTO_ICMPV6;
3551da177e4SLinus Torvalds 	ipv6_addr_copy(&fl.fl6_dst, &hdr->saddr);
3561da177e4SLinus Torvalds 	if (saddr)
3571da177e4SLinus Torvalds 		ipv6_addr_copy(&fl.fl6_src, saddr);
3581da177e4SLinus Torvalds 	fl.oif = iif;
3591da177e4SLinus Torvalds 	fl.fl_icmp_type = type;
3601da177e4SLinus Torvalds 	fl.fl_icmp_code = code;
361beb8d13bSVenkat Yekkirala 	security_skb_classify_flow(skb, &fl);
3621da177e4SLinus Torvalds 
3631da177e4SLinus Torvalds 	if (icmpv6_xmit_lock())
3641da177e4SLinus Torvalds 		return;
3651da177e4SLinus Torvalds 
36684427d53SYOSHIFUJI Hideaki 	sk = icmpv6_socket->sk;
36784427d53SYOSHIFUJI Hideaki 	np = inet6_sk(sk);
36884427d53SYOSHIFUJI Hideaki 
3691da177e4SLinus Torvalds 	if (!icmpv6_xrlim_allow(sk, type, &fl))
3701da177e4SLinus Torvalds 		goto out;
3711da177e4SLinus Torvalds 
3721da177e4SLinus Torvalds 	tmp_hdr.icmp6_type = type;
3731da177e4SLinus Torvalds 	tmp_hdr.icmp6_code = code;
3741da177e4SLinus Torvalds 	tmp_hdr.icmp6_cksum = 0;
3751da177e4SLinus Torvalds 	tmp_hdr.icmp6_pointer = htonl(info);
3761da177e4SLinus Torvalds 
3771da177e4SLinus Torvalds 	if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
3781da177e4SLinus Torvalds 		fl.oif = np->mcast_oif;
3791da177e4SLinus Torvalds 
3801da177e4SLinus Torvalds 	err = ip6_dst_lookup(sk, &dst, &fl);
3811da177e4SLinus Torvalds 	if (err)
3821da177e4SLinus Torvalds 		goto out;
3838de3351eSYOSHIFUJI Hideaki 
3848de3351eSYOSHIFUJI Hideaki 	/*
3858de3351eSYOSHIFUJI Hideaki 	 * We won't send icmp if the destination is known
3868de3351eSYOSHIFUJI Hideaki 	 * anycast.
3878de3351eSYOSHIFUJI Hideaki 	 */
3888de3351eSYOSHIFUJI Hideaki 	if (((struct rt6_info *)dst)->rt6i_flags & RTF_ANYCAST) {
3898de3351eSYOSHIFUJI Hideaki 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: acast source\n");
3908de3351eSYOSHIFUJI Hideaki 		goto out_dst_release;
3918de3351eSYOSHIFUJI Hideaki 	}
3928de3351eSYOSHIFUJI Hideaki 
3931da177e4SLinus Torvalds 	if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
394e104411bSPatrick McHardy 		goto out;
3951da177e4SLinus Torvalds 
3961da177e4SLinus Torvalds 	if (ipv6_addr_is_multicast(&fl.fl6_dst))
3971da177e4SLinus Torvalds 		hlimit = np->mcast_hops;
3981da177e4SLinus Torvalds 	else
3991da177e4SLinus Torvalds 		hlimit = np->hop_limit;
4001da177e4SLinus Torvalds 	if (hlimit < 0)
4011da177e4SLinus Torvalds 		hlimit = dst_metric(dst, RTAX_HOPLIMIT);
4021da177e4SLinus Torvalds 	if (hlimit < 0)
4031da177e4SLinus Torvalds 		hlimit = ipv6_get_hoplimit(dst->dev);
4041da177e4SLinus Torvalds 
405e012d51cSYOSHIFUJI Hideaki 	tclass = np->tclass;
40641a1f8eaSYOSHIFUJI Hideaki 	if (tclass < 0)
40741a1f8eaSYOSHIFUJI Hideaki 		tclass = 0;
40841a1f8eaSYOSHIFUJI Hideaki 
4091da177e4SLinus Torvalds 	msg.skb = skb;
4101da177e4SLinus Torvalds 	msg.offset = skb->nh.raw - skb->data;
411763ecff1SYasuyuki Kozakai 	msg.type = type;
4121da177e4SLinus Torvalds 
4131da177e4SLinus Torvalds 	len = skb->len - msg.offset;
4141da177e4SLinus Torvalds 	len = min_t(unsigned int, len, IPV6_MIN_MTU - sizeof(struct ipv6hdr) -sizeof(struct icmp6hdr));
4151da177e4SLinus Torvalds 	if (len < 0) {
41664ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmp: len problem\n");
4171da177e4SLinus Torvalds 		goto out_dst_release;
4181da177e4SLinus Torvalds 	}
4191da177e4SLinus Torvalds 
4201da177e4SLinus Torvalds 	idev = in6_dev_get(skb->dev);
4211da177e4SLinus Torvalds 
4221da177e4SLinus Torvalds 	err = ip6_append_data(sk, icmpv6_getfrag, &msg,
4231da177e4SLinus Torvalds 			      len + sizeof(struct icmp6hdr),
4241da177e4SLinus Torvalds 			      sizeof(struct icmp6hdr),
42541a1f8eaSYOSHIFUJI Hideaki 			      hlimit, tclass, NULL, &fl, (struct rt6_info*)dst,
4261da177e4SLinus Torvalds 			      MSG_DONTWAIT);
4271da177e4SLinus Torvalds 	if (err) {
4281da177e4SLinus Torvalds 		ip6_flush_pending_frames(sk);
4291da177e4SLinus Torvalds 		goto out_put;
4301da177e4SLinus Torvalds 	}
4311da177e4SLinus Torvalds 	err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, len + sizeof(struct icmp6hdr));
4321da177e4SLinus Torvalds 
4331da177e4SLinus Torvalds 	if (type >= ICMPV6_DEST_UNREACH && type <= ICMPV6_PARAMPROB)
4341da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_OUTDESTUNREACHS, type - ICMPV6_DEST_UNREACH);
4351da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTMSGS);
4361da177e4SLinus Torvalds 
4371da177e4SLinus Torvalds out_put:
4381da177e4SLinus Torvalds 	if (likely(idev != NULL))
4391da177e4SLinus Torvalds 		in6_dev_put(idev);
4401da177e4SLinus Torvalds out_dst_release:
4411da177e4SLinus Torvalds 	dst_release(dst);
4421da177e4SLinus Torvalds out:
4431da177e4SLinus Torvalds 	icmpv6_xmit_unlock();
4441da177e4SLinus Torvalds }
4451da177e4SLinus Torvalds 
4461da177e4SLinus Torvalds static void icmpv6_echo_reply(struct sk_buff *skb)
4471da177e4SLinus Torvalds {
44884427d53SYOSHIFUJI Hideaki 	struct sock *sk;
4491da177e4SLinus Torvalds 	struct inet6_dev *idev;
45084427d53SYOSHIFUJI Hideaki 	struct ipv6_pinfo *np;
4511da177e4SLinus Torvalds 	struct in6_addr *saddr = NULL;
4521da177e4SLinus Torvalds 	struct icmp6hdr *icmph = (struct icmp6hdr *) skb->h.raw;
4531da177e4SLinus Torvalds 	struct icmp6hdr tmp_hdr;
4541da177e4SLinus Torvalds 	struct flowi fl;
4551da177e4SLinus Torvalds 	struct icmpv6_msg msg;
4561da177e4SLinus Torvalds 	struct dst_entry *dst;
4571da177e4SLinus Torvalds 	int err = 0;
4581da177e4SLinus Torvalds 	int hlimit;
45941a1f8eaSYOSHIFUJI Hideaki 	int tclass;
4601da177e4SLinus Torvalds 
4611da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->daddr;
4621da177e4SLinus Torvalds 
4631da177e4SLinus Torvalds 	if (!ipv6_unicast_destination(skb))
4641da177e4SLinus Torvalds 		saddr = NULL;
4651da177e4SLinus Torvalds 
4661da177e4SLinus Torvalds 	memcpy(&tmp_hdr, icmph, sizeof(tmp_hdr));
4671da177e4SLinus Torvalds 	tmp_hdr.icmp6_type = ICMPV6_ECHO_REPLY;
4681da177e4SLinus Torvalds 
4691da177e4SLinus Torvalds 	memset(&fl, 0, sizeof(fl));
4701da177e4SLinus Torvalds 	fl.proto = IPPROTO_ICMPV6;
4711da177e4SLinus Torvalds 	ipv6_addr_copy(&fl.fl6_dst, &skb->nh.ipv6h->saddr);
4721da177e4SLinus Torvalds 	if (saddr)
4731da177e4SLinus Torvalds 		ipv6_addr_copy(&fl.fl6_src, saddr);
4741da177e4SLinus Torvalds 	fl.oif = skb->dev->ifindex;
4751da177e4SLinus Torvalds 	fl.fl_icmp_type = ICMPV6_ECHO_REPLY;
476beb8d13bSVenkat Yekkirala 	security_skb_classify_flow(skb, &fl);
4771da177e4SLinus Torvalds 
4781da177e4SLinus Torvalds 	if (icmpv6_xmit_lock())
4791da177e4SLinus Torvalds 		return;
4801da177e4SLinus Torvalds 
48184427d53SYOSHIFUJI Hideaki 	sk = icmpv6_socket->sk;
48284427d53SYOSHIFUJI Hideaki 	np = inet6_sk(sk);
48384427d53SYOSHIFUJI Hideaki 
4841da177e4SLinus Torvalds 	if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
4851da177e4SLinus Torvalds 		fl.oif = np->mcast_oif;
4861da177e4SLinus Torvalds 
4871da177e4SLinus Torvalds 	err = ip6_dst_lookup(sk, &dst, &fl);
4881da177e4SLinus Torvalds 	if (err)
4891da177e4SLinus Torvalds 		goto out;
4901da177e4SLinus Torvalds 	if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
491e104411bSPatrick McHardy 		goto out;
4921da177e4SLinus Torvalds 
4931da177e4SLinus Torvalds 	if (ipv6_addr_is_multicast(&fl.fl6_dst))
4941da177e4SLinus Torvalds 		hlimit = np->mcast_hops;
4951da177e4SLinus Torvalds 	else
4961da177e4SLinus Torvalds 		hlimit = np->hop_limit;
4971da177e4SLinus Torvalds 	if (hlimit < 0)
4981da177e4SLinus Torvalds 		hlimit = dst_metric(dst, RTAX_HOPLIMIT);
4991da177e4SLinus Torvalds 	if (hlimit < 0)
5001da177e4SLinus Torvalds 		hlimit = ipv6_get_hoplimit(dst->dev);
5011da177e4SLinus Torvalds 
502e012d51cSYOSHIFUJI Hideaki 	tclass = np->tclass;
50341a1f8eaSYOSHIFUJI Hideaki 	if (tclass < 0)
50441a1f8eaSYOSHIFUJI Hideaki 		tclass = 0;
50541a1f8eaSYOSHIFUJI Hideaki 
5061da177e4SLinus Torvalds 	idev = in6_dev_get(skb->dev);
5071da177e4SLinus Torvalds 
5081da177e4SLinus Torvalds 	msg.skb = skb;
5091da177e4SLinus Torvalds 	msg.offset = 0;
510763ecff1SYasuyuki Kozakai 	msg.type = ICMPV6_ECHO_REPLY;
5111da177e4SLinus Torvalds 
5121da177e4SLinus Torvalds 	err = ip6_append_data(sk, icmpv6_getfrag, &msg, skb->len + sizeof(struct icmp6hdr),
51341a1f8eaSYOSHIFUJI Hideaki 				sizeof(struct icmp6hdr), hlimit, tclass, NULL, &fl,
5141da177e4SLinus Torvalds 				(struct rt6_info*)dst, MSG_DONTWAIT);
5151da177e4SLinus Torvalds 
5161da177e4SLinus Torvalds 	if (err) {
5171da177e4SLinus Torvalds 		ip6_flush_pending_frames(sk);
5181da177e4SLinus Torvalds 		goto out_put;
5191da177e4SLinus Torvalds 	}
5201da177e4SLinus Torvalds 	err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, skb->len + sizeof(struct icmp6hdr));
5211da177e4SLinus Torvalds 
5221da177e4SLinus Torvalds         ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTECHOREPLIES);
5231da177e4SLinus Torvalds         ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTMSGS);
5241da177e4SLinus Torvalds 
5251da177e4SLinus Torvalds out_put:
5261da177e4SLinus Torvalds 	if (likely(idev != NULL))
5271da177e4SLinus Torvalds 		in6_dev_put(idev);
5281da177e4SLinus Torvalds 	dst_release(dst);
5291da177e4SLinus Torvalds out:
5301da177e4SLinus Torvalds 	icmpv6_xmit_unlock();
5311da177e4SLinus Torvalds }
5321da177e4SLinus Torvalds 
5331da177e4SLinus Torvalds static void icmpv6_notify(struct sk_buff *skb, int type, int code, u32 info)
5341da177e4SLinus Torvalds {
5351da177e4SLinus Torvalds 	struct in6_addr *saddr, *daddr;
5361da177e4SLinus Torvalds 	struct inet6_protocol *ipprot;
5371da177e4SLinus Torvalds 	struct sock *sk;
5381da177e4SLinus Torvalds 	int inner_offset;
5391da177e4SLinus Torvalds 	int hash;
5401da177e4SLinus Torvalds 	u8 nexthdr;
5411da177e4SLinus Torvalds 
5421da177e4SLinus Torvalds 	if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
5431da177e4SLinus Torvalds 		return;
5441da177e4SLinus Torvalds 
5451da177e4SLinus Torvalds 	nexthdr = ((struct ipv6hdr *)skb->data)->nexthdr;
5461da177e4SLinus Torvalds 	if (ipv6_ext_hdr(nexthdr)) {
5471da177e4SLinus Torvalds 		/* now skip over extension headers */
5480d3d077cSHerbert Xu 		inner_offset = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &nexthdr);
5491da177e4SLinus Torvalds 		if (inner_offset<0)
5501da177e4SLinus Torvalds 			return;
5511da177e4SLinus Torvalds 	} else {
5521da177e4SLinus Torvalds 		inner_offset = sizeof(struct ipv6hdr);
5531da177e4SLinus Torvalds 	}
5541da177e4SLinus Torvalds 
5551da177e4SLinus Torvalds 	/* Checkin header including 8 bytes of inner protocol header. */
5561da177e4SLinus Torvalds 	if (!pskb_may_pull(skb, inner_offset+8))
5571da177e4SLinus Torvalds 		return;
5581da177e4SLinus Torvalds 
5591da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->saddr;
5601da177e4SLinus Torvalds 	daddr = &skb->nh.ipv6h->daddr;
5611da177e4SLinus Torvalds 
5621da177e4SLinus Torvalds 	/* BUGGG_FUTURE: we should try to parse exthdrs in this packet.
5631da177e4SLinus Torvalds 	   Without this we will not able f.e. to make source routed
5641da177e4SLinus Torvalds 	   pmtu discovery.
5651da177e4SLinus Torvalds 	   Corresponding argument (opt) to notifiers is already added.
5661da177e4SLinus Torvalds 	   --ANK (980726)
5671da177e4SLinus Torvalds 	 */
5681da177e4SLinus Torvalds 
5691da177e4SLinus Torvalds 	hash = nexthdr & (MAX_INET_PROTOS - 1);
5701da177e4SLinus Torvalds 
5711da177e4SLinus Torvalds 	rcu_read_lock();
5721da177e4SLinus Torvalds 	ipprot = rcu_dereference(inet6_protos[hash]);
5731da177e4SLinus Torvalds 	if (ipprot && ipprot->err_handler)
5741da177e4SLinus Torvalds 		ipprot->err_handler(skb, NULL, type, code, inner_offset, info);
5751da177e4SLinus Torvalds 	rcu_read_unlock();
5761da177e4SLinus Torvalds 
5771da177e4SLinus Torvalds 	read_lock(&raw_v6_lock);
5781da177e4SLinus Torvalds 	if ((sk = sk_head(&raw_v6_htable[hash])) != NULL) {
5790bd1b59bSAndrew McDonald 		while((sk = __raw_v6_lookup(sk, nexthdr, daddr, saddr,
5802dac4b96SYOSHIFUJI Hideaki 					    IP6CB(skb)->iif))) {
5811da177e4SLinus Torvalds 			rawv6_err(sk, skb, NULL, type, code, inner_offset, info);
5821da177e4SLinus Torvalds 			sk = sk_next(sk);
5831da177e4SLinus Torvalds 		}
5841da177e4SLinus Torvalds 	}
5851da177e4SLinus Torvalds 	read_unlock(&raw_v6_lock);
5861da177e4SLinus Torvalds }
5871da177e4SLinus Torvalds 
5881da177e4SLinus Torvalds /*
5891da177e4SLinus Torvalds  *	Handle icmp messages
5901da177e4SLinus Torvalds  */
5911da177e4SLinus Torvalds 
592951dbc8aSPatrick McHardy static int icmpv6_rcv(struct sk_buff **pskb)
5931da177e4SLinus Torvalds {
5941da177e4SLinus Torvalds 	struct sk_buff *skb = *pskb;
5951da177e4SLinus Torvalds 	struct net_device *dev = skb->dev;
5961da177e4SLinus Torvalds 	struct inet6_dev *idev = __in6_dev_get(dev);
5971da177e4SLinus Torvalds 	struct in6_addr *saddr, *daddr;
5981da177e4SLinus Torvalds 	struct ipv6hdr *orig_hdr;
5991da177e4SLinus Torvalds 	struct icmp6hdr *hdr;
6001da177e4SLinus Torvalds 	int type;
6011da177e4SLinus Torvalds 
6021da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INMSGS);
6031da177e4SLinus Torvalds 
6041da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->saddr;
6051da177e4SLinus Torvalds 	daddr = &skb->nh.ipv6h->daddr;
6061da177e4SLinus Torvalds 
6071da177e4SLinus Torvalds 	/* Perform checksum. */
608fb286bb2SHerbert Xu 	switch (skb->ip_summed) {
60984fa7933SPatrick McHardy 	case CHECKSUM_COMPLETE:
610fb286bb2SHerbert Xu 		if (!csum_ipv6_magic(saddr, daddr, skb->len, IPPROTO_ICMPV6,
611fb286bb2SHerbert Xu 				     skb->csum))
612fb286bb2SHerbert Xu 			break;
613fb286bb2SHerbert Xu 		/* fall through */
614fb286bb2SHerbert Xu 	case CHECKSUM_NONE:
615fb286bb2SHerbert Xu 		skb->csum = ~csum_ipv6_magic(saddr, daddr, skb->len,
616fb286bb2SHerbert Xu 					     IPPROTO_ICMPV6, 0);
617fb286bb2SHerbert Xu 		if (__skb_checksum_complete(skb)) {
61846b86a2dSJoe Perches 			LIMIT_NETDEBUG(KERN_DEBUG "ICMPv6 checksum failed [" NIP6_FMT " > " NIP6_FMT "]\n",
61964ce2073SPatrick McHardy 				       NIP6(*saddr), NIP6(*daddr));
6201da177e4SLinus Torvalds 			goto discard_it;
6211da177e4SLinus Torvalds 		}
6221da177e4SLinus Torvalds 	}
6231da177e4SLinus Torvalds 
6241da177e4SLinus Torvalds 	if (!pskb_pull(skb, sizeof(struct icmp6hdr)))
6251da177e4SLinus Torvalds 		goto discard_it;
6261da177e4SLinus Torvalds 
6271da177e4SLinus Torvalds 	hdr = (struct icmp6hdr *) skb->h.raw;
6281da177e4SLinus Torvalds 
6291da177e4SLinus Torvalds 	type = hdr->icmp6_type;
6301da177e4SLinus Torvalds 
6311da177e4SLinus Torvalds 	if (type >= ICMPV6_DEST_UNREACH && type <= ICMPV6_PARAMPROB)
6321da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_INDESTUNREACHS, type - ICMPV6_DEST_UNREACH);
6331da177e4SLinus Torvalds 	else if (type >= ICMPV6_ECHO_REQUEST && type <= NDISC_REDIRECT)
6341da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_INECHOS, type - ICMPV6_ECHO_REQUEST);
6351da177e4SLinus Torvalds 
6361da177e4SLinus Torvalds 	switch (type) {
6371da177e4SLinus Torvalds 	case ICMPV6_ECHO_REQUEST:
6381da177e4SLinus Torvalds 		icmpv6_echo_reply(skb);
6391da177e4SLinus Torvalds 		break;
6401da177e4SLinus Torvalds 
6411da177e4SLinus Torvalds 	case ICMPV6_ECHO_REPLY:
6421da177e4SLinus Torvalds 		/* we couldn't care less */
6431da177e4SLinus Torvalds 		break;
6441da177e4SLinus Torvalds 
6451da177e4SLinus Torvalds 	case ICMPV6_PKT_TOOBIG:
6461da177e4SLinus Torvalds 		/* BUGGG_FUTURE: if packet contains rthdr, we cannot update
6471da177e4SLinus Torvalds 		   standard destination cache. Seems, only "advanced"
6481da177e4SLinus Torvalds 		   destination cache will allow to solve this problem
6491da177e4SLinus Torvalds 		   --ANK (980726)
6501da177e4SLinus Torvalds 		 */
6511da177e4SLinus Torvalds 		if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
6521da177e4SLinus Torvalds 			goto discard_it;
6531da177e4SLinus Torvalds 		hdr = (struct icmp6hdr *) skb->h.raw;
6541da177e4SLinus Torvalds 		orig_hdr = (struct ipv6hdr *) (hdr + 1);
6551da177e4SLinus Torvalds 		rt6_pmtu_discovery(&orig_hdr->daddr, &orig_hdr->saddr, dev,
6561da177e4SLinus Torvalds 				   ntohl(hdr->icmp6_mtu));
6571da177e4SLinus Torvalds 
6581da177e4SLinus Torvalds 		/*
6591da177e4SLinus Torvalds 		 *	Drop through to notify
6601da177e4SLinus Torvalds 		 */
6611da177e4SLinus Torvalds 
6621da177e4SLinus Torvalds 	case ICMPV6_DEST_UNREACH:
6631da177e4SLinus Torvalds 	case ICMPV6_TIME_EXCEED:
6641da177e4SLinus Torvalds 	case ICMPV6_PARAMPROB:
6651da177e4SLinus Torvalds 		icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
6661da177e4SLinus Torvalds 		break;
6671da177e4SLinus Torvalds 
6681da177e4SLinus Torvalds 	case NDISC_ROUTER_SOLICITATION:
6691da177e4SLinus Torvalds 	case NDISC_ROUTER_ADVERTISEMENT:
6701da177e4SLinus Torvalds 	case NDISC_NEIGHBOUR_SOLICITATION:
6711da177e4SLinus Torvalds 	case NDISC_NEIGHBOUR_ADVERTISEMENT:
6721da177e4SLinus Torvalds 	case NDISC_REDIRECT:
6731da177e4SLinus Torvalds 		ndisc_rcv(skb);
6741da177e4SLinus Torvalds 		break;
6751da177e4SLinus Torvalds 
6761da177e4SLinus Torvalds 	case ICMPV6_MGM_QUERY:
6771da177e4SLinus Torvalds 		igmp6_event_query(skb);
6781da177e4SLinus Torvalds 		break;
6791da177e4SLinus Torvalds 
6801da177e4SLinus Torvalds 	case ICMPV6_MGM_REPORT:
6811da177e4SLinus Torvalds 		igmp6_event_report(skb);
6821da177e4SLinus Torvalds 		break;
6831da177e4SLinus Torvalds 
6841da177e4SLinus Torvalds 	case ICMPV6_MGM_REDUCTION:
6851da177e4SLinus Torvalds 	case ICMPV6_NI_QUERY:
6861da177e4SLinus Torvalds 	case ICMPV6_NI_REPLY:
6871da177e4SLinus Torvalds 	case ICMPV6_MLD2_REPORT:
6881da177e4SLinus Torvalds 	case ICMPV6_DHAAD_REQUEST:
6891da177e4SLinus Torvalds 	case ICMPV6_DHAAD_REPLY:
6901da177e4SLinus Torvalds 	case ICMPV6_MOBILE_PREFIX_SOL:
6911da177e4SLinus Torvalds 	case ICMPV6_MOBILE_PREFIX_ADV:
6921da177e4SLinus Torvalds 		break;
6931da177e4SLinus Torvalds 
6941da177e4SLinus Torvalds 	default:
69564ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6: msg of unknown type\n");
6961da177e4SLinus Torvalds 
6971da177e4SLinus Torvalds 		/* informational */
6981da177e4SLinus Torvalds 		if (type & ICMPV6_INFOMSG_MASK)
6991da177e4SLinus Torvalds 			break;
7001da177e4SLinus Torvalds 
7011da177e4SLinus Torvalds 		/*
7021da177e4SLinus Torvalds 		 * error of unknown type.
7031da177e4SLinus Torvalds 		 * must pass to upper level
7041da177e4SLinus Torvalds 		 */
7051da177e4SLinus Torvalds 
7061da177e4SLinus Torvalds 		icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
7071da177e4SLinus Torvalds 	};
7081da177e4SLinus Torvalds 	kfree_skb(skb);
7091da177e4SLinus Torvalds 	return 0;
7101da177e4SLinus Torvalds 
7111da177e4SLinus Torvalds discard_it:
7121da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INERRORS);
7131da177e4SLinus Torvalds 	kfree_skb(skb);
7141da177e4SLinus Torvalds 	return 0;
7151da177e4SLinus Torvalds }
7161da177e4SLinus Torvalds 
717640c41c7SIngo Molnar /*
718640c41c7SIngo Molnar  * Special lock-class for __icmpv6_socket:
719640c41c7SIngo Molnar  */
720640c41c7SIngo Molnar static struct lock_class_key icmpv6_socket_sk_dst_lock_key;
721640c41c7SIngo Molnar 
7221da177e4SLinus Torvalds int __init icmpv6_init(struct net_proto_family *ops)
7231da177e4SLinus Torvalds {
7241da177e4SLinus Torvalds 	struct sock *sk;
7251da177e4SLinus Torvalds 	int err, i, j;
7261da177e4SLinus Torvalds 
7276f912042SKAMEZAWA Hiroyuki 	for_each_possible_cpu(i) {
7281da177e4SLinus Torvalds 		err = sock_create_kern(PF_INET6, SOCK_RAW, IPPROTO_ICMPV6,
7291da177e4SLinus Torvalds 				       &per_cpu(__icmpv6_socket, i));
7301da177e4SLinus Torvalds 		if (err < 0) {
7311da177e4SLinus Torvalds 			printk(KERN_ERR
7321da177e4SLinus Torvalds 			       "Failed to initialize the ICMP6 control socket "
7331da177e4SLinus Torvalds 			       "(err %d).\n",
7341da177e4SLinus Torvalds 			       err);
7351da177e4SLinus Torvalds 			goto fail;
7361da177e4SLinus Torvalds 		}
7371da177e4SLinus Torvalds 
7381da177e4SLinus Torvalds 		sk = per_cpu(__icmpv6_socket, i)->sk;
7391da177e4SLinus Torvalds 		sk->sk_allocation = GFP_ATOMIC;
740640c41c7SIngo Molnar 		/*
741640c41c7SIngo Molnar 		 * Split off their lock-class, because sk->sk_dst_lock
742640c41c7SIngo Molnar 		 * gets used from softirqs, which is safe for
743640c41c7SIngo Molnar 		 * __icmpv6_socket (because those never get directly used
744640c41c7SIngo Molnar 		 * via userspace syscalls), but unsafe for normal sockets.
745640c41c7SIngo Molnar 		 */
746640c41c7SIngo Molnar 		lockdep_set_class(&sk->sk_dst_lock,
747640c41c7SIngo Molnar 				  &icmpv6_socket_sk_dst_lock_key);
7481da177e4SLinus Torvalds 
7491da177e4SLinus Torvalds 		/* Enough space for 2 64K ICMP packets, including
7501da177e4SLinus Torvalds 		 * sk_buff struct overhead.
7511da177e4SLinus Torvalds 		 */
7521da177e4SLinus Torvalds 		sk->sk_sndbuf =
7531da177e4SLinus Torvalds 			(2 * ((64 * 1024) + sizeof(struct sk_buff)));
7541da177e4SLinus Torvalds 
7551da177e4SLinus Torvalds 		sk->sk_prot->unhash(sk);
7561da177e4SLinus Torvalds 	}
7571da177e4SLinus Torvalds 
7581da177e4SLinus Torvalds 
7591da177e4SLinus Torvalds 	if (inet6_add_protocol(&icmpv6_protocol, IPPROTO_ICMPV6) < 0) {
7601da177e4SLinus Torvalds 		printk(KERN_ERR "Failed to register ICMP6 protocol\n");
7611da177e4SLinus Torvalds 		err = -EAGAIN;
7621da177e4SLinus Torvalds 		goto fail;
7631da177e4SLinus Torvalds 	}
7641da177e4SLinus Torvalds 
7651da177e4SLinus Torvalds 	return 0;
7661da177e4SLinus Torvalds 
7671da177e4SLinus Torvalds  fail:
7681da177e4SLinus Torvalds 	for (j = 0; j < i; j++) {
7691da177e4SLinus Torvalds 		if (!cpu_possible(j))
7701da177e4SLinus Torvalds 			continue;
7711da177e4SLinus Torvalds 		sock_release(per_cpu(__icmpv6_socket, j));
7721da177e4SLinus Torvalds 	}
7731da177e4SLinus Torvalds 
7741da177e4SLinus Torvalds 	return err;
7751da177e4SLinus Torvalds }
7761da177e4SLinus Torvalds 
7771da177e4SLinus Torvalds void icmpv6_cleanup(void)
7781da177e4SLinus Torvalds {
7791da177e4SLinus Torvalds 	int i;
7801da177e4SLinus Torvalds 
7816f912042SKAMEZAWA Hiroyuki 	for_each_possible_cpu(i) {
7821da177e4SLinus Torvalds 		sock_release(per_cpu(__icmpv6_socket, i));
7831da177e4SLinus Torvalds 	}
7841da177e4SLinus Torvalds 	inet6_del_protocol(&icmpv6_protocol, IPPROTO_ICMPV6);
7851da177e4SLinus Torvalds }
7861da177e4SLinus Torvalds 
7879b5b5cffSArjan van de Ven static const struct icmp6_err {
7881da177e4SLinus Torvalds 	int err;
7891da177e4SLinus Torvalds 	int fatal;
7901da177e4SLinus Torvalds } tab_unreach[] = {
7911da177e4SLinus Torvalds 	{	/* NOROUTE */
7921da177e4SLinus Torvalds 		.err	= ENETUNREACH,
7931da177e4SLinus Torvalds 		.fatal	= 0,
7941da177e4SLinus Torvalds 	},
7951da177e4SLinus Torvalds 	{	/* ADM_PROHIBITED */
7961da177e4SLinus Torvalds 		.err	= EACCES,
7971da177e4SLinus Torvalds 		.fatal	= 1,
7981da177e4SLinus Torvalds 	},
7991da177e4SLinus Torvalds 	{	/* Was NOT_NEIGHBOUR, now reserved */
8001da177e4SLinus Torvalds 		.err	= EHOSTUNREACH,
8011da177e4SLinus Torvalds 		.fatal	= 0,
8021da177e4SLinus Torvalds 	},
8031da177e4SLinus Torvalds 	{	/* ADDR_UNREACH	*/
8041da177e4SLinus Torvalds 		.err	= EHOSTUNREACH,
8051da177e4SLinus Torvalds 		.fatal	= 0,
8061da177e4SLinus Torvalds 	},
8071da177e4SLinus Torvalds 	{	/* PORT_UNREACH	*/
8081da177e4SLinus Torvalds 		.err	= ECONNREFUSED,
8091da177e4SLinus Torvalds 		.fatal	= 1,
8101da177e4SLinus Torvalds 	},
8111da177e4SLinus Torvalds };
8121da177e4SLinus Torvalds 
8131da177e4SLinus Torvalds int icmpv6_err_convert(int type, int code, int *err)
8141da177e4SLinus Torvalds {
8151da177e4SLinus Torvalds 	int fatal = 0;
8161da177e4SLinus Torvalds 
8171da177e4SLinus Torvalds 	*err = EPROTO;
8181da177e4SLinus Torvalds 
8191da177e4SLinus Torvalds 	switch (type) {
8201da177e4SLinus Torvalds 	case ICMPV6_DEST_UNREACH:
8211da177e4SLinus Torvalds 		fatal = 1;
8221da177e4SLinus Torvalds 		if (code <= ICMPV6_PORT_UNREACH) {
8231da177e4SLinus Torvalds 			*err  = tab_unreach[code].err;
8241da177e4SLinus Torvalds 			fatal = tab_unreach[code].fatal;
8251da177e4SLinus Torvalds 		}
8261da177e4SLinus Torvalds 		break;
8271da177e4SLinus Torvalds 
8281da177e4SLinus Torvalds 	case ICMPV6_PKT_TOOBIG:
8291da177e4SLinus Torvalds 		*err = EMSGSIZE;
8301da177e4SLinus Torvalds 		break;
8311da177e4SLinus Torvalds 
8321da177e4SLinus Torvalds 	case ICMPV6_PARAMPROB:
8331da177e4SLinus Torvalds 		*err = EPROTO;
8341da177e4SLinus Torvalds 		fatal = 1;
8351da177e4SLinus Torvalds 		break;
8361da177e4SLinus Torvalds 
8371da177e4SLinus Torvalds 	case ICMPV6_TIME_EXCEED:
8381da177e4SLinus Torvalds 		*err = EHOSTUNREACH;
8391da177e4SLinus Torvalds 		break;
8401da177e4SLinus Torvalds 	};
8411da177e4SLinus Torvalds 
8421da177e4SLinus Torvalds 	return fatal;
8431da177e4SLinus Torvalds }
8441da177e4SLinus Torvalds 
#ifdef CONFIG_SYSCTL
/*
 * sysctl table for ICMPv6, built only when CONFIG_SYSCTL is set.
 * It exposes one entry, "ratelimit" (mode 0644), an int stored in
 * sysctl_icmpv6_time and accessed through proc_dointvec.  The final
 * entry with ctl_name 0 terminates the table.
 */
ctl_table ipv6_icmp_table[] = {
	{
		.ctl_name	= NET_IPV6_ICMP_RATELIMIT,
		.procname	= "ratelimit",
		.mode		= 0644,
		.data		= &sysctl_icmpv6_time,
		.maxlen		= sizeof(int),
		.proc_handler	= proc_dointvec,
	},
	{ .ctl_name = 0 },
};
#endif
8581da177e4SLinus Torvalds 
859