xref: /openbmc/linux/net/ipv6/icmp.c (revision a11d206d)
11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds  *	Internet Control Message Protocol (ICMPv6)
31da177e4SLinus Torvalds  *	Linux INET6 implementation
41da177e4SLinus Torvalds  *
51da177e4SLinus Torvalds  *	Authors:
61da177e4SLinus Torvalds  *	Pedro Roque		<roque@di.fc.ul.pt>
71da177e4SLinus Torvalds  *
81da177e4SLinus Torvalds  *	$Id: icmp.c,v 1.38 2002/02/08 03:57:19 davem Exp $
91da177e4SLinus Torvalds  *
101da177e4SLinus Torvalds  *	Based on net/ipv4/icmp.c
111da177e4SLinus Torvalds  *
121da177e4SLinus Torvalds  *	RFC 1885
131da177e4SLinus Torvalds  *
141da177e4SLinus Torvalds  *	This program is free software; you can redistribute it and/or
151da177e4SLinus Torvalds  *      modify it under the terms of the GNU General Public License
161da177e4SLinus Torvalds  *      as published by the Free Software Foundation; either version
171da177e4SLinus Torvalds  *      2 of the License, or (at your option) any later version.
181da177e4SLinus Torvalds  */
191da177e4SLinus Torvalds 
201da177e4SLinus Torvalds /*
211da177e4SLinus Torvalds  *	Changes:
221da177e4SLinus Torvalds  *
231da177e4SLinus Torvalds  *	Andi Kleen		:	exception handling
241da177e4SLinus Torvalds  *	Andi Kleen			add rate limits. never reply to an icmp.
251da177e4SLinus Torvalds  *					add more length checks and other fixes.
261da177e4SLinus Torvalds  *	yoshfuji		:	ensure to send parameter problem for
271da177e4SLinus Torvalds  *					fragments.
281da177e4SLinus Torvalds  *	YOSHIFUJI Hideaki @USAGI:	added sysctl for icmp rate limit.
291da177e4SLinus Torvalds  *	Randy Dunlap and
301da177e4SLinus Torvalds  *	YOSHIFUJI Hideaki @USAGI:	Per-interface statistics support
311da177e4SLinus Torvalds  *	Kazunori MIYAZAWA @USAGI:       change output process to use ip6_append_data
321da177e4SLinus Torvalds  */
331da177e4SLinus Torvalds 
341da177e4SLinus Torvalds #include <linux/module.h>
351da177e4SLinus Torvalds #include <linux/errno.h>
361da177e4SLinus Torvalds #include <linux/types.h>
371da177e4SLinus Torvalds #include <linux/socket.h>
381da177e4SLinus Torvalds #include <linux/in.h>
391da177e4SLinus Torvalds #include <linux/kernel.h>
401da177e4SLinus Torvalds #include <linux/sched.h>
411da177e4SLinus Torvalds #include <linux/sockios.h>
421da177e4SLinus Torvalds #include <linux/net.h>
431da177e4SLinus Torvalds #include <linux/skbuff.h>
441da177e4SLinus Torvalds #include <linux/init.h>
45763ecff1SYasuyuki Kozakai #include <linux/netfilter.h>
461da177e4SLinus Torvalds 
471da177e4SLinus Torvalds #ifdef CONFIG_SYSCTL
481da177e4SLinus Torvalds #include <linux/sysctl.h>
491da177e4SLinus Torvalds #endif
501da177e4SLinus Torvalds 
511da177e4SLinus Torvalds #include <linux/inet.h>
521da177e4SLinus Torvalds #include <linux/netdevice.h>
531da177e4SLinus Torvalds #include <linux/icmpv6.h>
541da177e4SLinus Torvalds 
551da177e4SLinus Torvalds #include <net/ip.h>
561da177e4SLinus Torvalds #include <net/sock.h>
571da177e4SLinus Torvalds 
581da177e4SLinus Torvalds #include <net/ipv6.h>
591da177e4SLinus Torvalds #include <net/ip6_checksum.h>
601da177e4SLinus Torvalds #include <net/protocol.h>
611da177e4SLinus Torvalds #include <net/raw.h>
621da177e4SLinus Torvalds #include <net/rawv6.h>
631da177e4SLinus Torvalds #include <net/transp_v6.h>
641da177e4SLinus Torvalds #include <net/ip6_route.h>
651da177e4SLinus Torvalds #include <net/addrconf.h>
661da177e4SLinus Torvalds #include <net/icmp.h>
671da177e4SLinus Torvalds 
681da177e4SLinus Torvalds #include <asm/uaccess.h>
691da177e4SLinus Torvalds #include <asm/system.h>
701da177e4SLinus Torvalds 
71ba89966cSEric Dumazet DEFINE_SNMP_STAT(struct icmpv6_mib, icmpv6_statistics) __read_mostly;
721da177e4SLinus Torvalds 
731da177e4SLinus Torvalds /*
741da177e4SLinus Torvalds  *	The ICMP socket(s). This is the most convenient way to flow control
751da177e4SLinus Torvalds  *	our ICMP output as well as maintain a clean interface throughout
761da177e4SLinus Torvalds  *	all layers. All Socketless IP sends will soon be gone.
771da177e4SLinus Torvalds  *
781da177e4SLinus Torvalds  *	On SMP we have one ICMP socket per-cpu.
791da177e4SLinus Torvalds  */
801da177e4SLinus Torvalds static DEFINE_PER_CPU(struct socket *, __icmpv6_socket) = NULL;
811da177e4SLinus Torvalds #define icmpv6_socket	__get_cpu_var(__icmpv6_socket)
821da177e4SLinus Torvalds 
83951dbc8aSPatrick McHardy static int icmpv6_rcv(struct sk_buff **pskb);
841da177e4SLinus Torvalds 
851da177e4SLinus Torvalds static struct inet6_protocol icmpv6_protocol = {
861da177e4SLinus Torvalds 	.handler	=	icmpv6_rcv,
871da177e4SLinus Torvalds 	.flags		=	INET6_PROTO_FINAL,
881da177e4SLinus Torvalds };
891da177e4SLinus Torvalds 
901da177e4SLinus Torvalds static __inline__ int icmpv6_xmit_lock(void)
911da177e4SLinus Torvalds {
921da177e4SLinus Torvalds 	local_bh_disable();
931da177e4SLinus Torvalds 
941da177e4SLinus Torvalds 	if (unlikely(!spin_trylock(&icmpv6_socket->sk->sk_lock.slock))) {
951da177e4SLinus Torvalds 		/* This can happen if the output path (f.e. SIT or
961da177e4SLinus Torvalds 		 * ip6ip6 tunnel) signals dst_link_failure() for an
971da177e4SLinus Torvalds 		 * outgoing ICMP6 packet.
981da177e4SLinus Torvalds 		 */
991da177e4SLinus Torvalds 		local_bh_enable();
1001da177e4SLinus Torvalds 		return 1;
1011da177e4SLinus Torvalds 	}
1021da177e4SLinus Torvalds 	return 0;
1031da177e4SLinus Torvalds }
1041da177e4SLinus Torvalds 
1051da177e4SLinus Torvalds static __inline__ void icmpv6_xmit_unlock(void)
1061da177e4SLinus Torvalds {
1071da177e4SLinus Torvalds 	spin_unlock_bh(&icmpv6_socket->sk->sk_lock.slock);
1081da177e4SLinus Torvalds }
1091da177e4SLinus Torvalds 
1101da177e4SLinus Torvalds /*
1111da177e4SLinus Torvalds  * Slightly more convenient version of icmpv6_send.
1121da177e4SLinus Torvalds  */
1131da177e4SLinus Torvalds void icmpv6_param_prob(struct sk_buff *skb, int code, int pos)
1141da177e4SLinus Torvalds {
1151da177e4SLinus Torvalds 	icmpv6_send(skb, ICMPV6_PARAMPROB, code, pos, skb->dev);
1161da177e4SLinus Torvalds 	kfree_skb(skb);
1171da177e4SLinus Torvalds }
1181da177e4SLinus Torvalds 
1191da177e4SLinus Torvalds /*
1201da177e4SLinus Torvalds  * Figure out, may we reply to this packet with icmp error.
1211da177e4SLinus Torvalds  *
1221da177e4SLinus Torvalds  * We do not reply, if:
1231da177e4SLinus Torvalds  *	- it was icmp error message.
1241da177e4SLinus Torvalds  *	- it is truncated, so that it is known, that protocol is ICMPV6
1251da177e4SLinus Torvalds  *	  (i.e. in the middle of some exthdr)
1261da177e4SLinus Torvalds  *
1271da177e4SLinus Torvalds  *	--ANK (980726)
1281da177e4SLinus Torvalds  */
1291da177e4SLinus Torvalds 
1301da177e4SLinus Torvalds static int is_ineligible(struct sk_buff *skb)
1311da177e4SLinus Torvalds {
1321da177e4SLinus Torvalds 	int ptr = (u8*)(skb->nh.ipv6h+1) - skb->data;
1331da177e4SLinus Torvalds 	int len = skb->len - ptr;
1341da177e4SLinus Torvalds 	__u8 nexthdr = skb->nh.ipv6h->nexthdr;
1351da177e4SLinus Torvalds 
1361da177e4SLinus Torvalds 	if (len < 0)
1371da177e4SLinus Torvalds 		return 1;
1381da177e4SLinus Torvalds 
1390d3d077cSHerbert Xu 	ptr = ipv6_skip_exthdr(skb, ptr, &nexthdr);
1401da177e4SLinus Torvalds 	if (ptr < 0)
1411da177e4SLinus Torvalds 		return 0;
1421da177e4SLinus Torvalds 	if (nexthdr == IPPROTO_ICMPV6) {
1431da177e4SLinus Torvalds 		u8 _type, *tp;
1441da177e4SLinus Torvalds 		tp = skb_header_pointer(skb,
1451da177e4SLinus Torvalds 			ptr+offsetof(struct icmp6hdr, icmp6_type),
1461da177e4SLinus Torvalds 			sizeof(_type), &_type);
1471da177e4SLinus Torvalds 		if (tp == NULL ||
1481da177e4SLinus Torvalds 		    !(*tp & ICMPV6_INFOMSG_MASK))
1491da177e4SLinus Torvalds 			return 1;
1501da177e4SLinus Torvalds 	}
1511da177e4SLinus Torvalds 	return 0;
1521da177e4SLinus Torvalds }
1531da177e4SLinus Torvalds 
154ab32ea5dSBrian Haley static int sysctl_icmpv6_time __read_mostly = 1*HZ;
1551da177e4SLinus Torvalds 
1561da177e4SLinus Torvalds /*
1571da177e4SLinus Torvalds  * Check the ICMP output rate limit
1581da177e4SLinus Torvalds  */
1591da177e4SLinus Torvalds static inline int icmpv6_xrlim_allow(struct sock *sk, int type,
1601da177e4SLinus Torvalds 				     struct flowi *fl)
1611da177e4SLinus Torvalds {
1621da177e4SLinus Torvalds 	struct dst_entry *dst;
1631da177e4SLinus Torvalds 	int res = 0;
1641da177e4SLinus Torvalds 
1651da177e4SLinus Torvalds 	/* Informational messages are not limited. */
1661da177e4SLinus Torvalds 	if (type & ICMPV6_INFOMSG_MASK)
1671da177e4SLinus Torvalds 		return 1;
1681da177e4SLinus Torvalds 
1691da177e4SLinus Torvalds 	/* Do not limit pmtu discovery, it would break it. */
1701da177e4SLinus Torvalds 	if (type == ICMPV6_PKT_TOOBIG)
1711da177e4SLinus Torvalds 		return 1;
1721da177e4SLinus Torvalds 
1731da177e4SLinus Torvalds 	/*
1741da177e4SLinus Torvalds 	 * Look up the output route.
1751da177e4SLinus Torvalds 	 * XXX: perhaps the expire for routing entries cloned by
1761da177e4SLinus Torvalds 	 * this lookup should be more aggressive (not longer than timeout).
1771da177e4SLinus Torvalds 	 */
1781da177e4SLinus Torvalds 	dst = ip6_route_output(sk, fl);
1791da177e4SLinus Torvalds 	if (dst->error) {
180a11d206dSYOSHIFUJI Hideaki 		IP6_INC_STATS(ip6_dst_idev(dst),
181a11d206dSYOSHIFUJI Hideaki 			      IPSTATS_MIB_OUTNOROUTES);
1821da177e4SLinus Torvalds 	} else if (dst->dev && (dst->dev->flags&IFF_LOOPBACK)) {
1831da177e4SLinus Torvalds 		res = 1;
1841da177e4SLinus Torvalds 	} else {
1851da177e4SLinus Torvalds 		struct rt6_info *rt = (struct rt6_info *)dst;
1861da177e4SLinus Torvalds 		int tmo = sysctl_icmpv6_time;
1871da177e4SLinus Torvalds 
1881da177e4SLinus Torvalds 		/* Give more bandwidth to wider prefixes. */
1891da177e4SLinus Torvalds 		if (rt->rt6i_dst.plen < 128)
1901da177e4SLinus Torvalds 			tmo >>= ((128 - rt->rt6i_dst.plen)>>5);
1911da177e4SLinus Torvalds 
1921da177e4SLinus Torvalds 		res = xrlim_allow(dst, tmo);
1931da177e4SLinus Torvalds 	}
1941da177e4SLinus Torvalds 	dst_release(dst);
1951da177e4SLinus Torvalds 	return res;
1961da177e4SLinus Torvalds }
1971da177e4SLinus Torvalds 
1981da177e4SLinus Torvalds /*
1991da177e4SLinus Torvalds  *	an inline helper for the "simple" if statement below
2001da177e4SLinus Torvalds  *	checks if parameter problem report is caused by an
2011da177e4SLinus Torvalds  *	unrecognized IPv6 option that has the Option Type
2021da177e4SLinus Torvalds  *	highest-order two bits set to 10
2031da177e4SLinus Torvalds  */
2041da177e4SLinus Torvalds 
2051da177e4SLinus Torvalds static __inline__ int opt_unrec(struct sk_buff *skb, __u32 offset)
2061da177e4SLinus Torvalds {
2071da177e4SLinus Torvalds 	u8 _optval, *op;
2081da177e4SLinus Torvalds 
2091da177e4SLinus Torvalds 	offset += skb->nh.raw - skb->data;
2101da177e4SLinus Torvalds 	op = skb_header_pointer(skb, offset, sizeof(_optval), &_optval);
2111da177e4SLinus Torvalds 	if (op == NULL)
2121da177e4SLinus Torvalds 		return 1;
2131da177e4SLinus Torvalds 	return (*op & 0xC0) == 0x80;
2141da177e4SLinus Torvalds }
2151da177e4SLinus Torvalds 
2161da177e4SLinus Torvalds static int icmpv6_push_pending_frames(struct sock *sk, struct flowi *fl, struct icmp6hdr *thdr, int len)
2171da177e4SLinus Torvalds {
2181da177e4SLinus Torvalds 	struct sk_buff *skb;
2191da177e4SLinus Torvalds 	struct icmp6hdr *icmp6h;
2201da177e4SLinus Torvalds 	int err = 0;
2211da177e4SLinus Torvalds 
2221da177e4SLinus Torvalds 	if ((skb = skb_peek(&sk->sk_write_queue)) == NULL)
2231da177e4SLinus Torvalds 		goto out;
2241da177e4SLinus Torvalds 
2251da177e4SLinus Torvalds 	icmp6h = (struct icmp6hdr*) skb->h.raw;
2261da177e4SLinus Torvalds 	memcpy(icmp6h, thdr, sizeof(struct icmp6hdr));
2271da177e4SLinus Torvalds 	icmp6h->icmp6_cksum = 0;
2281da177e4SLinus Torvalds 
2291da177e4SLinus Torvalds 	if (skb_queue_len(&sk->sk_write_queue) == 1) {
2301da177e4SLinus Torvalds 		skb->csum = csum_partial((char *)icmp6h,
2311da177e4SLinus Torvalds 					sizeof(struct icmp6hdr), skb->csum);
2321da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = csum_ipv6_magic(&fl->fl6_src,
2331da177e4SLinus Torvalds 						      &fl->fl6_dst,
2341da177e4SLinus Torvalds 						      len, fl->proto,
2351da177e4SLinus Torvalds 						      skb->csum);
2361da177e4SLinus Torvalds 	} else {
2371da177e4SLinus Torvalds 		u32 tmp_csum = 0;
2381da177e4SLinus Torvalds 
2391da177e4SLinus Torvalds 		skb_queue_walk(&sk->sk_write_queue, skb) {
2401da177e4SLinus Torvalds 			tmp_csum = csum_add(tmp_csum, skb->csum);
2411da177e4SLinus Torvalds 		}
2421da177e4SLinus Torvalds 
2431da177e4SLinus Torvalds 		tmp_csum = csum_partial((char *)icmp6h,
2441da177e4SLinus Torvalds 					sizeof(struct icmp6hdr), tmp_csum);
2451da177e4SLinus Torvalds 		tmp_csum = csum_ipv6_magic(&fl->fl6_src,
2461da177e4SLinus Torvalds 					   &fl->fl6_dst,
2471da177e4SLinus Torvalds 					   len, fl->proto, tmp_csum);
2481da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = tmp_csum;
2491da177e4SLinus Torvalds 	}
2501da177e4SLinus Torvalds 	if (icmp6h->icmp6_cksum == 0)
2511da177e4SLinus Torvalds 		icmp6h->icmp6_cksum = -1;
2521da177e4SLinus Torvalds 	ip6_push_pending_frames(sk);
2531da177e4SLinus Torvalds out:
2541da177e4SLinus Torvalds 	return err;
2551da177e4SLinus Torvalds }
2561da177e4SLinus Torvalds 
2571da177e4SLinus Torvalds struct icmpv6_msg {
2581da177e4SLinus Torvalds 	struct sk_buff	*skb;
2591da177e4SLinus Torvalds 	int		offset;
260763ecff1SYasuyuki Kozakai 	uint8_t		type;
2611da177e4SLinus Torvalds };
2621da177e4SLinus Torvalds 
2631da177e4SLinus Torvalds static int icmpv6_getfrag(void *from, char *to, int offset, int len, int odd, struct sk_buff *skb)
2641da177e4SLinus Torvalds {
2651da177e4SLinus Torvalds 	struct icmpv6_msg *msg = (struct icmpv6_msg *) from;
2661da177e4SLinus Torvalds 	struct sk_buff *org_skb = msg->skb;
2671da177e4SLinus Torvalds 	__u32 csum = 0;
2681da177e4SLinus Torvalds 
2691da177e4SLinus Torvalds 	csum = skb_copy_and_csum_bits(org_skb, msg->offset + offset,
2701da177e4SLinus Torvalds 				      to, len, csum);
2711da177e4SLinus Torvalds 	skb->csum = csum_block_add(skb->csum, csum, odd);
272763ecff1SYasuyuki Kozakai 	if (!(msg->type & ICMPV6_INFOMSG_MASK))
273763ecff1SYasuyuki Kozakai 		nf_ct_attach(skb, org_skb);
2741da177e4SLinus Torvalds 	return 0;
2751da177e4SLinus Torvalds }
2761da177e4SLinus Torvalds 
#ifdef CONFIG_IPV6_MIP6
/*
 *	If IP6CB(skb)->dsthao is set and an IPV6_TLV_HAO option is found
 *	there, exchange the IPv6 source address of skb with the address
 *	stored in that option.  The packet is modified in place.
 */
static void mip6_addr_swap(struct sk_buff *skb)
{
	struct inet6_skb_parm *cb = IP6CB(skb);
	struct ipv6hdr *ip6 = skb->nh.ipv6h;
	struct ipv6_destopt_hao *hao;
	struct in6_addr saved;
	int off;

	if (!cb->dsthao)
		return;

	off = ipv6_find_tlv(skb, cb->dsthao, IPV6_TLV_HAO);
	if (unlikely(off < 0))
		return;

	hao = (struct ipv6_destopt_hao *)(skb->nh.raw + off);

	ipv6_addr_copy(&saved, &ip6->saddr);
	ipv6_addr_copy(&ip6->saddr, &hao->addr);
	ipv6_addr_copy(&hao->addr, &saved);
}
#else
/* Without CONFIG_IPV6_MIP6 there is nothing to swap. */
static inline void mip6_addr_swap(struct sk_buff *skb) {}
#endif
29979383236SMasahide NAKAMURA 
3001da177e4SLinus Torvalds /*
3011da177e4SLinus Torvalds  *	Send an ICMP message in response to a packet in error
3021da177e4SLinus Torvalds  */
3031da177e4SLinus Torvalds void icmpv6_send(struct sk_buff *skb, int type, int code, __u32 info,
3041da177e4SLinus Torvalds 		 struct net_device *dev)
3051da177e4SLinus Torvalds {
3061da177e4SLinus Torvalds 	struct inet6_dev *idev = NULL;
3071da177e4SLinus Torvalds 	struct ipv6hdr *hdr = skb->nh.ipv6h;
30884427d53SYOSHIFUJI Hideaki 	struct sock *sk;
30984427d53SYOSHIFUJI Hideaki 	struct ipv6_pinfo *np;
3101da177e4SLinus Torvalds 	struct in6_addr *saddr = NULL;
3111da177e4SLinus Torvalds 	struct dst_entry *dst;
3121da177e4SLinus Torvalds 	struct icmp6hdr tmp_hdr;
3131da177e4SLinus Torvalds 	struct flowi fl;
3141da177e4SLinus Torvalds 	struct icmpv6_msg msg;
3151da177e4SLinus Torvalds 	int iif = 0;
3161da177e4SLinus Torvalds 	int addr_type = 0;
3171da177e4SLinus Torvalds 	int len;
31841a1f8eaSYOSHIFUJI Hideaki 	int hlimit, tclass;
3191da177e4SLinus Torvalds 	int err = 0;
3201da177e4SLinus Torvalds 
3211da177e4SLinus Torvalds 	if ((u8*)hdr < skb->head || (u8*)(hdr+1) > skb->tail)
3221da177e4SLinus Torvalds 		return;
3231da177e4SLinus Torvalds 
3241da177e4SLinus Torvalds 	/*
3251da177e4SLinus Torvalds 	 *	Make sure we respect the rules
3261da177e4SLinus Torvalds 	 *	i.e. RFC 1885 2.4(e)
3271da177e4SLinus Torvalds 	 *	Rule (e.1) is enforced by not using icmpv6_send
3281da177e4SLinus Torvalds 	 *	in any code that processes icmp errors.
3291da177e4SLinus Torvalds 	 */
3301da177e4SLinus Torvalds 	addr_type = ipv6_addr_type(&hdr->daddr);
3311da177e4SLinus Torvalds 
3321da177e4SLinus Torvalds 	if (ipv6_chk_addr(&hdr->daddr, skb->dev, 0))
3331da177e4SLinus Torvalds 		saddr = &hdr->daddr;
3341da177e4SLinus Torvalds 
3351da177e4SLinus Torvalds 	/*
3361da177e4SLinus Torvalds 	 *	Dest addr check
3371da177e4SLinus Torvalds 	 */
3381da177e4SLinus Torvalds 
3391da177e4SLinus Torvalds 	if ((addr_type & IPV6_ADDR_MULTICAST || skb->pkt_type != PACKET_HOST)) {
3401da177e4SLinus Torvalds 		if (type != ICMPV6_PKT_TOOBIG &&
3411da177e4SLinus Torvalds 		    !(type == ICMPV6_PARAMPROB &&
3421da177e4SLinus Torvalds 		      code == ICMPV6_UNK_OPTION &&
3431da177e4SLinus Torvalds 		      (opt_unrec(skb, info))))
3441da177e4SLinus Torvalds 			return;
3451da177e4SLinus Torvalds 
3461da177e4SLinus Torvalds 		saddr = NULL;
3471da177e4SLinus Torvalds 	}
3481da177e4SLinus Torvalds 
3491da177e4SLinus Torvalds 	addr_type = ipv6_addr_type(&hdr->saddr);
3501da177e4SLinus Torvalds 
3511da177e4SLinus Torvalds 	/*
3521da177e4SLinus Torvalds 	 *	Source addr check
3531da177e4SLinus Torvalds 	 */
3541da177e4SLinus Torvalds 
3551da177e4SLinus Torvalds 	if (addr_type & IPV6_ADDR_LINKLOCAL)
3561da177e4SLinus Torvalds 		iif = skb->dev->ifindex;
3571da177e4SLinus Torvalds 
3581da177e4SLinus Torvalds 	/*
3598de3351eSYOSHIFUJI Hideaki 	 *	Must not send error if the source does not uniquely
3608de3351eSYOSHIFUJI Hideaki 	 *	identify a single node (RFC2463 Section 2.4).
3618de3351eSYOSHIFUJI Hideaki 	 *	We check unspecified / multicast addresses here,
3628de3351eSYOSHIFUJI Hideaki 	 *	and anycast addresses will be checked later.
3631da177e4SLinus Torvalds 	 */
3641da177e4SLinus Torvalds 	if ((addr_type == IPV6_ADDR_ANY) || (addr_type & IPV6_ADDR_MULTICAST)) {
36564ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: addr_any/mcast source\n");
3661da177e4SLinus Torvalds 		return;
3671da177e4SLinus Torvalds 	}
3681da177e4SLinus Torvalds 
3691da177e4SLinus Torvalds 	/*
3701da177e4SLinus Torvalds 	 *	Never answer to a ICMP packet.
3711da177e4SLinus Torvalds 	 */
3721da177e4SLinus Torvalds 	if (is_ineligible(skb)) {
37364ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: no reply to icmp error\n");
3741da177e4SLinus Torvalds 		return;
3751da177e4SLinus Torvalds 	}
3761da177e4SLinus Torvalds 
37779383236SMasahide NAKAMURA 	mip6_addr_swap(skb);
37879383236SMasahide NAKAMURA 
3791da177e4SLinus Torvalds 	memset(&fl, 0, sizeof(fl));
3801da177e4SLinus Torvalds 	fl.proto = IPPROTO_ICMPV6;
3811da177e4SLinus Torvalds 	ipv6_addr_copy(&fl.fl6_dst, &hdr->saddr);
3821da177e4SLinus Torvalds 	if (saddr)
3831da177e4SLinus Torvalds 		ipv6_addr_copy(&fl.fl6_src, saddr);
3841da177e4SLinus Torvalds 	fl.oif = iif;
3851da177e4SLinus Torvalds 	fl.fl_icmp_type = type;
3861da177e4SLinus Torvalds 	fl.fl_icmp_code = code;
387beb8d13bSVenkat Yekkirala 	security_skb_classify_flow(skb, &fl);
3881da177e4SLinus Torvalds 
3891da177e4SLinus Torvalds 	if (icmpv6_xmit_lock())
3901da177e4SLinus Torvalds 		return;
3911da177e4SLinus Torvalds 
39284427d53SYOSHIFUJI Hideaki 	sk = icmpv6_socket->sk;
39384427d53SYOSHIFUJI Hideaki 	np = inet6_sk(sk);
39484427d53SYOSHIFUJI Hideaki 
3951da177e4SLinus Torvalds 	if (!icmpv6_xrlim_allow(sk, type, &fl))
3961da177e4SLinus Torvalds 		goto out;
3971da177e4SLinus Torvalds 
3981da177e4SLinus Torvalds 	tmp_hdr.icmp6_type = type;
3991da177e4SLinus Torvalds 	tmp_hdr.icmp6_code = code;
4001da177e4SLinus Torvalds 	tmp_hdr.icmp6_cksum = 0;
4011da177e4SLinus Torvalds 	tmp_hdr.icmp6_pointer = htonl(info);
4021da177e4SLinus Torvalds 
4031da177e4SLinus Torvalds 	if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
4041da177e4SLinus Torvalds 		fl.oif = np->mcast_oif;
4051da177e4SLinus Torvalds 
4061da177e4SLinus Torvalds 	err = ip6_dst_lookup(sk, &dst, &fl);
4071da177e4SLinus Torvalds 	if (err)
4081da177e4SLinus Torvalds 		goto out;
4098de3351eSYOSHIFUJI Hideaki 
4108de3351eSYOSHIFUJI Hideaki 	/*
4118de3351eSYOSHIFUJI Hideaki 	 * We won't send icmp if the destination is known
4128de3351eSYOSHIFUJI Hideaki 	 * anycast.
4138de3351eSYOSHIFUJI Hideaki 	 */
4148de3351eSYOSHIFUJI Hideaki 	if (((struct rt6_info *)dst)->rt6i_flags & RTF_ANYCAST) {
4158de3351eSYOSHIFUJI Hideaki 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6_send: acast source\n");
4168de3351eSYOSHIFUJI Hideaki 		goto out_dst_release;
4178de3351eSYOSHIFUJI Hideaki 	}
4188de3351eSYOSHIFUJI Hideaki 
4191da177e4SLinus Torvalds 	if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
420e104411bSPatrick McHardy 		goto out;
4211da177e4SLinus Torvalds 
4221da177e4SLinus Torvalds 	if (ipv6_addr_is_multicast(&fl.fl6_dst))
4231da177e4SLinus Torvalds 		hlimit = np->mcast_hops;
4241da177e4SLinus Torvalds 	else
4251da177e4SLinus Torvalds 		hlimit = np->hop_limit;
4261da177e4SLinus Torvalds 	if (hlimit < 0)
4271da177e4SLinus Torvalds 		hlimit = dst_metric(dst, RTAX_HOPLIMIT);
4281da177e4SLinus Torvalds 	if (hlimit < 0)
4291da177e4SLinus Torvalds 		hlimit = ipv6_get_hoplimit(dst->dev);
4301da177e4SLinus Torvalds 
431e012d51cSYOSHIFUJI Hideaki 	tclass = np->tclass;
43241a1f8eaSYOSHIFUJI Hideaki 	if (tclass < 0)
43341a1f8eaSYOSHIFUJI Hideaki 		tclass = 0;
43441a1f8eaSYOSHIFUJI Hideaki 
4351da177e4SLinus Torvalds 	msg.skb = skb;
4361da177e4SLinus Torvalds 	msg.offset = skb->nh.raw - skb->data;
437763ecff1SYasuyuki Kozakai 	msg.type = type;
4381da177e4SLinus Torvalds 
4391da177e4SLinus Torvalds 	len = skb->len - msg.offset;
4401da177e4SLinus Torvalds 	len = min_t(unsigned int, len, IPV6_MIN_MTU - sizeof(struct ipv6hdr) -sizeof(struct icmp6hdr));
4411da177e4SLinus Torvalds 	if (len < 0) {
44264ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmp: len problem\n");
4431da177e4SLinus Torvalds 		goto out_dst_release;
4441da177e4SLinus Torvalds 	}
4451da177e4SLinus Torvalds 
4461da177e4SLinus Torvalds 	idev = in6_dev_get(skb->dev);
4471da177e4SLinus Torvalds 
4481da177e4SLinus Torvalds 	err = ip6_append_data(sk, icmpv6_getfrag, &msg,
4491da177e4SLinus Torvalds 			      len + sizeof(struct icmp6hdr),
4501da177e4SLinus Torvalds 			      sizeof(struct icmp6hdr),
45141a1f8eaSYOSHIFUJI Hideaki 			      hlimit, tclass, NULL, &fl, (struct rt6_info*)dst,
4521da177e4SLinus Torvalds 			      MSG_DONTWAIT);
4531da177e4SLinus Torvalds 	if (err) {
4541da177e4SLinus Torvalds 		ip6_flush_pending_frames(sk);
4551da177e4SLinus Torvalds 		goto out_put;
4561da177e4SLinus Torvalds 	}
4571da177e4SLinus Torvalds 	err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, len + sizeof(struct icmp6hdr));
4581da177e4SLinus Torvalds 
4591da177e4SLinus Torvalds 	if (type >= ICMPV6_DEST_UNREACH && type <= ICMPV6_PARAMPROB)
4601da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_OUTDESTUNREACHS, type - ICMPV6_DEST_UNREACH);
4611da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTMSGS);
4621da177e4SLinus Torvalds 
4631da177e4SLinus Torvalds out_put:
4641da177e4SLinus Torvalds 	if (likely(idev != NULL))
4651da177e4SLinus Torvalds 		in6_dev_put(idev);
4661da177e4SLinus Torvalds out_dst_release:
4671da177e4SLinus Torvalds 	dst_release(dst);
4681da177e4SLinus Torvalds out:
4691da177e4SLinus Torvalds 	icmpv6_xmit_unlock();
4701da177e4SLinus Torvalds }
4711da177e4SLinus Torvalds 
4721da177e4SLinus Torvalds static void icmpv6_echo_reply(struct sk_buff *skb)
4731da177e4SLinus Torvalds {
47484427d53SYOSHIFUJI Hideaki 	struct sock *sk;
4751da177e4SLinus Torvalds 	struct inet6_dev *idev;
47684427d53SYOSHIFUJI Hideaki 	struct ipv6_pinfo *np;
4771da177e4SLinus Torvalds 	struct in6_addr *saddr = NULL;
4781da177e4SLinus Torvalds 	struct icmp6hdr *icmph = (struct icmp6hdr *) skb->h.raw;
4791da177e4SLinus Torvalds 	struct icmp6hdr tmp_hdr;
4801da177e4SLinus Torvalds 	struct flowi fl;
4811da177e4SLinus Torvalds 	struct icmpv6_msg msg;
4821da177e4SLinus Torvalds 	struct dst_entry *dst;
4831da177e4SLinus Torvalds 	int err = 0;
4841da177e4SLinus Torvalds 	int hlimit;
48541a1f8eaSYOSHIFUJI Hideaki 	int tclass;
4861da177e4SLinus Torvalds 
4871da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->daddr;
4881da177e4SLinus Torvalds 
4891da177e4SLinus Torvalds 	if (!ipv6_unicast_destination(skb))
4901da177e4SLinus Torvalds 		saddr = NULL;
4911da177e4SLinus Torvalds 
4921da177e4SLinus Torvalds 	memcpy(&tmp_hdr, icmph, sizeof(tmp_hdr));
4931da177e4SLinus Torvalds 	tmp_hdr.icmp6_type = ICMPV6_ECHO_REPLY;
4941da177e4SLinus Torvalds 
4951da177e4SLinus Torvalds 	memset(&fl, 0, sizeof(fl));
4961da177e4SLinus Torvalds 	fl.proto = IPPROTO_ICMPV6;
4971da177e4SLinus Torvalds 	ipv6_addr_copy(&fl.fl6_dst, &skb->nh.ipv6h->saddr);
4981da177e4SLinus Torvalds 	if (saddr)
4991da177e4SLinus Torvalds 		ipv6_addr_copy(&fl.fl6_src, saddr);
5001da177e4SLinus Torvalds 	fl.oif = skb->dev->ifindex;
5011da177e4SLinus Torvalds 	fl.fl_icmp_type = ICMPV6_ECHO_REPLY;
502beb8d13bSVenkat Yekkirala 	security_skb_classify_flow(skb, &fl);
5031da177e4SLinus Torvalds 
5041da177e4SLinus Torvalds 	if (icmpv6_xmit_lock())
5051da177e4SLinus Torvalds 		return;
5061da177e4SLinus Torvalds 
50784427d53SYOSHIFUJI Hideaki 	sk = icmpv6_socket->sk;
50884427d53SYOSHIFUJI Hideaki 	np = inet6_sk(sk);
50984427d53SYOSHIFUJI Hideaki 
5101da177e4SLinus Torvalds 	if (!fl.oif && ipv6_addr_is_multicast(&fl.fl6_dst))
5111da177e4SLinus Torvalds 		fl.oif = np->mcast_oif;
5121da177e4SLinus Torvalds 
5131da177e4SLinus Torvalds 	err = ip6_dst_lookup(sk, &dst, &fl);
5141da177e4SLinus Torvalds 	if (err)
5151da177e4SLinus Torvalds 		goto out;
5161da177e4SLinus Torvalds 	if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0)
517e104411bSPatrick McHardy 		goto out;
5181da177e4SLinus Torvalds 
5191da177e4SLinus Torvalds 	if (ipv6_addr_is_multicast(&fl.fl6_dst))
5201da177e4SLinus Torvalds 		hlimit = np->mcast_hops;
5211da177e4SLinus Torvalds 	else
5221da177e4SLinus Torvalds 		hlimit = np->hop_limit;
5231da177e4SLinus Torvalds 	if (hlimit < 0)
5241da177e4SLinus Torvalds 		hlimit = dst_metric(dst, RTAX_HOPLIMIT);
5251da177e4SLinus Torvalds 	if (hlimit < 0)
5261da177e4SLinus Torvalds 		hlimit = ipv6_get_hoplimit(dst->dev);
5271da177e4SLinus Torvalds 
528e012d51cSYOSHIFUJI Hideaki 	tclass = np->tclass;
52941a1f8eaSYOSHIFUJI Hideaki 	if (tclass < 0)
53041a1f8eaSYOSHIFUJI Hideaki 		tclass = 0;
53141a1f8eaSYOSHIFUJI Hideaki 
5321da177e4SLinus Torvalds 	idev = in6_dev_get(skb->dev);
5331da177e4SLinus Torvalds 
5341da177e4SLinus Torvalds 	msg.skb = skb;
5351da177e4SLinus Torvalds 	msg.offset = 0;
536763ecff1SYasuyuki Kozakai 	msg.type = ICMPV6_ECHO_REPLY;
5371da177e4SLinus Torvalds 
5381da177e4SLinus Torvalds 	err = ip6_append_data(sk, icmpv6_getfrag, &msg, skb->len + sizeof(struct icmp6hdr),
53941a1f8eaSYOSHIFUJI Hideaki 				sizeof(struct icmp6hdr), hlimit, tclass, NULL, &fl,
5401da177e4SLinus Torvalds 				(struct rt6_info*)dst, MSG_DONTWAIT);
5411da177e4SLinus Torvalds 
5421da177e4SLinus Torvalds 	if (err) {
5431da177e4SLinus Torvalds 		ip6_flush_pending_frames(sk);
5441da177e4SLinus Torvalds 		goto out_put;
5451da177e4SLinus Torvalds 	}
5461da177e4SLinus Torvalds 	err = icmpv6_push_pending_frames(sk, &fl, &tmp_hdr, skb->len + sizeof(struct icmp6hdr));
5471da177e4SLinus Torvalds 
5481da177e4SLinus Torvalds         ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTECHOREPLIES);
5491da177e4SLinus Torvalds         ICMP6_INC_STATS_BH(idev, ICMP6_MIB_OUTMSGS);
5501da177e4SLinus Torvalds 
5511da177e4SLinus Torvalds out_put:
5521da177e4SLinus Torvalds 	if (likely(idev != NULL))
5531da177e4SLinus Torvalds 		in6_dev_put(idev);
5541da177e4SLinus Torvalds 	dst_release(dst);
5551da177e4SLinus Torvalds out:
5561da177e4SLinus Torvalds 	icmpv6_xmit_unlock();
5571da177e4SLinus Torvalds }
5581da177e4SLinus Torvalds 
55904ce6909SAl Viro static void icmpv6_notify(struct sk_buff *skb, int type, int code, __be32 info)
5601da177e4SLinus Torvalds {
5611da177e4SLinus Torvalds 	struct in6_addr *saddr, *daddr;
5621da177e4SLinus Torvalds 	struct inet6_protocol *ipprot;
5631da177e4SLinus Torvalds 	struct sock *sk;
5641da177e4SLinus Torvalds 	int inner_offset;
5651da177e4SLinus Torvalds 	int hash;
5661da177e4SLinus Torvalds 	u8 nexthdr;
5671da177e4SLinus Torvalds 
5681da177e4SLinus Torvalds 	if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
5691da177e4SLinus Torvalds 		return;
5701da177e4SLinus Torvalds 
5711da177e4SLinus Torvalds 	nexthdr = ((struct ipv6hdr *)skb->data)->nexthdr;
5721da177e4SLinus Torvalds 	if (ipv6_ext_hdr(nexthdr)) {
5731da177e4SLinus Torvalds 		/* now skip over extension headers */
5740d3d077cSHerbert Xu 		inner_offset = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &nexthdr);
5751da177e4SLinus Torvalds 		if (inner_offset<0)
5761da177e4SLinus Torvalds 			return;
5771da177e4SLinus Torvalds 	} else {
5781da177e4SLinus Torvalds 		inner_offset = sizeof(struct ipv6hdr);
5791da177e4SLinus Torvalds 	}
5801da177e4SLinus Torvalds 
5811da177e4SLinus Torvalds 	/* Checkin header including 8 bytes of inner protocol header. */
5821da177e4SLinus Torvalds 	if (!pskb_may_pull(skb, inner_offset+8))
5831da177e4SLinus Torvalds 		return;
5841da177e4SLinus Torvalds 
5851da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->saddr;
5861da177e4SLinus Torvalds 	daddr = &skb->nh.ipv6h->daddr;
5871da177e4SLinus Torvalds 
5881da177e4SLinus Torvalds 	/* BUGGG_FUTURE: we should try to parse exthdrs in this packet.
5891da177e4SLinus Torvalds 	   Without this we will not able f.e. to make source routed
5901da177e4SLinus Torvalds 	   pmtu discovery.
5911da177e4SLinus Torvalds 	   Corresponding argument (opt) to notifiers is already added.
5921da177e4SLinus Torvalds 	   --ANK (980726)
5931da177e4SLinus Torvalds 	 */
5941da177e4SLinus Torvalds 
5951da177e4SLinus Torvalds 	hash = nexthdr & (MAX_INET_PROTOS - 1);
5961da177e4SLinus Torvalds 
5971da177e4SLinus Torvalds 	rcu_read_lock();
5981da177e4SLinus Torvalds 	ipprot = rcu_dereference(inet6_protos[hash]);
5991da177e4SLinus Torvalds 	if (ipprot && ipprot->err_handler)
6001da177e4SLinus Torvalds 		ipprot->err_handler(skb, NULL, type, code, inner_offset, info);
6011da177e4SLinus Torvalds 	rcu_read_unlock();
6021da177e4SLinus Torvalds 
6031da177e4SLinus Torvalds 	read_lock(&raw_v6_lock);
6041da177e4SLinus Torvalds 	if ((sk = sk_head(&raw_v6_htable[hash])) != NULL) {
6050bd1b59bSAndrew McDonald 		while((sk = __raw_v6_lookup(sk, nexthdr, daddr, saddr,
6062dac4b96SYOSHIFUJI Hideaki 					    IP6CB(skb)->iif))) {
6071da177e4SLinus Torvalds 			rawv6_err(sk, skb, NULL, type, code, inner_offset, info);
6081da177e4SLinus Torvalds 			sk = sk_next(sk);
6091da177e4SLinus Torvalds 		}
6101da177e4SLinus Torvalds 	}
6111da177e4SLinus Torvalds 	read_unlock(&raw_v6_lock);
6121da177e4SLinus Torvalds }
6131da177e4SLinus Torvalds 
6141da177e4SLinus Torvalds /*
6151da177e4SLinus Torvalds  *	Handle icmp messages
6161da177e4SLinus Torvalds  */
6171da177e4SLinus Torvalds 
618951dbc8aSPatrick McHardy static int icmpv6_rcv(struct sk_buff **pskb)
6191da177e4SLinus Torvalds {
6201da177e4SLinus Torvalds 	struct sk_buff *skb = *pskb;
6211da177e4SLinus Torvalds 	struct net_device *dev = skb->dev;
6221da177e4SLinus Torvalds 	struct inet6_dev *idev = __in6_dev_get(dev);
6231da177e4SLinus Torvalds 	struct in6_addr *saddr, *daddr;
6241da177e4SLinus Torvalds 	struct ipv6hdr *orig_hdr;
6251da177e4SLinus Torvalds 	struct icmp6hdr *hdr;
6261da177e4SLinus Torvalds 	int type;
6271da177e4SLinus Torvalds 
6281da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INMSGS);
6291da177e4SLinus Torvalds 
6301da177e4SLinus Torvalds 	saddr = &skb->nh.ipv6h->saddr;
6311da177e4SLinus Torvalds 	daddr = &skb->nh.ipv6h->daddr;
6321da177e4SLinus Torvalds 
6331da177e4SLinus Torvalds 	/* Perform checksum. */
634fb286bb2SHerbert Xu 	switch (skb->ip_summed) {
63584fa7933SPatrick McHardy 	case CHECKSUM_COMPLETE:
636fb286bb2SHerbert Xu 		if (!csum_ipv6_magic(saddr, daddr, skb->len, IPPROTO_ICMPV6,
637fb286bb2SHerbert Xu 				     skb->csum))
638fb286bb2SHerbert Xu 			break;
639fb286bb2SHerbert Xu 		/* fall through */
640fb286bb2SHerbert Xu 	case CHECKSUM_NONE:
641fb286bb2SHerbert Xu 		skb->csum = ~csum_ipv6_magic(saddr, daddr, skb->len,
642fb286bb2SHerbert Xu 					     IPPROTO_ICMPV6, 0);
643fb286bb2SHerbert Xu 		if (__skb_checksum_complete(skb)) {
64446b86a2dSJoe Perches 			LIMIT_NETDEBUG(KERN_DEBUG "ICMPv6 checksum failed [" NIP6_FMT " > " NIP6_FMT "]\n",
64564ce2073SPatrick McHardy 				       NIP6(*saddr), NIP6(*daddr));
6461da177e4SLinus Torvalds 			goto discard_it;
6471da177e4SLinus Torvalds 		}
6481da177e4SLinus Torvalds 	}
6491da177e4SLinus Torvalds 
6501da177e4SLinus Torvalds 	if (!pskb_pull(skb, sizeof(struct icmp6hdr)))
6511da177e4SLinus Torvalds 		goto discard_it;
6521da177e4SLinus Torvalds 
6531da177e4SLinus Torvalds 	hdr = (struct icmp6hdr *) skb->h.raw;
6541da177e4SLinus Torvalds 
6551da177e4SLinus Torvalds 	type = hdr->icmp6_type;
6561da177e4SLinus Torvalds 
6571da177e4SLinus Torvalds 	if (type >= ICMPV6_DEST_UNREACH && type <= ICMPV6_PARAMPROB)
6581da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_INDESTUNREACHS, type - ICMPV6_DEST_UNREACH);
6591da177e4SLinus Torvalds 	else if (type >= ICMPV6_ECHO_REQUEST && type <= NDISC_REDIRECT)
6601da177e4SLinus Torvalds 		ICMP6_INC_STATS_OFFSET_BH(idev, ICMP6_MIB_INECHOS, type - ICMPV6_ECHO_REQUEST);
6611da177e4SLinus Torvalds 
6621da177e4SLinus Torvalds 	switch (type) {
6631da177e4SLinus Torvalds 	case ICMPV6_ECHO_REQUEST:
6641da177e4SLinus Torvalds 		icmpv6_echo_reply(skb);
6651da177e4SLinus Torvalds 		break;
6661da177e4SLinus Torvalds 
6671da177e4SLinus Torvalds 	case ICMPV6_ECHO_REPLY:
6681da177e4SLinus Torvalds 		/* we couldn't care less */
6691da177e4SLinus Torvalds 		break;
6701da177e4SLinus Torvalds 
6711da177e4SLinus Torvalds 	case ICMPV6_PKT_TOOBIG:
6721da177e4SLinus Torvalds 		/* BUGGG_FUTURE: if packet contains rthdr, we cannot update
6731da177e4SLinus Torvalds 		   standard destination cache. Seems, only "advanced"
6741da177e4SLinus Torvalds 		   destination cache will allow to solve this problem
6751da177e4SLinus Torvalds 		   --ANK (980726)
6761da177e4SLinus Torvalds 		 */
6771da177e4SLinus Torvalds 		if (!pskb_may_pull(skb, sizeof(struct ipv6hdr)))
6781da177e4SLinus Torvalds 			goto discard_it;
6791da177e4SLinus Torvalds 		hdr = (struct icmp6hdr *) skb->h.raw;
6801da177e4SLinus Torvalds 		orig_hdr = (struct ipv6hdr *) (hdr + 1);
6811da177e4SLinus Torvalds 		rt6_pmtu_discovery(&orig_hdr->daddr, &orig_hdr->saddr, dev,
6821da177e4SLinus Torvalds 				   ntohl(hdr->icmp6_mtu));
6831da177e4SLinus Torvalds 
6841da177e4SLinus Torvalds 		/*
6851da177e4SLinus Torvalds 		 *	Drop through to notify
6861da177e4SLinus Torvalds 		 */
6871da177e4SLinus Torvalds 
6881da177e4SLinus Torvalds 	case ICMPV6_DEST_UNREACH:
6891da177e4SLinus Torvalds 	case ICMPV6_TIME_EXCEED:
6901da177e4SLinus Torvalds 	case ICMPV6_PARAMPROB:
6911da177e4SLinus Torvalds 		icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
6921da177e4SLinus Torvalds 		break;
6931da177e4SLinus Torvalds 
6941da177e4SLinus Torvalds 	case NDISC_ROUTER_SOLICITATION:
6951da177e4SLinus Torvalds 	case NDISC_ROUTER_ADVERTISEMENT:
6961da177e4SLinus Torvalds 	case NDISC_NEIGHBOUR_SOLICITATION:
6971da177e4SLinus Torvalds 	case NDISC_NEIGHBOUR_ADVERTISEMENT:
6981da177e4SLinus Torvalds 	case NDISC_REDIRECT:
6991da177e4SLinus Torvalds 		ndisc_rcv(skb);
7001da177e4SLinus Torvalds 		break;
7011da177e4SLinus Torvalds 
7021da177e4SLinus Torvalds 	case ICMPV6_MGM_QUERY:
7031da177e4SLinus Torvalds 		igmp6_event_query(skb);
7041da177e4SLinus Torvalds 		break;
7051da177e4SLinus Torvalds 
7061da177e4SLinus Torvalds 	case ICMPV6_MGM_REPORT:
7071da177e4SLinus Torvalds 		igmp6_event_report(skb);
7081da177e4SLinus Torvalds 		break;
7091da177e4SLinus Torvalds 
7101da177e4SLinus Torvalds 	case ICMPV6_MGM_REDUCTION:
7111da177e4SLinus Torvalds 	case ICMPV6_NI_QUERY:
7121da177e4SLinus Torvalds 	case ICMPV6_NI_REPLY:
7131da177e4SLinus Torvalds 	case ICMPV6_MLD2_REPORT:
7141da177e4SLinus Torvalds 	case ICMPV6_DHAAD_REQUEST:
7151da177e4SLinus Torvalds 	case ICMPV6_DHAAD_REPLY:
7161da177e4SLinus Torvalds 	case ICMPV6_MOBILE_PREFIX_SOL:
7171da177e4SLinus Torvalds 	case ICMPV6_MOBILE_PREFIX_ADV:
7181da177e4SLinus Torvalds 		break;
7191da177e4SLinus Torvalds 
7201da177e4SLinus Torvalds 	default:
72164ce2073SPatrick McHardy 		LIMIT_NETDEBUG(KERN_DEBUG "icmpv6: msg of unknown type\n");
7221da177e4SLinus Torvalds 
7231da177e4SLinus Torvalds 		/* informational */
7241da177e4SLinus Torvalds 		if (type & ICMPV6_INFOMSG_MASK)
7251da177e4SLinus Torvalds 			break;
7261da177e4SLinus Torvalds 
7271da177e4SLinus Torvalds 		/*
7281da177e4SLinus Torvalds 		 * error of unknown type.
7291da177e4SLinus Torvalds 		 * must pass to upper level
7301da177e4SLinus Torvalds 		 */
7311da177e4SLinus Torvalds 
7321da177e4SLinus Torvalds 		icmpv6_notify(skb, type, hdr->icmp6_code, hdr->icmp6_mtu);
7331da177e4SLinus Torvalds 	};
7341da177e4SLinus Torvalds 	kfree_skb(skb);
7351da177e4SLinus Torvalds 	return 0;
7361da177e4SLinus Torvalds 
7371da177e4SLinus Torvalds discard_it:
7381da177e4SLinus Torvalds 	ICMP6_INC_STATS_BH(idev, ICMP6_MIB_INERRORS);
7391da177e4SLinus Torvalds 	kfree_skb(skb);
7401da177e4SLinus Torvalds 	return 0;
7411da177e4SLinus Torvalds }
7421da177e4SLinus Torvalds 
743640c41c7SIngo Molnar /*
744640c41c7SIngo Molnar  * Special lock-class for __icmpv6_socket:
745640c41c7SIngo Molnar  */
746640c41c7SIngo Molnar static struct lock_class_key icmpv6_socket_sk_dst_lock_key;
747640c41c7SIngo Molnar 
7481da177e4SLinus Torvalds int __init icmpv6_init(struct net_proto_family *ops)
7491da177e4SLinus Torvalds {
7501da177e4SLinus Torvalds 	struct sock *sk;
7511da177e4SLinus Torvalds 	int err, i, j;
7521da177e4SLinus Torvalds 
7536f912042SKAMEZAWA Hiroyuki 	for_each_possible_cpu(i) {
7541da177e4SLinus Torvalds 		err = sock_create_kern(PF_INET6, SOCK_RAW, IPPROTO_ICMPV6,
7551da177e4SLinus Torvalds 				       &per_cpu(__icmpv6_socket, i));
7561da177e4SLinus Torvalds 		if (err < 0) {
7571da177e4SLinus Torvalds 			printk(KERN_ERR
7581da177e4SLinus Torvalds 			       "Failed to initialize the ICMP6 control socket "
7591da177e4SLinus Torvalds 			       "(err %d).\n",
7601da177e4SLinus Torvalds 			       err);
7611da177e4SLinus Torvalds 			goto fail;
7621da177e4SLinus Torvalds 		}
7631da177e4SLinus Torvalds 
7641da177e4SLinus Torvalds 		sk = per_cpu(__icmpv6_socket, i)->sk;
7651da177e4SLinus Torvalds 		sk->sk_allocation = GFP_ATOMIC;
766640c41c7SIngo Molnar 		/*
767640c41c7SIngo Molnar 		 * Split off their lock-class, because sk->sk_dst_lock
768640c41c7SIngo Molnar 		 * gets used from softirqs, which is safe for
769640c41c7SIngo Molnar 		 * __icmpv6_socket (because those never get directly used
770640c41c7SIngo Molnar 		 * via userspace syscalls), but unsafe for normal sockets.
771640c41c7SIngo Molnar 		 */
772640c41c7SIngo Molnar 		lockdep_set_class(&sk->sk_dst_lock,
773640c41c7SIngo Molnar 				  &icmpv6_socket_sk_dst_lock_key);
7741da177e4SLinus Torvalds 
7751da177e4SLinus Torvalds 		/* Enough space for 2 64K ICMP packets, including
7761da177e4SLinus Torvalds 		 * sk_buff struct overhead.
7771da177e4SLinus Torvalds 		 */
7781da177e4SLinus Torvalds 		sk->sk_sndbuf =
7791da177e4SLinus Torvalds 			(2 * ((64 * 1024) + sizeof(struct sk_buff)));
7801da177e4SLinus Torvalds 
7811da177e4SLinus Torvalds 		sk->sk_prot->unhash(sk);
7821da177e4SLinus Torvalds 	}
7831da177e4SLinus Torvalds 
7841da177e4SLinus Torvalds 
7851da177e4SLinus Torvalds 	if (inet6_add_protocol(&icmpv6_protocol, IPPROTO_ICMPV6) < 0) {
7861da177e4SLinus Torvalds 		printk(KERN_ERR "Failed to register ICMP6 protocol\n");
7871da177e4SLinus Torvalds 		err = -EAGAIN;
7881da177e4SLinus Torvalds 		goto fail;
7891da177e4SLinus Torvalds 	}
7901da177e4SLinus Torvalds 
7911da177e4SLinus Torvalds 	return 0;
7921da177e4SLinus Torvalds 
7931da177e4SLinus Torvalds  fail:
7941da177e4SLinus Torvalds 	for (j = 0; j < i; j++) {
7951da177e4SLinus Torvalds 		if (!cpu_possible(j))
7961da177e4SLinus Torvalds 			continue;
7971da177e4SLinus Torvalds 		sock_release(per_cpu(__icmpv6_socket, j));
7981da177e4SLinus Torvalds 	}
7991da177e4SLinus Torvalds 
8001da177e4SLinus Torvalds 	return err;
8011da177e4SLinus Torvalds }
8021da177e4SLinus Torvalds 
8031da177e4SLinus Torvalds void icmpv6_cleanup(void)
8041da177e4SLinus Torvalds {
8051da177e4SLinus Torvalds 	int i;
8061da177e4SLinus Torvalds 
8076f912042SKAMEZAWA Hiroyuki 	for_each_possible_cpu(i) {
8081da177e4SLinus Torvalds 		sock_release(per_cpu(__icmpv6_socket, i));
8091da177e4SLinus Torvalds 	}
8101da177e4SLinus Torvalds 	inet6_del_protocol(&icmpv6_protocol, IPPROTO_ICMPV6);
8111da177e4SLinus Torvalds }
8121da177e4SLinus Torvalds 
/*
 * Errno and fatality for each ICMPv6 Destination Unreachable code,
 * indexed by the code value (0 .. ICMPV6_PORT_UNREACH).
 */
static const struct icmp6_err {
	int err;
	int fatal;
} tab_unreach[] = {
	{	/* NOROUTE */
		.err	= ENETUNREACH,
		.fatal	= 0,
	},
	{	/* ADM_PROHIBITED */
		.err	= EACCES,
		.fatal	= 1,
	},
	{	/* Was NOT_NEIGHBOUR, now reserved */
		.err	= EHOSTUNREACH,
		.fatal	= 0,
	},
	{	/* ADDR_UNREACH	*/
		.err	= EHOSTUNREACH,
		.fatal	= 0,
	},
	{	/* PORT_UNREACH	*/
		.err	= ECONNREFUSED,
		.fatal	= 1,
	},
};

/*
 * icmpv6_err_convert - translate an ICMPv6 error into an errno value.
 * @type: ICMPv6 message type
 * @code: ICMPv6 message code
 * @err:  out parameter; receives the (positive) errno value
 *
 * Returns non-zero if the error is considered fatal, 0 otherwise.
 * Types not handled below yield EPROTO / non-fatal.  Destination
 * Unreachable codes outside the table yield EPROTO / fatal.
 */
int icmpv6_err_convert(int type, int code, int *err)
{
	int fatal = 0;

	*err = EPROTO;

	switch (type) {
	case ICMPV6_DEST_UNREACH:
		fatal = 1;
		/*
		 * code is a signed int: check the lower bound as well so a
		 * negative value can never index before tab_unreach[].
		 */
		if (code >= 0 && code <= ICMPV6_PORT_UNREACH) {
			*err  = tab_unreach[code].err;
			fatal = tab_unreach[code].fatal;
		}
		break;

	case ICMPV6_PKT_TOOBIG:
		*err = EMSGSIZE;
		break;

	case ICMPV6_PARAMPROB:
		*err = EPROTO;
		fatal = 1;
		break;

	case ICMPV6_TIME_EXCEED:
		*err = EHOSTUNREACH;
		break;

	default:
		/* unknown type: keep EPROTO, non-fatal */
		break;
	}

	return fatal;
}
8701da177e4SLinus Torvalds 
#ifdef CONFIG_SYSCTL
/*
 * sysctl table for ICMPv6: a single "ratelimit" entry backed by the
 * integer sysctl_icmpv6_time, read/written through proc_dointvec.
 */
ctl_table ipv6_icmp_table[] = {
	{
		.procname	= "ratelimit",
		.ctl_name	= NET_IPV6_ICMP_RATELIMIT,
		.mode		= 0644,
		.maxlen		= sizeof(int),
		.data		= &sysctl_icmpv6_time,
		.proc_handler	= proc_dointvec
	},
	/* zeroed final entry (presumably the table terminator) */
	{ .ctl_name = 0 },
};
#endif
8841da177e4SLinus Torvalds 
885