11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * Linux INET6 implementation 31da177e4SLinus Torvalds * FIB front-end. 41da177e4SLinus Torvalds * 51da177e4SLinus Torvalds * Authors: 61da177e4SLinus Torvalds * Pedro Roque <roque@di.fc.ul.pt> 71da177e4SLinus Torvalds * 81da177e4SLinus Torvalds * This program is free software; you can redistribute it and/or 91da177e4SLinus Torvalds * modify it under the terms of the GNU General Public License 101da177e4SLinus Torvalds * as published by the Free Software Foundation; either version 111da177e4SLinus Torvalds * 2 of the License, or (at your option) any later version. 121da177e4SLinus Torvalds */ 131da177e4SLinus Torvalds 141da177e4SLinus Torvalds /* Changes: 151da177e4SLinus Torvalds * 161da177e4SLinus Torvalds * YOSHIFUJI Hideaki @USAGI 171da177e4SLinus Torvalds * reworked default router selection. 181da177e4SLinus Torvalds * - respect outgoing interface 191da177e4SLinus Torvalds * - select from (probably) reachable routers (i.e. 201da177e4SLinus Torvalds * routers in REACHABLE, STALE, DELAY or PROBE states). 211da177e4SLinus Torvalds * - always select the same router if it is (probably) 221da177e4SLinus Torvalds * reachable. otherwise, round-robin the list. 23c0bece9fSYOSHIFUJI Hideaki * Ville Nuorvala 24c0bece9fSYOSHIFUJI Hideaki * Fixed routing subtrees. 251da177e4SLinus Torvalds */ 261da177e4SLinus Torvalds 27f3213831SJoe Perches #define pr_fmt(fmt) "IPv6: " fmt 28f3213831SJoe Perches 294fc268d2SRandy Dunlap #include <linux/capability.h> 301da177e4SLinus Torvalds #include <linux/errno.h> 31bc3b2d7fSPaul Gortmaker #include <linux/export.h> 321da177e4SLinus Torvalds #include <linux/types.h> 331da177e4SLinus Torvalds #include <linux/times.h> 341da177e4SLinus Torvalds #include <linux/socket.h> 351da177e4SLinus Torvalds #include <linux/sockios.h> 361da177e4SLinus Torvalds #include <linux/net.h> 371da177e4SLinus Torvalds #include <linux/route.h> 381da177e4SLinus Torvalds #include <linux/netdevice.h> 391da177e4SLinus Torvalds #include <linux/in6.h> 407bc570c8SYOSHIFUJI Hideaki #include <linux/mroute6.h> 411da177e4SLinus Torvalds #include <linux/init.h> 421da177e4SLinus Torvalds #include <linux/if_arp.h> 431da177e4SLinus Torvalds #include <linux/proc_fs.h> 441da177e4SLinus Torvalds #include <linux/seq_file.h> 455b7c931dSDaniel Lezcano #include <linux/nsproxy.h> 465a0e3ad6STejun Heo #include <linux/slab.h> 47457c4cbcSEric W. Biederman #include <net/net_namespace.h> 481da177e4SLinus Torvalds #include <net/snmp.h> 491da177e4SLinus Torvalds #include <net/ipv6.h> 501da177e4SLinus Torvalds #include <net/ip6_fib.h> 511da177e4SLinus Torvalds #include <net/ip6_route.h> 521da177e4SLinus Torvalds #include <net/ndisc.h> 531da177e4SLinus Torvalds #include <net/addrconf.h> 541da177e4SLinus Torvalds #include <net/tcp.h> 551da177e4SLinus Torvalds #include <linux/rtnetlink.h> 561da177e4SLinus Torvalds #include <net/dst.h> 57904af04dSJiri Benc #include <net/dst_metadata.h> 581da177e4SLinus Torvalds #include <net/xfrm.h> 598d71740cSTom Tucker #include <net/netevent.h> 6021713ebcSThomas Graf #include <net/netlink.h> 6151ebd318SNicolas Dichtel #include <net/nexthop.h> 6219e42e45SRoopa Prabhu #include <net/lwtunnel.h> 63904af04dSJiri Benc #include <net/ip_tunnels.h> 641da177e4SLinus Torvalds 651da177e4SLinus Torvalds #include <asm/uaccess.h> 661da177e4SLinus Torvalds 671da177e4SLinus Torvalds #ifdef CONFIG_SYSCTL 681da177e4SLinus Torvalds #include <linux/sysctl.h> 691da177e4SLinus Torvalds #endif 701da177e4SLinus Torvalds 71afc154e9SHannes Frederic Sowa enum rt6_nud_state { 727e980569SJiri Benc RT6_NUD_FAIL_HARD = -3, 737e980569SJiri Benc RT6_NUD_FAIL_PROBE = -2, 747e980569SJiri Benc RT6_NUD_FAIL_DO_RR = -1, 75afc154e9SHannes Frederic Sowa RT6_NUD_SUCCEED = 1 76afc154e9SHannes Frederic Sowa }; 77afc154e9SHannes Frederic Sowa 7883a09abdSMartin KaFai Lau static void ip6_rt_copy_init(struct rt6_info *rt, struct rt6_info *ort); 791da177e4SLinus Torvalds static struct dst_entry *ip6_dst_check(struct dst_entry *dst, u32 cookie); 800dbaee3bSDavid S. Miller static unsigned int ip6_default_advmss(const struct dst_entry *dst); 81ebb762f2SSteffen Klassert static unsigned int ip6_mtu(const struct dst_entry *dst); 821da177e4SLinus Torvalds static struct dst_entry *ip6_negative_advice(struct dst_entry *); 831da177e4SLinus Torvalds static void ip6_dst_destroy(struct dst_entry *); 841da177e4SLinus Torvalds static void ip6_dst_ifdown(struct dst_entry *, 851da177e4SLinus Torvalds struct net_device *dev, int how); 86569d3645SDaniel Lezcano static int ip6_dst_gc(struct dst_ops *ops); 871da177e4SLinus Torvalds 881da177e4SLinus Torvalds static int ip6_pkt_discard(struct sk_buff *skb); 89aad88724SEric Dumazet static int ip6_pkt_discard_out(struct sock *sk, struct sk_buff *skb); 907150aedeSKamala R static int ip6_pkt_prohibit(struct sk_buff *skb); 91aad88724SEric Dumazet static int ip6_pkt_prohibit_out(struct sock *sk, struct sk_buff *skb); 921da177e4SLinus Torvalds static void ip6_link_failure(struct sk_buff *skb); 936700c270SDavid S. Miller static void ip6_rt_update_pmtu(struct dst_entry *dst, struct sock *sk, 946700c270SDavid S. Miller struct sk_buff *skb, u32 mtu); 956700c270SDavid S. Miller static void rt6_do_redirect(struct dst_entry *dst, struct sock *sk, 966700c270SDavid S. Miller struct sk_buff *skb); 974b32b5adSMartin KaFai Lau static void rt6_dst_from_metrics_check(struct rt6_info *rt); 9852bd4c0cSNicolas Dichtel static int rt6_score_route(struct rt6_info *rt, int oif, int strict); 991da177e4SLinus Torvalds 10070ceb4f5SYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_ROUTE_INFO 101efa2cea0SDaniel Lezcano static struct rt6_info *rt6_add_route_info(struct net *net, 102b71d1d42SEric Dumazet const struct in6_addr *prefix, int prefixlen, 103b71d1d42SEric Dumazet const struct in6_addr *gwaddr, int ifindex, 10495c96174SEric Dumazet unsigned int pref); 105efa2cea0SDaniel Lezcano static struct rt6_info *rt6_get_route_info(struct net *net, 106b71d1d42SEric Dumazet const struct in6_addr *prefix, int prefixlen, 107b71d1d42SEric Dumazet const struct in6_addr *gwaddr, int ifindex); 10870ceb4f5SYOSHIFUJI Hideaki #endif 10970ceb4f5SYOSHIFUJI Hideaki 1108d0b94afSMartin KaFai Lau struct uncached_list { 1118d0b94afSMartin KaFai Lau spinlock_t lock; 1128d0b94afSMartin KaFai Lau struct list_head head; 1138d0b94afSMartin KaFai Lau }; 1148d0b94afSMartin KaFai Lau 1158d0b94afSMartin KaFai Lau static DEFINE_PER_CPU_ALIGNED(struct uncached_list, rt6_uncached_list); 1168d0b94afSMartin KaFai Lau 1178d0b94afSMartin KaFai Lau static void rt6_uncached_list_add(struct rt6_info *rt) 1188d0b94afSMartin KaFai Lau { 1198d0b94afSMartin KaFai Lau struct uncached_list *ul = raw_cpu_ptr(&rt6_uncached_list); 1208d0b94afSMartin KaFai Lau 1218d0b94afSMartin KaFai Lau rt->dst.flags |= DST_NOCACHE; 1228d0b94afSMartin KaFai Lau rt->rt6i_uncached_list = ul; 1238d0b94afSMartin KaFai Lau 1248d0b94afSMartin KaFai Lau spin_lock_bh(&ul->lock); 1258d0b94afSMartin KaFai Lau list_add_tail(&rt->rt6i_uncached, &ul->head); 1268d0b94afSMartin KaFai Lau spin_unlock_bh(&ul->lock); 1278d0b94afSMartin KaFai Lau } 1288d0b94afSMartin KaFai Lau 1298d0b94afSMartin KaFai Lau static void rt6_uncached_list_del(struct rt6_info *rt) 1308d0b94afSMartin KaFai Lau { 1318d0b94afSMartin KaFai Lau if (!list_empty(&rt->rt6i_uncached)) { 1328d0b94afSMartin KaFai Lau struct uncached_list *ul = rt->rt6i_uncached_list; 1338d0b94afSMartin KaFai Lau 1348d0b94afSMartin KaFai Lau spin_lock_bh(&ul->lock); 1358d0b94afSMartin KaFai Lau list_del(&rt->rt6i_uncached); 1368d0b94afSMartin KaFai Lau spin_unlock_bh(&ul->lock); 1378d0b94afSMartin KaFai Lau } 1388d0b94afSMartin KaFai Lau } 1398d0b94afSMartin KaFai Lau 1408d0b94afSMartin KaFai Lau static void rt6_uncached_list_flush_dev(struct net *net, struct net_device *dev) 1418d0b94afSMartin KaFai Lau { 1428d0b94afSMartin KaFai Lau struct net_device *loopback_dev = net->loopback_dev; 1438d0b94afSMartin KaFai Lau int cpu; 1448d0b94afSMartin KaFai Lau 1458d0b94afSMartin KaFai Lau for_each_possible_cpu(cpu) { 1468d0b94afSMartin KaFai Lau struct uncached_list *ul = per_cpu_ptr(&rt6_uncached_list, cpu); 1478d0b94afSMartin KaFai Lau struct rt6_info *rt; 1488d0b94afSMartin KaFai Lau 1498d0b94afSMartin KaFai Lau spin_lock_bh(&ul->lock); 1508d0b94afSMartin KaFai Lau list_for_each_entry(rt, &ul->head, rt6i_uncached) { 1518d0b94afSMartin KaFai Lau struct inet6_dev *rt_idev = rt->rt6i_idev; 1528d0b94afSMartin KaFai Lau struct net_device *rt_dev = rt->dst.dev; 1538d0b94afSMartin KaFai Lau 1548d0b94afSMartin KaFai Lau if (rt_idev && (rt_idev->dev == dev || !dev) && 1558d0b94afSMartin KaFai Lau rt_idev->dev != loopback_dev) { 1568d0b94afSMartin KaFai Lau rt->rt6i_idev = in6_dev_get(loopback_dev); 1578d0b94afSMartin KaFai Lau in6_dev_put(rt_idev); 1588d0b94afSMartin KaFai Lau } 1598d0b94afSMartin KaFai Lau 1608d0b94afSMartin KaFai Lau if (rt_dev && (rt_dev == dev || !dev) && 1618d0b94afSMartin KaFai Lau rt_dev != loopback_dev) { 1628d0b94afSMartin KaFai Lau rt->dst.dev = loopback_dev; 1638d0b94afSMartin KaFai Lau dev_hold(rt->dst.dev); 1648d0b94afSMartin KaFai Lau dev_put(rt_dev); 1658d0b94afSMartin KaFai Lau } 1668d0b94afSMartin KaFai Lau } 1678d0b94afSMartin KaFai Lau spin_unlock_bh(&ul->lock); 1688d0b94afSMartin KaFai Lau } 1698d0b94afSMartin KaFai Lau } 1708d0b94afSMartin KaFai Lau 171d52d3997SMartin KaFai Lau static u32 *rt6_pcpu_cow_metrics(struct rt6_info *rt) 172d52d3997SMartin KaFai Lau { 173d52d3997SMartin KaFai Lau return dst_metrics_write_ptr(rt->dst.from); 174d52d3997SMartin KaFai Lau } 175d52d3997SMartin KaFai Lau 17606582540SDavid S. Miller static u32 *ipv6_cow_metrics(struct dst_entry *dst, unsigned long old) 17706582540SDavid S. Miller { 17806582540SDavid S. Miller struct rt6_info *rt = (struct rt6_info *)dst; 17906582540SDavid S. Miller 180d52d3997SMartin KaFai Lau if (rt->rt6i_flags & RTF_PCPU) 181d52d3997SMartin KaFai Lau return rt6_pcpu_cow_metrics(rt); 182d52d3997SMartin KaFai Lau else if (rt->rt6i_flags & RTF_CACHE) 1834b32b5adSMartin KaFai Lau return NULL; 1844b32b5adSMartin KaFai Lau else 1853b471175SMartin KaFai Lau return dst_cow_metrics_generic(dst, old); 18606582540SDavid S. Miller } 18706582540SDavid S. Miller 188f894cbf8SDavid S. Miller static inline const void *choose_neigh_daddr(struct rt6_info *rt, 189f894cbf8SDavid S. Miller struct sk_buff *skb, 190f894cbf8SDavid S. Miller const void *daddr) 19139232973SDavid S. Miller { 19239232973SDavid S. Miller struct in6_addr *p = &rt->rt6i_gateway; 19339232973SDavid S. Miller 194a7563f34SDavid S. Miller if (!ipv6_addr_any(p)) 19539232973SDavid S. Miller return (const void *) p; 196f894cbf8SDavid S. Miller else if (skb) 197f894cbf8SDavid S. Miller return &ipv6_hdr(skb)->daddr; 19839232973SDavid S. Miller return daddr; 19939232973SDavid S. Miller } 20039232973SDavid S. Miller 201f894cbf8SDavid S. Miller static struct neighbour *ip6_neigh_lookup(const struct dst_entry *dst, 202f894cbf8SDavid S. Miller struct sk_buff *skb, 203f894cbf8SDavid S. Miller const void *daddr) 204d3aaeb38SDavid S. Miller { 20539232973SDavid S. Miller struct rt6_info *rt = (struct rt6_info *) dst; 20639232973SDavid S. Miller struct neighbour *n; 20739232973SDavid S. Miller 208f894cbf8SDavid S. Miller daddr = choose_neigh_daddr(rt, skb, daddr); 2098e022ee6SYOSHIFUJI Hideaki / 吉藤英明 n = __ipv6_neigh_lookup(dst->dev, daddr); 210f83c7790SDavid S. Miller if (n) 211f83c7790SDavid S. Miller return n; 212f83c7790SDavid S. Miller return neigh_create(&nd_tbl, daddr, dst->dev); 213f83c7790SDavid S. Miller } 214f83c7790SDavid S. Miller 2159a7ec3a9SDaniel Lezcano static struct dst_ops ip6_dst_ops_template = { 2161da177e4SLinus Torvalds .family = AF_INET6, 2171da177e4SLinus Torvalds .gc = ip6_dst_gc, 2181da177e4SLinus Torvalds .gc_thresh = 1024, 2191da177e4SLinus Torvalds .check = ip6_dst_check, 2200dbaee3bSDavid S. Miller .default_advmss = ip6_default_advmss, 221ebb762f2SSteffen Klassert .mtu = ip6_mtu, 22206582540SDavid S. Miller .cow_metrics = ipv6_cow_metrics, 2231da177e4SLinus Torvalds .destroy = ip6_dst_destroy, 2241da177e4SLinus Torvalds .ifdown = ip6_dst_ifdown, 2251da177e4SLinus Torvalds .negative_advice = ip6_negative_advice, 2261da177e4SLinus Torvalds .link_failure = ip6_link_failure, 2271da177e4SLinus Torvalds .update_pmtu = ip6_rt_update_pmtu, 2286e157b6aSDavid S. Miller .redirect = rt6_do_redirect, 2291ac06e03SHerbert Xu .local_out = __ip6_local_out, 230d3aaeb38SDavid S. Miller .neigh_lookup = ip6_neigh_lookup, 2311da177e4SLinus Torvalds }; 2321da177e4SLinus Torvalds 233ebb762f2SSteffen Klassert static unsigned int ip6_blackhole_mtu(const struct dst_entry *dst) 234ec831ea7SRoland Dreier { 235618f9bc7SSteffen Klassert unsigned int mtu = dst_metric_raw(dst, RTAX_MTU); 236618f9bc7SSteffen Klassert 237618f9bc7SSteffen Klassert return mtu ? : dst->dev->mtu; 238ec831ea7SRoland Dreier } 239ec831ea7SRoland Dreier 2406700c270SDavid S. Miller static void ip6_rt_blackhole_update_pmtu(struct dst_entry *dst, struct sock *sk, 2416700c270SDavid S. Miller struct sk_buff *skb, u32 mtu) 24214e50e57SDavid S. Miller { 24314e50e57SDavid S. Miller } 24414e50e57SDavid S. Miller 2456700c270SDavid S. Miller static void ip6_rt_blackhole_redirect(struct dst_entry *dst, struct sock *sk, 2466700c270SDavid S. Miller struct sk_buff *skb) 247b587ee3bSDavid S. Miller { 248b587ee3bSDavid S. Miller } 249b587ee3bSDavid S. Miller 2500972ddb2SHeld Bernhard static u32 *ip6_rt_blackhole_cow_metrics(struct dst_entry *dst, 2510972ddb2SHeld Bernhard unsigned long old) 2520972ddb2SHeld Bernhard { 2530972ddb2SHeld Bernhard return NULL; 2540972ddb2SHeld Bernhard } 2550972ddb2SHeld Bernhard 25614e50e57SDavid S. Miller static struct dst_ops ip6_dst_blackhole_ops = { 25714e50e57SDavid S. Miller .family = AF_INET6, 25814e50e57SDavid S. Miller .destroy = ip6_dst_destroy, 25914e50e57SDavid S. Miller .check = ip6_dst_check, 260ebb762f2SSteffen Klassert .mtu = ip6_blackhole_mtu, 261214f45c9SEric Dumazet .default_advmss = ip6_default_advmss, 26214e50e57SDavid S. Miller .update_pmtu = ip6_rt_blackhole_update_pmtu, 263b587ee3bSDavid S. Miller .redirect = ip6_rt_blackhole_redirect, 2640972ddb2SHeld Bernhard .cow_metrics = ip6_rt_blackhole_cow_metrics, 265d3aaeb38SDavid S. Miller .neigh_lookup = ip6_neigh_lookup, 26614e50e57SDavid S. Miller }; 26714e50e57SDavid S. Miller 26862fa8a84SDavid S. Miller static const u32 ip6_template_metrics[RTAX_MAX] = { 26914edd87dSLi RongQing [RTAX_HOPLIMIT - 1] = 0, 27062fa8a84SDavid S. Miller }; 27162fa8a84SDavid S. Miller 272fb0af4c7SEric Dumazet static const struct rt6_info ip6_null_entry_template = { 2731da177e4SLinus Torvalds .dst = { 2741da177e4SLinus Torvalds .__refcnt = ATOMIC_INIT(1), 2751da177e4SLinus Torvalds .__use = 1, 2762c20cbd7SNicolas Dichtel .obsolete = DST_OBSOLETE_FORCE_CHK, 2771da177e4SLinus Torvalds .error = -ENETUNREACH, 2781da177e4SLinus Torvalds .input = ip6_pkt_discard, 2791da177e4SLinus Torvalds .output = ip6_pkt_discard_out, 2801da177e4SLinus Torvalds }, 2811da177e4SLinus Torvalds .rt6i_flags = (RTF_REJECT | RTF_NONEXTHOP), 2824f724279SJean-Mickael Guerin .rt6i_protocol = RTPROT_KERNEL, 2831da177e4SLinus Torvalds .rt6i_metric = ~(u32) 0, 2841da177e4SLinus Torvalds .rt6i_ref = ATOMIC_INIT(1), 2851da177e4SLinus Torvalds }; 2861da177e4SLinus Torvalds 287101367c2SThomas Graf #ifdef CONFIG_IPV6_MULTIPLE_TABLES 288101367c2SThomas Graf 289fb0af4c7SEric Dumazet static const struct rt6_info ip6_prohibit_entry_template = { 290101367c2SThomas Graf .dst = { 291101367c2SThomas Graf .__refcnt = ATOMIC_INIT(1), 292101367c2SThomas Graf .__use = 1, 2932c20cbd7SNicolas Dichtel .obsolete = DST_OBSOLETE_FORCE_CHK, 294101367c2SThomas Graf .error = -EACCES, 2959ce8ade0SThomas Graf .input = ip6_pkt_prohibit, 2969ce8ade0SThomas Graf .output = ip6_pkt_prohibit_out, 297101367c2SThomas Graf }, 298101367c2SThomas Graf .rt6i_flags = (RTF_REJECT | RTF_NONEXTHOP), 2994f724279SJean-Mickael Guerin .rt6i_protocol = RTPROT_KERNEL, 300101367c2SThomas Graf .rt6i_metric = ~(u32) 0, 301101367c2SThomas Graf .rt6i_ref = ATOMIC_INIT(1), 302101367c2SThomas Graf }; 303101367c2SThomas Graf 304fb0af4c7SEric Dumazet static const struct rt6_info ip6_blk_hole_entry_template = { 305101367c2SThomas Graf .dst = { 306101367c2SThomas Graf .__refcnt = ATOMIC_INIT(1), 307101367c2SThomas Graf .__use = 1, 3082c20cbd7SNicolas Dichtel .obsolete = DST_OBSOLETE_FORCE_CHK, 309101367c2SThomas Graf .error = -EINVAL, 310352e512cSHerbert Xu .input = dst_discard, 311aad88724SEric Dumazet .output = dst_discard_sk, 312101367c2SThomas Graf }, 313101367c2SThomas Graf .rt6i_flags = (RTF_REJECT | RTF_NONEXTHOP), 3144f724279SJean-Mickael Guerin .rt6i_protocol = RTPROT_KERNEL, 315101367c2SThomas Graf .rt6i_metric = ~(u32) 0, 316101367c2SThomas Graf .rt6i_ref = ATOMIC_INIT(1), 317101367c2SThomas Graf }; 318101367c2SThomas Graf 319101367c2SThomas Graf #endif 320101367c2SThomas Graf 3211da177e4SLinus Torvalds /* allocate dst with ip6_dst_ops */ 322d52d3997SMartin KaFai Lau static struct rt6_info *__ip6_dst_alloc(struct net *net, 323957c665fSDavid S. Miller struct net_device *dev, 324ad706862SMartin KaFai Lau int flags) 3251da177e4SLinus Torvalds { 32697bab73fSDavid S. Miller struct rt6_info *rt = dst_alloc(&net->ipv6.ip6_dst_ops, dev, 3276f3118b5SNicolas Dichtel 0, DST_OBSOLETE_FORCE_CHK, flags); 328cf911662SDavid S. Miller 32997bab73fSDavid S. Miller if (rt) { 3308104891bSSteffen Klassert struct dst_entry *dst = &rt->dst; 3318104891bSSteffen Klassert 3328104891bSSteffen Klassert memset(dst + 1, 0, sizeof(*rt) - sizeof(*dst)); 33351ebd318SNicolas Dichtel INIT_LIST_HEAD(&rt->rt6i_siblings); 3348d0b94afSMartin KaFai Lau INIT_LIST_HEAD(&rt->rt6i_uncached); 33597bab73fSDavid S. Miller } 336cf911662SDavid S. Miller return rt; 3371da177e4SLinus Torvalds } 3381da177e4SLinus Torvalds 339d52d3997SMartin KaFai Lau static struct rt6_info *ip6_dst_alloc(struct net *net, 340d52d3997SMartin KaFai Lau struct net_device *dev, 341ad706862SMartin KaFai Lau int flags) 342d52d3997SMartin KaFai Lau { 343ad706862SMartin KaFai Lau struct rt6_info *rt = __ip6_dst_alloc(net, dev, flags); 344d52d3997SMartin KaFai Lau 345d52d3997SMartin KaFai Lau if (rt) { 346d52d3997SMartin KaFai Lau rt->rt6i_pcpu = alloc_percpu_gfp(struct rt6_info *, GFP_ATOMIC); 347d52d3997SMartin KaFai Lau if (rt->rt6i_pcpu) { 348d52d3997SMartin KaFai Lau int cpu; 349d52d3997SMartin KaFai Lau 350d52d3997SMartin KaFai Lau for_each_possible_cpu(cpu) { 351d52d3997SMartin KaFai Lau struct rt6_info **p; 352d52d3997SMartin KaFai Lau 353d52d3997SMartin KaFai Lau p = per_cpu_ptr(rt->rt6i_pcpu, cpu); 354d52d3997SMartin KaFai Lau /* no one shares rt */ 355d52d3997SMartin KaFai Lau *p = NULL; 356d52d3997SMartin KaFai Lau } 357d52d3997SMartin KaFai Lau } else { 358d52d3997SMartin KaFai Lau dst_destroy((struct dst_entry *)rt); 359d52d3997SMartin KaFai Lau return NULL; 360d52d3997SMartin KaFai Lau } 361d52d3997SMartin KaFai Lau } 362d52d3997SMartin KaFai Lau 363d52d3997SMartin KaFai Lau return rt; 364d52d3997SMartin KaFai Lau } 365d52d3997SMartin KaFai Lau 3661da177e4SLinus Torvalds static void ip6_dst_destroy(struct dst_entry *dst) 3671da177e4SLinus Torvalds { 3681da177e4SLinus Torvalds struct rt6_info *rt = (struct rt6_info *)dst; 369ecd98837SYOSHIFUJI Hideaki / 吉藤英明 struct dst_entry *from = dst->from; 3708d0b94afSMartin KaFai Lau struct inet6_dev *idev; 3711da177e4SLinus Torvalds 3728e2ec639SYan, Zheng dst_destroy_metrics_generic(dst); 373d52d3997SMartin KaFai Lau free_percpu(rt->rt6i_pcpu); 3748d0b94afSMartin KaFai Lau rt6_uncached_list_del(rt); 3758d0b94afSMartin KaFai Lau 3768d0b94afSMartin KaFai Lau idev = rt->rt6i_idev; 37738308473SDavid S. Miller if (idev) { 3781da177e4SLinus Torvalds rt->rt6i_idev = NULL; 3791da177e4SLinus Torvalds in6_dev_put(idev); 3801da177e4SLinus Torvalds } 3811716a961SGao feng 382ecd98837SYOSHIFUJI Hideaki / 吉藤英明 dst->from = NULL; 383ecd98837SYOSHIFUJI Hideaki / 吉藤英明 dst_release(from); 384b3419363SDavid S. Miller } 385b3419363SDavid S. Miller 3861da177e4SLinus Torvalds static void ip6_dst_ifdown(struct dst_entry *dst, struct net_device *dev, 3871da177e4SLinus Torvalds int how) 3881da177e4SLinus Torvalds { 3891da177e4SLinus Torvalds struct rt6_info *rt = (struct rt6_info *)dst; 3901da177e4SLinus Torvalds struct inet6_dev *idev = rt->rt6i_idev; 3915a3e55d6SDenis V. Lunev struct net_device *loopback_dev = 392c346dca1SYOSHIFUJI Hideaki dev_net(dev)->loopback_dev; 3931da177e4SLinus Torvalds 39497cac082SDavid S. Miller if (dev != loopback_dev) { 39597cac082SDavid S. Miller if (idev && idev->dev == dev) { 3965a3e55d6SDenis V. Lunev struct inet6_dev *loopback_idev = 3975a3e55d6SDenis V. Lunev in6_dev_get(loopback_dev); 39838308473SDavid S. Miller if (loopback_idev) { 3991da177e4SLinus Torvalds rt->rt6i_idev = loopback_idev; 4001da177e4SLinus Torvalds in6_dev_put(idev); 4011da177e4SLinus Torvalds } 4021da177e4SLinus Torvalds } 40397cac082SDavid S. Miller } 4041da177e4SLinus Torvalds } 4051da177e4SLinus Torvalds 406a50feda5SEric Dumazet static bool rt6_check_expired(const struct rt6_info *rt) 4071da177e4SLinus Torvalds { 4081716a961SGao feng if (rt->rt6i_flags & RTF_EXPIRES) { 4091716a961SGao feng if (time_after(jiffies, rt->dst.expires)) 410a50feda5SEric Dumazet return true; 4111716a961SGao feng } else if (rt->dst.from) { 4123fd91fb3SLi RongQing return rt6_check_expired((struct rt6_info *) rt->dst.from); 4131716a961SGao feng } 414a50feda5SEric Dumazet return false; 4151da177e4SLinus Torvalds } 4161da177e4SLinus Torvalds 41751ebd318SNicolas Dichtel /* Multipath route selection: 41851ebd318SNicolas Dichtel * Hash based function using packet header and flowlabel. 41951ebd318SNicolas Dichtel * Adapted from fib_info_hashfn() 42051ebd318SNicolas Dichtel */ 42151ebd318SNicolas Dichtel static int rt6_info_hash_nhsfn(unsigned int candidate_count, 42251ebd318SNicolas Dichtel const struct flowi6 *fl6) 42351ebd318SNicolas Dichtel { 42451ebd318SNicolas Dichtel unsigned int val = fl6->flowi6_proto; 42551ebd318SNicolas Dichtel 426c08977bbSYOSHIFUJI Hideaki / 吉藤英明 val ^= ipv6_addr_hash(&fl6->daddr); 427c08977bbSYOSHIFUJI Hideaki / 吉藤英明 val ^= ipv6_addr_hash(&fl6->saddr); 42851ebd318SNicolas Dichtel 42951ebd318SNicolas Dichtel /* Work only if this not encapsulated */ 43051ebd318SNicolas Dichtel switch (fl6->flowi6_proto) { 43151ebd318SNicolas Dichtel case IPPROTO_UDP: 43251ebd318SNicolas Dichtel case IPPROTO_TCP: 43351ebd318SNicolas Dichtel case IPPROTO_SCTP: 434b3ce5ae1SNicolas Dichtel val ^= (__force u16)fl6->fl6_sport; 435b3ce5ae1SNicolas Dichtel val ^= (__force u16)fl6->fl6_dport; 43651ebd318SNicolas Dichtel break; 43751ebd318SNicolas Dichtel 43851ebd318SNicolas Dichtel case IPPROTO_ICMPV6: 439b3ce5ae1SNicolas Dichtel val ^= (__force u16)fl6->fl6_icmp_type; 440b3ce5ae1SNicolas Dichtel val ^= (__force u16)fl6->fl6_icmp_code; 44151ebd318SNicolas Dichtel break; 44251ebd318SNicolas Dichtel } 44351ebd318SNicolas Dichtel /* RFC6438 recommands to use flowlabel */ 444b3ce5ae1SNicolas Dichtel val ^= (__force u32)fl6->flowlabel; 44551ebd318SNicolas Dichtel 44651ebd318SNicolas Dichtel /* Perhaps, we need to tune, this function? */ 44751ebd318SNicolas Dichtel val = val ^ (val >> 7) ^ (val >> 12); 44851ebd318SNicolas Dichtel return val % candidate_count; 44951ebd318SNicolas Dichtel } 45051ebd318SNicolas Dichtel 45151ebd318SNicolas Dichtel static struct rt6_info *rt6_multipath_select(struct rt6_info *match, 45252bd4c0cSNicolas Dichtel struct flowi6 *fl6, int oif, 45352bd4c0cSNicolas Dichtel int strict) 45451ebd318SNicolas Dichtel { 45551ebd318SNicolas Dichtel struct rt6_info *sibling, *next_sibling; 45651ebd318SNicolas Dichtel int route_choosen; 45751ebd318SNicolas Dichtel 45851ebd318SNicolas Dichtel route_choosen = rt6_info_hash_nhsfn(match->rt6i_nsiblings + 1, fl6); 45951ebd318SNicolas Dichtel /* Don't change the route, if route_choosen == 0 46051ebd318SNicolas Dichtel * (siblings does not include ourself) 46151ebd318SNicolas Dichtel */ 46251ebd318SNicolas Dichtel if (route_choosen) 46351ebd318SNicolas Dichtel list_for_each_entry_safe(sibling, next_sibling, 46451ebd318SNicolas Dichtel &match->rt6i_siblings, rt6i_siblings) { 46551ebd318SNicolas Dichtel route_choosen--; 46651ebd318SNicolas Dichtel if (route_choosen == 0) { 46752bd4c0cSNicolas Dichtel if (rt6_score_route(sibling, oif, strict) < 0) 46852bd4c0cSNicolas Dichtel break; 46951ebd318SNicolas Dichtel match = sibling; 47051ebd318SNicolas Dichtel break; 47151ebd318SNicolas Dichtel } 47251ebd318SNicolas Dichtel } 47351ebd318SNicolas Dichtel return match; 47451ebd318SNicolas Dichtel } 47551ebd318SNicolas Dichtel 4761da177e4SLinus Torvalds /* 477c71099acSThomas Graf * Route lookup. Any table->tb6_lock is implied. 4781da177e4SLinus Torvalds */ 4791da177e4SLinus Torvalds 4808ed67789SDaniel Lezcano static inline struct rt6_info *rt6_device_match(struct net *net, 4818ed67789SDaniel Lezcano struct rt6_info *rt, 482b71d1d42SEric Dumazet const struct in6_addr *saddr, 4831da177e4SLinus Torvalds int oif, 484d420895eSYOSHIFUJI Hideaki int flags) 4851da177e4SLinus Torvalds { 4861da177e4SLinus Torvalds struct rt6_info *local = NULL; 4871da177e4SLinus Torvalds struct rt6_info *sprt; 4881da177e4SLinus Torvalds 489dd3abc4eSYOSHIFUJI Hideaki if (!oif && ipv6_addr_any(saddr)) 490dd3abc4eSYOSHIFUJI Hideaki goto out; 491dd3abc4eSYOSHIFUJI Hideaki 492d8d1f30bSChangli Gao for (sprt = rt; sprt; sprt = sprt->dst.rt6_next) { 493d1918542SDavid S. Miller struct net_device *dev = sprt->dst.dev; 494dd3abc4eSYOSHIFUJI Hideaki 495dd3abc4eSYOSHIFUJI Hideaki if (oif) { 4961da177e4SLinus Torvalds if (dev->ifindex == oif) 4971da177e4SLinus Torvalds return sprt; 4981da177e4SLinus Torvalds if (dev->flags & IFF_LOOPBACK) { 49938308473SDavid S. Miller if (!sprt->rt6i_idev || 5001da177e4SLinus Torvalds sprt->rt6i_idev->dev->ifindex != oif) { 501d420895eSYOSHIFUJI Hideaki if (flags & RT6_LOOKUP_F_IFACE && oif) 5021da177e4SLinus Torvalds continue; 5031da177e4SLinus Torvalds if (local && (!oif || 5041da177e4SLinus Torvalds local->rt6i_idev->dev->ifindex == oif)) 5051da177e4SLinus Torvalds continue; 5061da177e4SLinus Torvalds } 5071da177e4SLinus Torvalds local = sprt; 5081da177e4SLinus Torvalds } 509dd3abc4eSYOSHIFUJI Hideaki } else { 510dd3abc4eSYOSHIFUJI Hideaki if (ipv6_chk_addr(net, saddr, dev, 511dd3abc4eSYOSHIFUJI Hideaki flags & RT6_LOOKUP_F_IFACE)) 512dd3abc4eSYOSHIFUJI Hideaki return sprt; 513dd3abc4eSYOSHIFUJI Hideaki } 5141da177e4SLinus Torvalds } 5151da177e4SLinus Torvalds 516dd3abc4eSYOSHIFUJI Hideaki if (oif) { 5171da177e4SLinus Torvalds if (local) 5181da177e4SLinus Torvalds return local; 5191da177e4SLinus Torvalds 520d420895eSYOSHIFUJI Hideaki if (flags & RT6_LOOKUP_F_IFACE) 5218ed67789SDaniel Lezcano return net->ipv6.ip6_null_entry; 5221da177e4SLinus Torvalds } 523dd3abc4eSYOSHIFUJI Hideaki out: 5241da177e4SLinus Torvalds return rt; 5251da177e4SLinus Torvalds } 5261da177e4SLinus Torvalds 52727097255SYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_ROUTER_PREF 528c2f17e82SHannes Frederic Sowa struct __rt6_probe_work { 529c2f17e82SHannes Frederic Sowa struct work_struct work; 530c2f17e82SHannes Frederic Sowa struct in6_addr target; 531c2f17e82SHannes Frederic Sowa struct net_device *dev; 532c2f17e82SHannes Frederic Sowa }; 533c2f17e82SHannes Frederic Sowa 534c2f17e82SHannes Frederic Sowa static void rt6_probe_deferred(struct work_struct *w) 535c2f17e82SHannes Frederic Sowa { 536c2f17e82SHannes Frederic Sowa struct in6_addr mcaddr; 537c2f17e82SHannes Frederic Sowa struct __rt6_probe_work *work = 538c2f17e82SHannes Frederic Sowa container_of(w, struct __rt6_probe_work, work); 539c2f17e82SHannes Frederic Sowa 540c2f17e82SHannes Frederic Sowa addrconf_addr_solict_mult(&work->target, &mcaddr); 541ab450605SJiri Benc ndisc_send_ns(work->dev, NULL, &work->target, &mcaddr, NULL, NULL); 542c2f17e82SHannes Frederic Sowa dev_put(work->dev); 543662f5533SMichael Büsch kfree(work); 544c2f17e82SHannes Frederic Sowa } 545c2f17e82SHannes Frederic Sowa 54627097255SYOSHIFUJI Hideaki static void rt6_probe(struct rt6_info *rt) 54727097255SYOSHIFUJI Hideaki { 548990edb42SMartin KaFai Lau struct __rt6_probe_work *work; 549f2c31e32SEric Dumazet struct neighbour *neigh; 55027097255SYOSHIFUJI Hideaki /* 55127097255SYOSHIFUJI Hideaki * Okay, this does not seem to be appropriate 55227097255SYOSHIFUJI Hideaki * for now, however, we need to check if it 55327097255SYOSHIFUJI Hideaki * is really so; aka Router Reachability Probing. 55427097255SYOSHIFUJI Hideaki * 55527097255SYOSHIFUJI Hideaki * Router Reachability Probe MUST be rate-limited 55627097255SYOSHIFUJI Hideaki * to no more than one per minute. 55727097255SYOSHIFUJI Hideaki */ 5582152caeaSYOSHIFUJI Hideaki / 吉藤英明 if (!rt || !(rt->rt6i_flags & RTF_GATEWAY)) 559fdd6681dSAmerigo Wang return; 5602152caeaSYOSHIFUJI Hideaki / 吉藤英明 rcu_read_lock_bh(); 5612152caeaSYOSHIFUJI Hideaki / 吉藤英明 neigh = __ipv6_neigh_lookup_noref(rt->dst.dev, &rt->rt6i_gateway); 5622152caeaSYOSHIFUJI Hideaki / 吉藤英明 if (neigh) { 5638d6c31bfSMartin KaFai Lau if (neigh->nud_state & NUD_VALID) 5648d6c31bfSMartin KaFai Lau goto out; 5658d6c31bfSMartin KaFai Lau 566990edb42SMartin KaFai Lau work = NULL; 5672152caeaSYOSHIFUJI Hideaki / 吉藤英明 write_lock(&neigh->lock); 568990edb42SMartin KaFai Lau if (!(neigh->nud_state & NUD_VALID) && 569990edb42SMartin KaFai Lau time_after(jiffies, 570990edb42SMartin KaFai Lau neigh->updated + 571990edb42SMartin KaFai Lau rt->rt6i_idev->cnf.rtr_probe_interval)) { 572c2f17e82SHannes Frederic Sowa work = kmalloc(sizeof(*work), GFP_ATOMIC); 573990edb42SMartin KaFai Lau if (work) 5747e980569SJiri Benc __neigh_set_probe_once(neigh); 575990edb42SMartin KaFai Lau } 576c2f17e82SHannes Frederic Sowa write_unlock(&neigh->lock); 577990edb42SMartin KaFai Lau } else { 578990edb42SMartin KaFai Lau work = kmalloc(sizeof(*work), GFP_ATOMIC); 579990edb42SMartin KaFai Lau } 580c2f17e82SHannes Frederic Sowa 581c2f17e82SHannes Frederic Sowa if (work) { 582c2f17e82SHannes Frederic Sowa INIT_WORK(&work->work, rt6_probe_deferred); 583c2f17e82SHannes Frederic Sowa work->target = rt->rt6i_gateway; 584c2f17e82SHannes Frederic Sowa dev_hold(rt->dst.dev); 585c2f17e82SHannes Frederic Sowa work->dev = rt->dst.dev; 586c2f17e82SHannes Frederic Sowa schedule_work(&work->work); 587c2f17e82SHannes Frederic Sowa } 588990edb42SMartin KaFai Lau 5898d6c31bfSMartin KaFai Lau out: 5902152caeaSYOSHIFUJI Hideaki / 吉藤英明 rcu_read_unlock_bh(); 591f2c31e32SEric Dumazet } 59227097255SYOSHIFUJI Hideaki #else 59327097255SYOSHIFUJI Hideaki static inline void rt6_probe(struct rt6_info *rt) 59427097255SYOSHIFUJI Hideaki { 59527097255SYOSHIFUJI Hideaki } 59627097255SYOSHIFUJI Hideaki #endif 59727097255SYOSHIFUJI Hideaki 5981da177e4SLinus Torvalds /* 599554cfb7eSYOSHIFUJI Hideaki * Default Router Selection (RFC 2461 6.3.6) 6001da177e4SLinus Torvalds */ 601b6f99a21SDave Jones static inline int rt6_check_dev(struct rt6_info *rt, int oif) 6021da177e4SLinus Torvalds { 603d1918542SDavid S. Miller struct net_device *dev = rt->dst.dev; 604161980f4SDavid S. Miller if (!oif || dev->ifindex == oif) 605554cfb7eSYOSHIFUJI Hideaki return 2; 606161980f4SDavid S. Miller if ((dev->flags & IFF_LOOPBACK) && 607161980f4SDavid S. Miller rt->rt6i_idev && rt->rt6i_idev->dev->ifindex == oif) 608161980f4SDavid S. Miller return 1; 609554cfb7eSYOSHIFUJI Hideaki return 0; 6101da177e4SLinus Torvalds } 6111da177e4SLinus Torvalds 612afc154e9SHannes Frederic Sowa static inline enum rt6_nud_state rt6_check_neigh(struct rt6_info *rt) 6131da177e4SLinus Torvalds { 614f2c31e32SEric Dumazet struct neighbour *neigh; 615afc154e9SHannes Frederic Sowa enum rt6_nud_state ret = RT6_NUD_FAIL_HARD; 616f2c31e32SEric Dumazet 6174d0c5911SYOSHIFUJI Hideaki if (rt->rt6i_flags & RTF_NONEXTHOP || 6184d0c5911SYOSHIFUJI Hideaki !(rt->rt6i_flags & RTF_GATEWAY)) 619afc154e9SHannes Frederic Sowa return RT6_NUD_SUCCEED; 620145a3621SYOSHIFUJI Hideaki / 吉藤英明 621145a3621SYOSHIFUJI Hideaki / 吉藤英明 rcu_read_lock_bh(); 622145a3621SYOSHIFUJI Hideaki / 吉藤英明 neigh = __ipv6_neigh_lookup_noref(rt->dst.dev, &rt->rt6i_gateway); 623145a3621SYOSHIFUJI Hideaki / 吉藤英明 if (neigh) { 624145a3621SYOSHIFUJI Hideaki / 吉藤英明 read_lock(&neigh->lock); 625554cfb7eSYOSHIFUJI Hideaki if (neigh->nud_state & NUD_VALID) 626afc154e9SHannes Frederic Sowa ret = RT6_NUD_SUCCEED; 627398bcbebSYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_ROUTER_PREF 628a5a81f0bSPaul Marks else if (!(neigh->nud_state & NUD_FAILED)) 629afc154e9SHannes Frederic Sowa ret = RT6_NUD_SUCCEED; 6307e980569SJiri Benc else 6317e980569SJiri Benc ret = RT6_NUD_FAIL_PROBE; 632398bcbebSYOSHIFUJI Hideaki #endif 633145a3621SYOSHIFUJI Hideaki / 吉藤英明 read_unlock(&neigh->lock); 634afc154e9SHannes Frederic Sowa } else { 635afc154e9SHannes Frederic Sowa ret = IS_ENABLED(CONFIG_IPV6_ROUTER_PREF) ? 6367e980569SJiri Benc RT6_NUD_SUCCEED : RT6_NUD_FAIL_DO_RR; 637a5a81f0bSPaul Marks } 638145a3621SYOSHIFUJI Hideaki / 吉藤英明 rcu_read_unlock_bh(); 639145a3621SYOSHIFUJI Hideaki / 吉藤英明 640a5a81f0bSPaul Marks return ret; 6411da177e4SLinus Torvalds } 6421da177e4SLinus Torvalds 643554cfb7eSYOSHIFUJI Hideaki static int rt6_score_route(struct rt6_info *rt, int oif, 644554cfb7eSYOSHIFUJI Hideaki int strict) 645554cfb7eSYOSHIFUJI Hideaki { 646a5a81f0bSPaul Marks int m; 6474d0c5911SYOSHIFUJI Hideaki 6484d0c5911SYOSHIFUJI Hideaki m = rt6_check_dev(rt, oif); 64977d16f45SYOSHIFUJI Hideaki if (!m && (strict & RT6_LOOKUP_F_IFACE)) 650afc154e9SHannes Frederic Sowa return RT6_NUD_FAIL_HARD; 651ebacaaa0SYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_ROUTER_PREF 652ebacaaa0SYOSHIFUJI Hideaki m |= IPV6_DECODE_PREF(IPV6_EXTRACT_PREF(rt->rt6i_flags)) << 2; 653ebacaaa0SYOSHIFUJI Hideaki #endif 654afc154e9SHannes Frederic Sowa if (strict & RT6_LOOKUP_F_REACHABLE) { 655afc154e9SHannes Frederic Sowa int n = rt6_check_neigh(rt); 656afc154e9SHannes Frederic Sowa if (n < 0) 657afc154e9SHannes Frederic Sowa return n; 658afc154e9SHannes Frederic Sowa } 659554cfb7eSYOSHIFUJI Hideaki return m; 660554cfb7eSYOSHIFUJI Hideaki } 661554cfb7eSYOSHIFUJI Hideaki 662f11e6659SDavid S. Miller static struct rt6_info *find_match(struct rt6_info *rt, int oif, int strict, 663afc154e9SHannes Frederic Sowa int *mpri, struct rt6_info *match, 664afc154e9SHannes Frederic Sowa bool *do_rr) 665554cfb7eSYOSHIFUJI Hideaki { 666554cfb7eSYOSHIFUJI Hideaki int m; 667afc154e9SHannes Frederic Sowa bool match_do_rr = false; 66835103d11SAndy Gospodarek struct inet6_dev *idev = rt->rt6i_idev; 66935103d11SAndy Gospodarek struct net_device *dev = rt->dst.dev; 67035103d11SAndy Gospodarek 67135103d11SAndy Gospodarek if (dev && !netif_carrier_ok(dev) && 67235103d11SAndy Gospodarek idev->cnf.ignore_routes_with_linkdown) 67335103d11SAndy Gospodarek goto out; 674554cfb7eSYOSHIFUJI Hideaki 675554cfb7eSYOSHIFUJI Hideaki if (rt6_check_expired(rt)) 676f11e6659SDavid S. Miller goto out; 677554cfb7eSYOSHIFUJI Hideaki 678554cfb7eSYOSHIFUJI Hideaki m = rt6_score_route(rt, oif, strict); 6797e980569SJiri Benc if (m == RT6_NUD_FAIL_DO_RR) { 680afc154e9SHannes Frederic Sowa match_do_rr = true; 681afc154e9SHannes Frederic Sowa m = 0; /* lowest valid score */ 6827e980569SJiri Benc } else if (m == RT6_NUD_FAIL_HARD) { 683f11e6659SDavid S. Miller goto out; 6841da177e4SLinus Torvalds } 685f11e6659SDavid S. Miller 686afc154e9SHannes Frederic Sowa if (strict & RT6_LOOKUP_F_REACHABLE) 687afc154e9SHannes Frederic Sowa rt6_probe(rt); 688afc154e9SHannes Frederic Sowa 6897e980569SJiri Benc /* note that m can be RT6_NUD_FAIL_PROBE at this point */ 690afc154e9SHannes Frederic Sowa if (m > *mpri) { 691afc154e9SHannes Frederic Sowa *do_rr = match_do_rr; 692afc154e9SHannes Frederic Sowa *mpri = m; 693afc154e9SHannes Frederic Sowa match = rt; 694afc154e9SHannes Frederic Sowa } 695f11e6659SDavid S. Miller out: 696f11e6659SDavid S. Miller return match; 6971da177e4SLinus Torvalds } 6981da177e4SLinus Torvalds 699f11e6659SDavid S. Miller static struct rt6_info *find_rr_leaf(struct fib6_node *fn, 700f11e6659SDavid S. Miller struct rt6_info *rr_head, 701afc154e9SHannes Frederic Sowa u32 metric, int oif, int strict, 702afc154e9SHannes Frederic Sowa bool *do_rr) 703f11e6659SDavid S. Miller { 7049fbdcfafSSteffen Klassert struct rt6_info *rt, *match, *cont; 705f11e6659SDavid S. Miller int mpri = -1; 706f11e6659SDavid S. Miller 707f11e6659SDavid S. Miller match = NULL; 7089fbdcfafSSteffen Klassert cont = NULL; 7099fbdcfafSSteffen Klassert for (rt = rr_head; rt; rt = rt->dst.rt6_next) { 7109fbdcfafSSteffen Klassert if (rt->rt6i_metric != metric) { 7119fbdcfafSSteffen Klassert cont = rt; 7129fbdcfafSSteffen Klassert break; 7139fbdcfafSSteffen Klassert } 7149fbdcfafSSteffen Klassert 715afc154e9SHannes Frederic Sowa match = find_match(rt, oif, strict, &mpri, match, do_rr); 7169fbdcfafSSteffen Klassert } 7179fbdcfafSSteffen Klassert 7189fbdcfafSSteffen Klassert for (rt = fn->leaf; rt && rt != rr_head; rt = rt->dst.rt6_next) { 7199fbdcfafSSteffen Klassert if (rt->rt6i_metric != metric) { 7209fbdcfafSSteffen Klassert cont = rt; 7219fbdcfafSSteffen Klassert break; 7229fbdcfafSSteffen Klassert } 7239fbdcfafSSteffen Klassert 7249fbdcfafSSteffen Klassert match = find_match(rt, oif, strict, &mpri, match, do_rr); 7259fbdcfafSSteffen Klassert } 7269fbdcfafSSteffen Klassert 7279fbdcfafSSteffen Klassert if (match || !cont) 7289fbdcfafSSteffen Klassert return match; 7299fbdcfafSSteffen Klassert 7309fbdcfafSSteffen Klassert for (rt = cont; rt; rt = rt->dst.rt6_next) 731afc154e9SHannes Frederic Sowa match = find_match(rt, oif, strict, &mpri, match, do_rr); 732f11e6659SDavid S. Miller 733f11e6659SDavid S. Miller return match; 734f11e6659SDavid S. Miller } 735f11e6659SDavid S. Miller 736f11e6659SDavid S. Miller static struct rt6_info *rt6_select(struct fib6_node *fn, int oif, int strict) 737f11e6659SDavid S. Miller { 738f11e6659SDavid S. Miller struct rt6_info *match, *rt0; 7398ed67789SDaniel Lezcano struct net *net; 740afc154e9SHannes Frederic Sowa bool do_rr = false; 741f11e6659SDavid S. Miller 742f11e6659SDavid S. Miller rt0 = fn->rr_ptr; 743f11e6659SDavid S. Miller if (!rt0) 744f11e6659SDavid S. Miller fn->rr_ptr = rt0 = fn->leaf; 745f11e6659SDavid S. Miller 746afc154e9SHannes Frederic Sowa match = find_rr_leaf(fn, rt0, rt0->rt6i_metric, oif, strict, 747afc154e9SHannes Frederic Sowa &do_rr); 748f11e6659SDavid S. Miller 749afc154e9SHannes Frederic Sowa if (do_rr) { 750d8d1f30bSChangli Gao struct rt6_info *next = rt0->dst.rt6_next; 751f11e6659SDavid S. Miller 752554cfb7eSYOSHIFUJI Hideaki /* no entries matched; do round-robin */ 753f11e6659SDavid S. Miller if (!next || next->rt6i_metric != rt0->rt6i_metric) 754f11e6659SDavid S. Miller next = fn->leaf; 755f11e6659SDavid S. Miller 756f11e6659SDavid S. Miller if (next != rt0) 757f11e6659SDavid S. Miller fn->rr_ptr = next; 758554cfb7eSYOSHIFUJI Hideaki } 759554cfb7eSYOSHIFUJI Hideaki 760d1918542SDavid S. Miller net = dev_net(rt0->dst.dev); 761a02cec21SEric Dumazet return match ? match : net->ipv6.ip6_null_entry; 7621da177e4SLinus Torvalds } 7631da177e4SLinus Torvalds 7648b9df265SMartin KaFai Lau static bool rt6_is_gw_or_nonexthop(const struct rt6_info *rt) 7658b9df265SMartin KaFai Lau { 7668b9df265SMartin KaFai Lau return (rt->rt6i_flags & (RTF_NONEXTHOP | RTF_GATEWAY)); 7678b9df265SMartin KaFai Lau } 7688b9df265SMartin KaFai Lau 76970ceb4f5SYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_ROUTE_INFO 77070ceb4f5SYOSHIFUJI Hideaki int rt6_route_rcv(struct net_device *dev, u8 *opt, int len, 771b71d1d42SEric Dumazet const struct in6_addr *gwaddr) 77270ceb4f5SYOSHIFUJI Hideaki { 773c346dca1SYOSHIFUJI Hideaki struct net *net = dev_net(dev); 77470ceb4f5SYOSHIFUJI Hideaki struct route_info *rinfo = (struct route_info *) opt; 77570ceb4f5SYOSHIFUJI Hideaki struct in6_addr prefix_buf, *prefix; 77670ceb4f5SYOSHIFUJI Hideaki unsigned int pref; 7774bed72e4SYOSHIFUJI Hideaki unsigned long lifetime; 77870ceb4f5SYOSHIFUJI Hideaki struct rt6_info *rt; 77970ceb4f5SYOSHIFUJI Hideaki 78070ceb4f5SYOSHIFUJI Hideaki if (len < sizeof(struct route_info)) { 78170ceb4f5SYOSHIFUJI Hideaki return -EINVAL; 78270ceb4f5SYOSHIFUJI Hideaki } 78370ceb4f5SYOSHIFUJI Hideaki 78470ceb4f5SYOSHIFUJI Hideaki /* Sanity check for prefix_len and length */ 78570ceb4f5SYOSHIFUJI Hideaki if (rinfo->length > 3) { 78670ceb4f5SYOSHIFUJI Hideaki return -EINVAL; 78770ceb4f5SYOSHIFUJI Hideaki } else if (rinfo->prefix_len > 128) { 78870ceb4f5SYOSHIFUJI Hideaki return -EINVAL; 78970ceb4f5SYOSHIFUJI Hideaki } else if (rinfo->prefix_len > 64) { 79070ceb4f5SYOSHIFUJI Hideaki if (rinfo->length < 2) { 79170ceb4f5SYOSHIFUJI Hideaki return -EINVAL; 79270ceb4f5SYOSHIFUJI Hideaki } 79370ceb4f5SYOSHIFUJI Hideaki } else if (rinfo->prefix_len > 0) { 79470ceb4f5SYOSHIFUJI Hideaki if (rinfo->length < 1) { 79570ceb4f5SYOSHIFUJI Hideaki return -EINVAL; 79670ceb4f5SYOSHIFUJI Hideaki } 79770ceb4f5SYOSHIFUJI Hideaki } 79870ceb4f5SYOSHIFUJI Hideaki 79970ceb4f5SYOSHIFUJI Hideaki pref = rinfo->route_pref; 80070ceb4f5SYOSHIFUJI Hideaki if (pref == ICMPV6_ROUTER_PREF_INVALID) 8013933fc95SJens Rosenboom return -EINVAL; 80270ceb4f5SYOSHIFUJI Hideaki 8034bed72e4SYOSHIFUJI Hideaki lifetime = addrconf_timeout_fixup(ntohl(rinfo->lifetime), HZ); 80470ceb4f5SYOSHIFUJI Hideaki 80570ceb4f5SYOSHIFUJI Hideaki if (rinfo->length == 3) 80670ceb4f5SYOSHIFUJI Hideaki prefix = (struct in6_addr *)rinfo->prefix; 80770ceb4f5SYOSHIFUJI Hideaki else { 80870ceb4f5SYOSHIFUJI Hideaki /* this function is safe */ 80970ceb4f5SYOSHIFUJI Hideaki ipv6_addr_prefix(&prefix_buf, 81070ceb4f5SYOSHIFUJI Hideaki (struct in6_addr *)rinfo->prefix, 81170ceb4f5SYOSHIFUJI Hideaki rinfo->prefix_len); 81270ceb4f5SYOSHIFUJI Hideaki prefix = &prefix_buf; 81370ceb4f5SYOSHIFUJI Hideaki } 81470ceb4f5SYOSHIFUJI Hideaki 815f104a567SDuan Jiong if (rinfo->prefix_len == 0) 816f104a567SDuan Jiong rt = rt6_get_dflt_router(gwaddr, dev); 817f104a567SDuan Jiong else 818f104a567SDuan Jiong rt = rt6_get_route_info(net, prefix, rinfo->prefix_len, 819f104a567SDuan Jiong gwaddr, dev->ifindex); 82070ceb4f5SYOSHIFUJI Hideaki 82170ceb4f5SYOSHIFUJI Hideaki if (rt && !lifetime) { 822e0a1ad73SThomas Graf ip6_del_rt(rt); 82370ceb4f5SYOSHIFUJI Hideaki rt = NULL; 82470ceb4f5SYOSHIFUJI Hideaki } 82570ceb4f5SYOSHIFUJI Hideaki 82670ceb4f5SYOSHIFUJI Hideaki if (!rt && lifetime) 827efa2cea0SDaniel Lezcano rt = rt6_add_route_info(net, prefix, rinfo->prefix_len, gwaddr, dev->ifindex, 82870ceb4f5SYOSHIFUJI Hideaki pref); 82970ceb4f5SYOSHIFUJI Hideaki else if (rt) 83070ceb4f5SYOSHIFUJI Hideaki rt->rt6i_flags = RTF_ROUTEINFO | 83170ceb4f5SYOSHIFUJI Hideaki (rt->rt6i_flags & ~RTF_PREF_MASK) | RTF_PREF(pref); 83270ceb4f5SYOSHIFUJI Hideaki 83370ceb4f5SYOSHIFUJI Hideaki if (rt) { 8341716a961SGao feng if (!addrconf_finite_timeout(lifetime)) 8351716a961SGao feng rt6_clean_expires(rt); 8361716a961SGao feng else 8371716a961SGao feng rt6_set_expires(rt, jiffies + HZ * lifetime); 8381716a961SGao feng 83994e187c0SAmerigo Wang ip6_rt_put(rt); 84070ceb4f5SYOSHIFUJI Hideaki } 84170ceb4f5SYOSHIFUJI Hideaki return 0; 84270ceb4f5SYOSHIFUJI Hideaki } 84370ceb4f5SYOSHIFUJI Hideaki #endif 84470ceb4f5SYOSHIFUJI Hideaki 845a3c00e46SMartin KaFai Lau static struct fib6_node* fib6_backtrack(struct fib6_node *fn, 846a3c00e46SMartin KaFai Lau struct in6_addr *saddr) 847a3c00e46SMartin KaFai Lau { 848a3c00e46SMartin KaFai Lau struct fib6_node *pn; 849a3c00e46SMartin KaFai Lau while (1) { 850a3c00e46SMartin KaFai Lau if (fn->fn_flags & RTN_TL_ROOT) 851a3c00e46SMartin KaFai Lau return NULL; 852a3c00e46SMartin KaFai Lau pn = fn->parent; 853a3c00e46SMartin KaFai Lau if (FIB6_SUBTREE(pn) && FIB6_SUBTREE(pn) != fn) 854a3c00e46SMartin KaFai Lau fn = fib6_lookup(FIB6_SUBTREE(pn), NULL, saddr); 855a3c00e46SMartin KaFai Lau else 856a3c00e46SMartin KaFai Lau fn = pn; 857a3c00e46SMartin KaFai Lau if (fn->fn_flags & RTN_RTINFO) 858a3c00e46SMartin KaFai Lau return fn; 859a3c00e46SMartin KaFai Lau } 860a3c00e46SMartin KaFai Lau } 861c71099acSThomas Graf 8628ed67789SDaniel Lezcano static struct rt6_info *ip6_pol_route_lookup(struct net *net, 8638ed67789SDaniel Lezcano struct fib6_table *table, 8644c9483b2SDavid S. Miller struct flowi6 *fl6, int flags) 8651da177e4SLinus Torvalds { 8661da177e4SLinus Torvalds struct fib6_node *fn; 8671da177e4SLinus Torvalds struct rt6_info *rt; 8681da177e4SLinus Torvalds 869c71099acSThomas Graf read_lock_bh(&table->tb6_lock); 8704c9483b2SDavid S. Miller fn = fib6_lookup(&table->tb6_root, &fl6->daddr, &fl6->saddr); 871c71099acSThomas Graf restart: 872c71099acSThomas Graf rt = fn->leaf; 8734c9483b2SDavid S. Miller rt = rt6_device_match(net, rt, &fl6->saddr, fl6->flowi6_oif, flags); 87451ebd318SNicolas Dichtel if (rt->rt6i_nsiblings && fl6->flowi6_oif == 0) 87552bd4c0cSNicolas Dichtel rt = rt6_multipath_select(rt, fl6, fl6->flowi6_oif, flags); 876a3c00e46SMartin KaFai Lau if (rt == net->ipv6.ip6_null_entry) { 877a3c00e46SMartin KaFai Lau fn = fib6_backtrack(fn, &fl6->saddr); 878a3c00e46SMartin KaFai Lau if (fn) 879a3c00e46SMartin KaFai Lau goto restart; 880a3c00e46SMartin KaFai Lau } 881d8d1f30bSChangli Gao dst_use(&rt->dst, jiffies); 882c71099acSThomas Graf read_unlock_bh(&table->tb6_lock); 8831da177e4SLinus Torvalds return rt; 884c71099acSThomas Graf 885c71099acSThomas Graf } 886c71099acSThomas Graf 887ea6e574eSFlorian Westphal struct dst_entry *ip6_route_lookup(struct net *net, struct flowi6 *fl6, 888ea6e574eSFlorian Westphal int flags) 889ea6e574eSFlorian Westphal { 890ea6e574eSFlorian Westphal return fib6_rule_lookup(net, fl6, flags, ip6_pol_route_lookup); 891ea6e574eSFlorian Westphal } 892ea6e574eSFlorian Westphal EXPORT_SYMBOL_GPL(ip6_route_lookup); 893ea6e574eSFlorian Westphal 8949acd9f3aSYOSHIFUJI Hideaki struct rt6_info *rt6_lookup(struct net *net, const struct in6_addr *daddr, 8959acd9f3aSYOSHIFUJI Hideaki const struct in6_addr *saddr, int oif, int strict) 896c71099acSThomas Graf { 8974c9483b2SDavid S. Miller struct flowi6 fl6 = { 8984c9483b2SDavid S. Miller .flowi6_oif = oif, 8994c9483b2SDavid S. Miller .daddr = *daddr, 900c71099acSThomas Graf }; 901c71099acSThomas Graf struct dst_entry *dst; 90277d16f45SYOSHIFUJI Hideaki int flags = strict ? RT6_LOOKUP_F_IFACE : 0; 903c71099acSThomas Graf 904adaa70bbSThomas Graf if (saddr) { 9054c9483b2SDavid S. Miller memcpy(&fl6.saddr, saddr, sizeof(*saddr)); 906adaa70bbSThomas Graf flags |= RT6_LOOKUP_F_HAS_SADDR; 907adaa70bbSThomas Graf } 908adaa70bbSThomas Graf 9094c9483b2SDavid S. Miller dst = fib6_rule_lookup(net, &fl6, flags, ip6_pol_route_lookup); 910c71099acSThomas Graf if (dst->error == 0) 911c71099acSThomas Graf return (struct rt6_info *) dst; 912c71099acSThomas Graf 913c71099acSThomas Graf dst_release(dst); 914c71099acSThomas Graf 9151da177e4SLinus Torvalds return NULL; 9161da177e4SLinus Torvalds } 9177159039aSYOSHIFUJI Hideaki EXPORT_SYMBOL(rt6_lookup); 9187159039aSYOSHIFUJI Hideaki 919c71099acSThomas Graf /* ip6_ins_rt is called with FREE table->tb6_lock. 9201da177e4SLinus Torvalds It takes new route entry, the addition fails by any reason the 9211da177e4SLinus Torvalds route is freed. In any case, if caller does not hold it, it may 9221da177e4SLinus Torvalds be destroyed. 9231da177e4SLinus Torvalds */ 9241da177e4SLinus Torvalds 925e5fd387aSMichal Kubeček static int __ip6_ins_rt(struct rt6_info *rt, struct nl_info *info, 926e715b6d3SFlorian Westphal struct mx6_config *mxc) 9271da177e4SLinus Torvalds { 9281da177e4SLinus Torvalds int err; 929c71099acSThomas Graf struct fib6_table *table; 9301da177e4SLinus Torvalds 931c71099acSThomas Graf table = rt->rt6i_table; 932c71099acSThomas Graf write_lock_bh(&table->tb6_lock); 933e715b6d3SFlorian Westphal err = fib6_add(&table->tb6_root, rt, info, mxc); 934c71099acSThomas Graf write_unlock_bh(&table->tb6_lock); 9351da177e4SLinus Torvalds 9361da177e4SLinus Torvalds return err; 9371da177e4SLinus Torvalds } 9381da177e4SLinus Torvalds 93940e22e8fSThomas Graf int ip6_ins_rt(struct rt6_info *rt) 94040e22e8fSThomas Graf { 941e715b6d3SFlorian Westphal struct nl_info info = { .nl_net = dev_net(rt->dst.dev), }; 942e715b6d3SFlorian Westphal struct mx6_config mxc = { .mx = NULL, }; 943e715b6d3SFlorian Westphal 944e715b6d3SFlorian Westphal return __ip6_ins_rt(rt, &info, &mxc); 94540e22e8fSThomas Graf } 94640e22e8fSThomas Graf 9478b9df265SMartin KaFai Lau static struct rt6_info *ip6_rt_cache_alloc(struct rt6_info *ort, 94821efcfa0SEric Dumazet const struct in6_addr *daddr, 949b71d1d42SEric Dumazet const struct in6_addr *saddr) 9501da177e4SLinus Torvalds { 9511da177e4SLinus Torvalds struct rt6_info *rt; 9521da177e4SLinus Torvalds 9531da177e4SLinus Torvalds /* 9541da177e4SLinus Torvalds * Clone the route. 9551da177e4SLinus Torvalds */ 9561da177e4SLinus Torvalds 957d52d3997SMartin KaFai Lau if (ort->rt6i_flags & (RTF_CACHE | RTF_PCPU)) 95883a09abdSMartin KaFai Lau ort = (struct rt6_info *)ort->dst.from; 9591da177e4SLinus Torvalds 960ad706862SMartin KaFai Lau rt = __ip6_dst_alloc(dev_net(ort->dst.dev), ort->dst.dev, 0); 96183a09abdSMartin KaFai Lau 96283a09abdSMartin KaFai Lau if (!rt) 96383a09abdSMartin KaFai Lau return NULL; 96483a09abdSMartin KaFai Lau 96583a09abdSMartin KaFai Lau ip6_rt_copy_init(rt, ort); 9668b9df265SMartin KaFai Lau rt->rt6i_flags |= RTF_CACHE; 96783a09abdSMartin KaFai Lau rt->rt6i_metric = 0; 96883a09abdSMartin KaFai Lau rt->dst.flags |= DST_HOST; 96983a09abdSMartin KaFai Lau rt->rt6i_dst.addr = *daddr; 97083a09abdSMartin KaFai Lau rt->rt6i_dst.plen = 128; 9718b9df265SMartin KaFai Lau 9728b9df265SMartin KaFai Lau if (!rt6_is_gw_or_nonexthop(ort)) { 973bb3c3686SDavid S. Miller if (ort->rt6i_dst.plen != 128 && 97421efcfa0SEric Dumazet ipv6_addr_equal(&ort->rt6i_dst.addr, daddr)) 97558c4fb86SYOSHIFUJI Hideaki rt->rt6i_flags |= RTF_ANYCAST; 9761da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES 9771da177e4SLinus Torvalds if (rt->rt6i_src.plen && saddr) { 9784e3fd7a0SAlexey Dobriyan rt->rt6i_src.addr = *saddr; 9791da177e4SLinus Torvalds rt->rt6i_src.plen = 128; 9801da177e4SLinus Torvalds } 9811da177e4SLinus Torvalds #endif 98295a9a5baSYOSHIFUJI Hideaki } 98395a9a5baSYOSHIFUJI Hideaki 984299d9939SYOSHIFUJI Hideaki return rt; 985299d9939SYOSHIFUJI Hideaki } 986299d9939SYOSHIFUJI Hideaki 987d52d3997SMartin KaFai Lau static struct rt6_info *ip6_rt_pcpu_alloc(struct rt6_info *rt) 988d52d3997SMartin KaFai Lau { 989d52d3997SMartin KaFai Lau struct rt6_info *pcpu_rt; 990d52d3997SMartin KaFai Lau 991d52d3997SMartin KaFai Lau pcpu_rt = __ip6_dst_alloc(dev_net(rt->dst.dev), 992ad706862SMartin KaFai Lau rt->dst.dev, rt->dst.flags); 993d52d3997SMartin KaFai Lau 994d52d3997SMartin KaFai Lau if (!pcpu_rt) 995d52d3997SMartin KaFai Lau return NULL; 996d52d3997SMartin KaFai Lau ip6_rt_copy_init(pcpu_rt, rt); 997d52d3997SMartin KaFai Lau pcpu_rt->rt6i_protocol = rt->rt6i_protocol; 998d52d3997SMartin KaFai Lau pcpu_rt->rt6i_flags |= RTF_PCPU; 999d52d3997SMartin KaFai Lau return pcpu_rt; 1000d52d3997SMartin KaFai Lau } 1001d52d3997SMartin KaFai Lau 1002d52d3997SMartin KaFai Lau /* It should be called with read_lock_bh(&tb6_lock) acquired */ 1003d52d3997SMartin KaFai Lau static struct rt6_info *rt6_get_pcpu_route(struct rt6_info *rt) 1004d52d3997SMartin KaFai Lau { 1005a73e4195SMartin KaFai Lau struct rt6_info *pcpu_rt, **p; 1006d52d3997SMartin KaFai Lau 1007d52d3997SMartin KaFai Lau p = this_cpu_ptr(rt->rt6i_pcpu); 1008d52d3997SMartin KaFai Lau pcpu_rt = *p; 1009d52d3997SMartin KaFai Lau 1010a73e4195SMartin KaFai Lau if (pcpu_rt) { 1011a73e4195SMartin KaFai Lau dst_hold(&pcpu_rt->dst); 1012a73e4195SMartin KaFai Lau rt6_dst_from_metrics_check(pcpu_rt); 1013a73e4195SMartin KaFai Lau } 1014a73e4195SMartin KaFai Lau return pcpu_rt; 1015a73e4195SMartin KaFai Lau } 1016a73e4195SMartin KaFai Lau 1017a73e4195SMartin KaFai Lau static struct rt6_info *rt6_make_pcpu_route(struct rt6_info *rt) 1018a73e4195SMartin KaFai Lau { 10199c7370a1SMartin KaFai Lau struct fib6_table *table = rt->rt6i_table; 1020a73e4195SMartin KaFai Lau struct rt6_info *pcpu_rt, *prev, **p; 1021d52d3997SMartin KaFai Lau 1022d52d3997SMartin KaFai Lau pcpu_rt = ip6_rt_pcpu_alloc(rt); 1023d52d3997SMartin KaFai Lau if (!pcpu_rt) { 1024d52d3997SMartin KaFai Lau struct net *net = dev_net(rt->dst.dev); 1025d52d3997SMartin KaFai Lau 10269c7370a1SMartin KaFai Lau dst_hold(&net->ipv6.ip6_null_entry->dst); 10279c7370a1SMartin KaFai Lau return net->ipv6.ip6_null_entry; 1028d52d3997SMartin KaFai Lau } 1029d52d3997SMartin KaFai Lau 10309c7370a1SMartin KaFai Lau read_lock_bh(&table->tb6_lock); 10319c7370a1SMartin KaFai Lau if (rt->rt6i_pcpu) { 1032a73e4195SMartin KaFai Lau p = this_cpu_ptr(rt->rt6i_pcpu); 1033d52d3997SMartin KaFai Lau prev = cmpxchg(p, NULL, pcpu_rt); 1034d52d3997SMartin KaFai Lau if (prev) { 1035d52d3997SMartin KaFai Lau /* If someone did it before us, return prev instead */ 1036d52d3997SMartin KaFai Lau dst_destroy(&pcpu_rt->dst); 1037d52d3997SMartin KaFai Lau pcpu_rt = prev; 1038d52d3997SMartin KaFai Lau } 10399c7370a1SMartin KaFai Lau } else { 10409c7370a1SMartin KaFai Lau /* rt has been removed from the fib6 tree 10419c7370a1SMartin KaFai Lau * before we have a chance to acquire the read_lock. 10429c7370a1SMartin KaFai Lau * In this case, don't brother to create a pcpu rt 10439c7370a1SMartin KaFai Lau * since rt is going away anyway. The next 10449c7370a1SMartin KaFai Lau * dst_check() will trigger a re-lookup. 10459c7370a1SMartin KaFai Lau */ 10469c7370a1SMartin KaFai Lau dst_destroy(&pcpu_rt->dst); 10479c7370a1SMartin KaFai Lau pcpu_rt = rt; 10489c7370a1SMartin KaFai Lau } 1049d52d3997SMartin KaFai Lau dst_hold(&pcpu_rt->dst); 1050d52d3997SMartin KaFai Lau rt6_dst_from_metrics_check(pcpu_rt); 10519c7370a1SMartin KaFai Lau read_unlock_bh(&table->tb6_lock); 1052d52d3997SMartin KaFai Lau return pcpu_rt; 1053d52d3997SMartin KaFai Lau } 1054d52d3997SMartin KaFai Lau 10558ed67789SDaniel Lezcano static struct rt6_info *ip6_pol_route(struct net *net, struct fib6_table *table, int oif, 10564c9483b2SDavid S. Miller struct flowi6 *fl6, int flags) 10571da177e4SLinus Torvalds { 1058367efcb9SMartin KaFai Lau struct fib6_node *fn, *saved_fn; 105945e4fd26SMartin KaFai Lau struct rt6_info *rt; 1060c71099acSThomas Graf int strict = 0; 10611da177e4SLinus Torvalds 106277d16f45SYOSHIFUJI Hideaki strict |= flags & RT6_LOOKUP_F_IFACE; 1063367efcb9SMartin KaFai Lau if (net->ipv6.devconf_all->forwarding == 0) 1064367efcb9SMartin KaFai Lau strict |= RT6_LOOKUP_F_REACHABLE; 10651da177e4SLinus Torvalds 1066c71099acSThomas Graf read_lock_bh(&table->tb6_lock); 10671da177e4SLinus Torvalds 10684c9483b2SDavid S. Miller fn = fib6_lookup(&table->tb6_root, &fl6->daddr, &fl6->saddr); 1069367efcb9SMartin KaFai Lau saved_fn = fn; 10701da177e4SLinus Torvalds 1071a3c00e46SMartin KaFai Lau redo_rt6_select: 1072367efcb9SMartin KaFai Lau rt = rt6_select(fn, oif, strict); 107352bd4c0cSNicolas Dichtel if (rt->rt6i_nsiblings) 1074367efcb9SMartin KaFai Lau rt = rt6_multipath_select(rt, fl6, oif, strict); 1075a3c00e46SMartin KaFai Lau if (rt == net->ipv6.ip6_null_entry) { 1076a3c00e46SMartin KaFai Lau fn = fib6_backtrack(fn, &fl6->saddr); 1077a3c00e46SMartin KaFai Lau if (fn) 1078a3c00e46SMartin KaFai Lau goto redo_rt6_select; 1079367efcb9SMartin KaFai Lau else if (strict & RT6_LOOKUP_F_REACHABLE) { 1080367efcb9SMartin KaFai Lau /* also consider unreachable route */ 1081367efcb9SMartin KaFai Lau strict &= ~RT6_LOOKUP_F_REACHABLE; 1082367efcb9SMartin KaFai Lau fn = saved_fn; 1083367efcb9SMartin KaFai Lau goto redo_rt6_select; 1084367efcb9SMartin KaFai Lau } 1085a3c00e46SMartin KaFai Lau } 1086a3c00e46SMartin KaFai Lau 1087d52d3997SMartin KaFai Lau 1088d52d3997SMartin KaFai Lau if (rt == net->ipv6.ip6_null_entry || (rt->rt6i_flags & RTF_CACHE)) { 10893da59bd9SMartin KaFai Lau dst_use(&rt->dst, jiffies); 1090c71099acSThomas Graf read_unlock_bh(&table->tb6_lock); 10911da177e4SLinus Torvalds 1092d52d3997SMartin KaFai Lau rt6_dst_from_metrics_check(rt); 1093d52d3997SMartin KaFai Lau return rt; 10943da59bd9SMartin KaFai Lau } else if (unlikely((fl6->flowi6_flags & FLOWI_FLAG_KNOWN_NH) && 10953da59bd9SMartin KaFai Lau !(rt->rt6i_flags & RTF_GATEWAY))) { 10963da59bd9SMartin KaFai Lau /* Create a RTF_CACHE clone which will not be 10973da59bd9SMartin KaFai Lau * owned by the fib6 tree. It is for the special case where 10983da59bd9SMartin KaFai Lau * the daddr in the skb during the neighbor look-up is different 10993da59bd9SMartin KaFai Lau * from the fl6->daddr used to look-up route here. 11003da59bd9SMartin KaFai Lau */ 1101c71099acSThomas Graf 11023da59bd9SMartin KaFai Lau struct rt6_info *uncached_rt; 11033da59bd9SMartin KaFai Lau 1104d52d3997SMartin KaFai Lau dst_use(&rt->dst, jiffies); 1105d52d3997SMartin KaFai Lau read_unlock_bh(&table->tb6_lock); 1106d52d3997SMartin KaFai Lau 11073da59bd9SMartin KaFai Lau uncached_rt = ip6_rt_cache_alloc(rt, &fl6->daddr, NULL); 11083da59bd9SMartin KaFai Lau dst_release(&rt->dst); 11093da59bd9SMartin KaFai Lau 11103da59bd9SMartin KaFai Lau if (uncached_rt) 11118d0b94afSMartin KaFai Lau rt6_uncached_list_add(uncached_rt); 11123da59bd9SMartin KaFai Lau else 11133da59bd9SMartin KaFai Lau uncached_rt = net->ipv6.ip6_null_entry; 1114d52d3997SMartin KaFai Lau 11153da59bd9SMartin KaFai Lau dst_hold(&uncached_rt->dst); 11163da59bd9SMartin KaFai Lau return uncached_rt; 11173da59bd9SMartin KaFai Lau 1118d52d3997SMartin KaFai Lau } else { 1119d52d3997SMartin KaFai Lau /* Get a percpu copy */ 1120d52d3997SMartin KaFai Lau 1121d52d3997SMartin KaFai Lau struct rt6_info *pcpu_rt; 1122d52d3997SMartin KaFai Lau 1123d52d3997SMartin KaFai Lau rt->dst.lastuse = jiffies; 1124d52d3997SMartin KaFai Lau rt->dst.__use++; 1125d52d3997SMartin KaFai Lau pcpu_rt = rt6_get_pcpu_route(rt); 1126d52d3997SMartin KaFai Lau 11279c7370a1SMartin KaFai Lau if (pcpu_rt) { 1128d52d3997SMartin KaFai Lau read_unlock_bh(&table->tb6_lock); 11299c7370a1SMartin KaFai Lau } else { 11309c7370a1SMartin KaFai Lau /* We have to do the read_unlock first 11319c7370a1SMartin KaFai Lau * because rt6_make_pcpu_route() may trigger 11329c7370a1SMartin KaFai Lau * ip6_dst_gc() which will take the write_lock. 11339c7370a1SMartin KaFai Lau */ 11349c7370a1SMartin KaFai Lau dst_hold(&rt->dst); 11359c7370a1SMartin KaFai Lau read_unlock_bh(&table->tb6_lock); 11369c7370a1SMartin KaFai Lau pcpu_rt = rt6_make_pcpu_route(rt); 11379c7370a1SMartin KaFai Lau dst_release(&rt->dst); 11389c7370a1SMartin KaFai Lau } 1139d52d3997SMartin KaFai Lau 1140d52d3997SMartin KaFai Lau return pcpu_rt; 11419c7370a1SMartin KaFai Lau 1142d52d3997SMartin KaFai Lau } 1143c71099acSThomas Graf } 1144c71099acSThomas Graf 11458ed67789SDaniel Lezcano static struct rt6_info *ip6_pol_route_input(struct net *net, struct fib6_table *table, 11464c9483b2SDavid S. Miller struct flowi6 *fl6, int flags) 11474acad72dSPavel Emelyanov { 11484c9483b2SDavid S. Miller return ip6_pol_route(net, table, fl6->flowi6_iif, fl6, flags); 11494acad72dSPavel Emelyanov } 11504acad72dSPavel Emelyanov 115172331bc0SShmulik Ladkani static struct dst_entry *ip6_route_input_lookup(struct net *net, 115272331bc0SShmulik Ladkani struct net_device *dev, 115372331bc0SShmulik Ladkani struct flowi6 *fl6, int flags) 115472331bc0SShmulik Ladkani { 115572331bc0SShmulik Ladkani if (rt6_need_strict(&fl6->daddr) && dev->type != ARPHRD_PIMREG) 115672331bc0SShmulik Ladkani flags |= RT6_LOOKUP_F_IFACE; 115772331bc0SShmulik Ladkani 115872331bc0SShmulik Ladkani return fib6_rule_lookup(net, fl6, flags, ip6_pol_route_input); 115972331bc0SShmulik Ladkani } 116072331bc0SShmulik Ladkani 1161c71099acSThomas Graf void ip6_route_input(struct sk_buff *skb) 1162c71099acSThomas Graf { 1163b71d1d42SEric Dumazet const struct ipv6hdr *iph = ipv6_hdr(skb); 1164c346dca1SYOSHIFUJI Hideaki struct net *net = dev_net(skb->dev); 1165adaa70bbSThomas Graf int flags = RT6_LOOKUP_F_HAS_SADDR; 1166904af04dSJiri Benc struct ip_tunnel_info *tun_info; 11674c9483b2SDavid S. Miller struct flowi6 fl6 = { 11684c9483b2SDavid S. Miller .flowi6_iif = skb->dev->ifindex, 11694c9483b2SDavid S. Miller .daddr = iph->daddr, 11704c9483b2SDavid S. Miller .saddr = iph->saddr, 11716502ca52SYOSHIFUJI Hideaki / 吉藤英明 .flowlabel = ip6_flowinfo(iph), 11724c9483b2SDavid S. Miller .flowi6_mark = skb->mark, 11734c9483b2SDavid S. Miller .flowi6_proto = iph->nexthdr, 1174c71099acSThomas Graf }; 1175adaa70bbSThomas Graf 1176904af04dSJiri Benc tun_info = skb_tunnel_info(skb); 117746fa062aSJiri Benc if (tun_info && !(tun_info->mode & IP_TUNNEL_INFO_TX)) 1178904af04dSJiri Benc fl6.flowi6_tun_key.tun_id = tun_info->key.tun_id; 117906e9d040SJiri Benc skb_dst_drop(skb); 118072331bc0SShmulik Ladkani skb_dst_set(skb, ip6_route_input_lookup(net, skb->dev, &fl6, flags)); 1181c71099acSThomas Graf } 1182c71099acSThomas Graf 11838ed67789SDaniel Lezcano static struct rt6_info *ip6_pol_route_output(struct net *net, struct fib6_table *table, 11844c9483b2SDavid S. Miller struct flowi6 *fl6, int flags) 1185c71099acSThomas Graf { 11864c9483b2SDavid S. Miller return ip6_pol_route(net, table, fl6->flowi6_oif, fl6, flags); 1187c71099acSThomas Graf } 1188c71099acSThomas Graf 11899c7a4f9cSFlorian Westphal struct dst_entry *ip6_route_output(struct net *net, const struct sock *sk, 11904c9483b2SDavid S. Miller struct flowi6 *fl6) 1191c71099acSThomas Graf { 1192c71099acSThomas Graf int flags = 0; 1193c71099acSThomas Graf 11941fb9489bSPavel Emelyanov fl6->flowi6_iif = LOOPBACK_IFINDEX; 11954dc27d1cSDavid McCullough 11964c9483b2SDavid S. Miller if ((sk && sk->sk_bound_dev_if) || rt6_need_strict(&fl6->daddr)) 119777d16f45SYOSHIFUJI Hideaki flags |= RT6_LOOKUP_F_IFACE; 1198c71099acSThomas Graf 11994c9483b2SDavid S. Miller if (!ipv6_addr_any(&fl6->saddr)) 1200adaa70bbSThomas Graf flags |= RT6_LOOKUP_F_HAS_SADDR; 12010c9a2ac1SYOSHIFUJI Hideaki / 吉藤英明 else if (sk) 12020c9a2ac1SYOSHIFUJI Hideaki / 吉藤英明 flags |= rt6_srcprefs2flags(inet6_sk(sk)->srcprefs); 1203adaa70bbSThomas Graf 12044c9483b2SDavid S. Miller return fib6_rule_lookup(net, fl6, flags, ip6_pol_route_output); 12051da177e4SLinus Torvalds } 12067159039aSYOSHIFUJI Hideaki EXPORT_SYMBOL(ip6_route_output); 12071da177e4SLinus Torvalds 12082774c131SDavid S. Miller struct dst_entry *ip6_blackhole_route(struct net *net, struct dst_entry *dst_orig) 120914e50e57SDavid S. Miller { 12105c1e6aa3SDavid S. Miller struct rt6_info *rt, *ort = (struct rt6_info *) dst_orig; 121114e50e57SDavid S. Miller struct dst_entry *new = NULL; 121214e50e57SDavid S. Miller 1213f5b0a874SDavid S. Miller rt = dst_alloc(&ip6_dst_blackhole_ops, ort->dst.dev, 1, DST_OBSOLETE_NONE, 0); 121414e50e57SDavid S. Miller if (rt) { 1215d8d1f30bSChangli Gao new = &rt->dst; 121614e50e57SDavid S. Miller 12178104891bSSteffen Klassert memset(new + 1, 0, sizeof(*rt) - sizeof(*new)); 12188104891bSSteffen Klassert 121914e50e57SDavid S. Miller new->__use = 1; 1220352e512cSHerbert Xu new->input = dst_discard; 1221aad88724SEric Dumazet new->output = dst_discard_sk; 122214e50e57SDavid S. Miller 122321efcfa0SEric Dumazet if (dst_metrics_read_only(&ort->dst)) 122421efcfa0SEric Dumazet new->_metrics = ort->dst._metrics; 122521efcfa0SEric Dumazet else 1226defb3519SDavid S. Miller dst_copy_metrics(new, &ort->dst); 122714e50e57SDavid S. Miller rt->rt6i_idev = ort->rt6i_idev; 122814e50e57SDavid S. Miller if (rt->rt6i_idev) 122914e50e57SDavid S. Miller in6_dev_hold(rt->rt6i_idev); 123014e50e57SDavid S. Miller 12314e3fd7a0SAlexey Dobriyan rt->rt6i_gateway = ort->rt6i_gateway; 12321716a961SGao feng rt->rt6i_flags = ort->rt6i_flags; 123314e50e57SDavid S. Miller rt->rt6i_metric = 0; 123414e50e57SDavid S. Miller 123514e50e57SDavid S. Miller memcpy(&rt->rt6i_dst, &ort->rt6i_dst, sizeof(struct rt6key)); 123614e50e57SDavid S. Miller #ifdef CONFIG_IPV6_SUBTREES 123714e50e57SDavid S. Miller memcpy(&rt->rt6i_src, &ort->rt6i_src, sizeof(struct rt6key)); 123814e50e57SDavid S. Miller #endif 123914e50e57SDavid S. Miller 124014e50e57SDavid S. Miller dst_free(new); 124114e50e57SDavid S. Miller } 124214e50e57SDavid S. Miller 124369ead7afSDavid S. Miller dst_release(dst_orig); 124469ead7afSDavid S. Miller return new ? new : ERR_PTR(-ENOMEM); 124514e50e57SDavid S. Miller } 124614e50e57SDavid S. Miller 12471da177e4SLinus Torvalds /* 12481da177e4SLinus Torvalds * Destination cache support functions 12491da177e4SLinus Torvalds */ 12501da177e4SLinus Torvalds 12514b32b5adSMartin KaFai Lau static void rt6_dst_from_metrics_check(struct rt6_info *rt) 12524b32b5adSMartin KaFai Lau { 12534b32b5adSMartin KaFai Lau if (rt->dst.from && 12544b32b5adSMartin KaFai Lau dst_metrics_ptr(&rt->dst) != dst_metrics_ptr(rt->dst.from)) 12554b32b5adSMartin KaFai Lau dst_init_metrics(&rt->dst, dst_metrics_ptr(rt->dst.from), true); 12564b32b5adSMartin KaFai Lau } 12574b32b5adSMartin KaFai Lau 12583da59bd9SMartin KaFai Lau static struct dst_entry *rt6_check(struct rt6_info *rt, u32 cookie) 12593da59bd9SMartin KaFai Lau { 12603da59bd9SMartin KaFai Lau if (!rt->rt6i_node || (rt->rt6i_node->fn_sernum != cookie)) 12613da59bd9SMartin KaFai Lau return NULL; 12623da59bd9SMartin KaFai Lau 12633da59bd9SMartin KaFai Lau if (rt6_check_expired(rt)) 12643da59bd9SMartin KaFai Lau return NULL; 12653da59bd9SMartin KaFai Lau 12663da59bd9SMartin KaFai Lau return &rt->dst; 12673da59bd9SMartin KaFai Lau } 12683da59bd9SMartin KaFai Lau 12693da59bd9SMartin KaFai Lau static struct dst_entry *rt6_dst_from_check(struct rt6_info *rt, u32 cookie) 12703da59bd9SMartin KaFai Lau { 12713da59bd9SMartin KaFai Lau if (rt->dst.obsolete == DST_OBSOLETE_FORCE_CHK && 12723da59bd9SMartin KaFai Lau rt6_check((struct rt6_info *)(rt->dst.from), cookie)) 12733da59bd9SMartin KaFai Lau return &rt->dst; 12743da59bd9SMartin KaFai Lau else 12753da59bd9SMartin KaFai Lau return NULL; 12763da59bd9SMartin KaFai Lau } 12773da59bd9SMartin KaFai Lau 12781da177e4SLinus Torvalds static struct dst_entry *ip6_dst_check(struct dst_entry *dst, u32 cookie) 12791da177e4SLinus Torvalds { 12801da177e4SLinus Torvalds struct rt6_info *rt; 12811da177e4SLinus Torvalds 12821da177e4SLinus Torvalds rt = (struct rt6_info *) dst; 12831da177e4SLinus Torvalds 12846f3118b5SNicolas Dichtel /* All IPV6 dsts are created with ->obsolete set to the value 12856f3118b5SNicolas Dichtel * DST_OBSOLETE_FORCE_CHK which forces validation calls down 12866f3118b5SNicolas Dichtel * into this function always. 12876f3118b5SNicolas Dichtel */ 1288e3bc10bdSHannes Frederic Sowa 12894b32b5adSMartin KaFai Lau rt6_dst_from_metrics_check(rt); 12904b32b5adSMartin KaFai Lau 1291d52d3997SMartin KaFai Lau if ((rt->rt6i_flags & RTF_PCPU) || unlikely(dst->flags & DST_NOCACHE)) 12923da59bd9SMartin KaFai Lau return rt6_dst_from_check(rt, cookie); 12933da59bd9SMartin KaFai Lau else 12943da59bd9SMartin KaFai Lau return rt6_check(rt, cookie); 12951da177e4SLinus Torvalds } 12961da177e4SLinus Torvalds 12971da177e4SLinus Torvalds static struct dst_entry *ip6_negative_advice(struct dst_entry *dst) 12981da177e4SLinus Torvalds { 12991da177e4SLinus Torvalds struct rt6_info *rt = (struct rt6_info *) dst; 13001da177e4SLinus Torvalds 13011da177e4SLinus Torvalds if (rt) { 130254c1a859SYOSHIFUJI Hideaki / 吉藤英明 if (rt->rt6i_flags & RTF_CACHE) { 130354c1a859SYOSHIFUJI Hideaki / 吉藤英明 if (rt6_check_expired(rt)) { 1304e0a1ad73SThomas Graf ip6_del_rt(rt); 130554c1a859SYOSHIFUJI Hideaki / 吉藤英明 dst = NULL; 13061da177e4SLinus Torvalds } 130754c1a859SYOSHIFUJI Hideaki / 吉藤英明 } else { 130854c1a859SYOSHIFUJI Hideaki / 吉藤英明 dst_release(dst); 130954c1a859SYOSHIFUJI Hideaki / 吉藤英明 dst = NULL; 131054c1a859SYOSHIFUJI Hideaki / 吉藤英明 } 131154c1a859SYOSHIFUJI Hideaki / 吉藤英明 } 131254c1a859SYOSHIFUJI Hideaki / 吉藤英明 return dst; 13131da177e4SLinus Torvalds } 13141da177e4SLinus Torvalds 13151da177e4SLinus Torvalds static void ip6_link_failure(struct sk_buff *skb) 13161da177e4SLinus Torvalds { 13171da177e4SLinus Torvalds struct rt6_info *rt; 13181da177e4SLinus Torvalds 13193ffe533cSAlexey Dobriyan icmpv6_send(skb, ICMPV6_DEST_UNREACH, ICMPV6_ADDR_UNREACH, 0); 13201da177e4SLinus Torvalds 1321adf30907SEric Dumazet rt = (struct rt6_info *) skb_dst(skb); 13221da177e4SLinus Torvalds if (rt) { 13231eb4f758SHannes Frederic Sowa if (rt->rt6i_flags & RTF_CACHE) { 13241eb4f758SHannes Frederic Sowa dst_hold(&rt->dst); 13251eb4f758SHannes Frederic Sowa if (ip6_del_rt(rt)) 13261eb4f758SHannes Frederic Sowa dst_free(&rt->dst); 13271eb4f758SHannes Frederic Sowa } else if (rt->rt6i_node && (rt->rt6i_flags & RTF_DEFAULT)) { 13281da177e4SLinus Torvalds rt->rt6i_node->fn_sernum = -1; 13291da177e4SLinus Torvalds } 13301da177e4SLinus Torvalds } 13311eb4f758SHannes Frederic Sowa } 13321da177e4SLinus Torvalds 133345e4fd26SMartin KaFai Lau static void rt6_do_update_pmtu(struct rt6_info *rt, u32 mtu) 133445e4fd26SMartin KaFai Lau { 133545e4fd26SMartin KaFai Lau struct net *net = dev_net(rt->dst.dev); 133645e4fd26SMartin KaFai Lau 133745e4fd26SMartin KaFai Lau rt->rt6i_flags |= RTF_MODIFIED; 133845e4fd26SMartin KaFai Lau rt->rt6i_pmtu = mtu; 133945e4fd26SMartin KaFai Lau rt6_update_expires(rt, net->ipv6.sysctl.ip6_rt_mtu_expires); 134045e4fd26SMartin KaFai Lau } 134145e4fd26SMartin KaFai Lau 134245e4fd26SMartin KaFai Lau static void __ip6_rt_update_pmtu(struct dst_entry *dst, const struct sock *sk, 134345e4fd26SMartin KaFai Lau const struct ipv6hdr *iph, u32 mtu) 13441da177e4SLinus Torvalds { 13451da177e4SLinus Torvalds struct rt6_info *rt6 = (struct rt6_info *)dst; 13461da177e4SLinus Torvalds 134745e4fd26SMartin KaFai Lau if (rt6->rt6i_flags & RTF_LOCAL) 134845e4fd26SMartin KaFai Lau return; 134945e4fd26SMartin KaFai Lau 135081aded24SDavid S. Miller dst_confirm(dst); 135145e4fd26SMartin KaFai Lau mtu = max_t(u32, mtu, IPV6_MIN_MTU); 135245e4fd26SMartin KaFai Lau if (mtu >= dst_mtu(dst)) 135345e4fd26SMartin KaFai Lau return; 135481aded24SDavid S. Miller 135545e4fd26SMartin KaFai Lau if (rt6->rt6i_flags & RTF_CACHE) { 135645e4fd26SMartin KaFai Lau rt6_do_update_pmtu(rt6, mtu); 135745e4fd26SMartin KaFai Lau } else { 135845e4fd26SMartin KaFai Lau const struct in6_addr *daddr, *saddr; 135945e4fd26SMartin KaFai Lau struct rt6_info *nrt6; 13609d289715SHagen Paul Pfeifer 136145e4fd26SMartin KaFai Lau if (iph) { 136245e4fd26SMartin KaFai Lau daddr = &iph->daddr; 136345e4fd26SMartin KaFai Lau saddr = &iph->saddr; 136445e4fd26SMartin KaFai Lau } else if (sk) { 136545e4fd26SMartin KaFai Lau daddr = &sk->sk_v6_daddr; 136645e4fd26SMartin KaFai Lau saddr = &inet6_sk(sk)->saddr; 136745e4fd26SMartin KaFai Lau } else { 136845e4fd26SMartin KaFai Lau return; 13691da177e4SLinus Torvalds } 137045e4fd26SMartin KaFai Lau nrt6 = ip6_rt_cache_alloc(rt6, daddr, saddr); 137145e4fd26SMartin KaFai Lau if (nrt6) { 137245e4fd26SMartin KaFai Lau rt6_do_update_pmtu(nrt6, mtu); 137345e4fd26SMartin KaFai Lau 137445e4fd26SMartin KaFai Lau /* ip6_ins_rt(nrt6) will bump the 137545e4fd26SMartin KaFai Lau * rt6->rt6i_node->fn_sernum 137645e4fd26SMartin KaFai Lau * which will fail the next rt6_check() and 137745e4fd26SMartin KaFai Lau * invalidate the sk->sk_dst_cache. 137845e4fd26SMartin KaFai Lau */ 137945e4fd26SMartin KaFai Lau ip6_ins_rt(nrt6); 138045e4fd26SMartin KaFai Lau } 138145e4fd26SMartin KaFai Lau } 138245e4fd26SMartin KaFai Lau } 138345e4fd26SMartin KaFai Lau 138445e4fd26SMartin KaFai Lau static void ip6_rt_update_pmtu(struct dst_entry *dst, struct sock *sk, 138545e4fd26SMartin KaFai Lau struct sk_buff *skb, u32 mtu) 138645e4fd26SMartin KaFai Lau { 138745e4fd26SMartin KaFai Lau __ip6_rt_update_pmtu(dst, sk, skb ? ipv6_hdr(skb) : NULL, mtu); 13881da177e4SLinus Torvalds } 13891da177e4SLinus Torvalds 139042ae66c8SDavid S. Miller void ip6_update_pmtu(struct sk_buff *skb, struct net *net, __be32 mtu, 139142ae66c8SDavid S. Miller int oif, u32 mark) 139281aded24SDavid S. Miller { 139381aded24SDavid S. Miller const struct ipv6hdr *iph = (struct ipv6hdr *) skb->data; 139481aded24SDavid S. Miller struct dst_entry *dst; 139581aded24SDavid S. Miller struct flowi6 fl6; 139681aded24SDavid S. Miller 139781aded24SDavid S. Miller memset(&fl6, 0, sizeof(fl6)); 139881aded24SDavid S. Miller fl6.flowi6_oif = oif; 13991b3c61dcSLorenzo Colitti fl6.flowi6_mark = mark ? mark : IP6_REPLY_MARK(net, skb->mark); 140081aded24SDavid S. Miller fl6.daddr = iph->daddr; 140181aded24SDavid S. Miller fl6.saddr = iph->saddr; 14026502ca52SYOSHIFUJI Hideaki / 吉藤英明 fl6.flowlabel = ip6_flowinfo(iph); 140381aded24SDavid S. Miller 140481aded24SDavid S. Miller dst = ip6_route_output(net, NULL, &fl6); 140581aded24SDavid S. Miller if (!dst->error) 140645e4fd26SMartin KaFai Lau __ip6_rt_update_pmtu(dst, NULL, iph, ntohl(mtu)); 140781aded24SDavid S. Miller dst_release(dst); 140881aded24SDavid S. Miller } 140981aded24SDavid S. Miller EXPORT_SYMBOL_GPL(ip6_update_pmtu); 141081aded24SDavid S. Miller 141181aded24SDavid S. Miller void ip6_sk_update_pmtu(struct sk_buff *skb, struct sock *sk, __be32 mtu) 141281aded24SDavid S. Miller { 141381aded24SDavid S. Miller ip6_update_pmtu(skb, sock_net(sk), mtu, 141481aded24SDavid S. Miller sk->sk_bound_dev_if, sk->sk_mark); 141581aded24SDavid S. Miller } 141681aded24SDavid S. Miller EXPORT_SYMBOL_GPL(ip6_sk_update_pmtu); 141781aded24SDavid S. Miller 1418b55b76b2SDuan Jiong /* Handle redirects */ 1419b55b76b2SDuan Jiong struct ip6rd_flowi { 1420b55b76b2SDuan Jiong struct flowi6 fl6; 1421b55b76b2SDuan Jiong struct in6_addr gateway; 1422b55b76b2SDuan Jiong }; 1423b55b76b2SDuan Jiong 1424b55b76b2SDuan Jiong static struct rt6_info *__ip6_route_redirect(struct net *net, 1425b55b76b2SDuan Jiong struct fib6_table *table, 1426b55b76b2SDuan Jiong struct flowi6 *fl6, 1427b55b76b2SDuan Jiong int flags) 1428b55b76b2SDuan Jiong { 1429b55b76b2SDuan Jiong struct ip6rd_flowi *rdfl = (struct ip6rd_flowi *)fl6; 1430b55b76b2SDuan Jiong struct rt6_info *rt; 1431b55b76b2SDuan Jiong struct fib6_node *fn; 1432b55b76b2SDuan Jiong 1433b55b76b2SDuan Jiong /* Get the "current" route for this destination and 1434b55b76b2SDuan Jiong * check if the redirect has come from approriate router. 1435b55b76b2SDuan Jiong * 1436b55b76b2SDuan Jiong * RFC 4861 specifies that redirects should only be 1437b55b76b2SDuan Jiong * accepted if they come from the nexthop to the target. 1438b55b76b2SDuan Jiong * Due to the way the routes are chosen, this notion 1439b55b76b2SDuan Jiong * is a bit fuzzy and one might need to check all possible 1440b55b76b2SDuan Jiong * routes. 1441b55b76b2SDuan Jiong */ 1442b55b76b2SDuan Jiong 1443b55b76b2SDuan Jiong read_lock_bh(&table->tb6_lock); 1444b55b76b2SDuan Jiong fn = fib6_lookup(&table->tb6_root, &fl6->daddr, &fl6->saddr); 1445b55b76b2SDuan Jiong restart: 1446b55b76b2SDuan Jiong for (rt = fn->leaf; rt; rt = rt->dst.rt6_next) { 1447b55b76b2SDuan Jiong if (rt6_check_expired(rt)) 1448b55b76b2SDuan Jiong continue; 1449b55b76b2SDuan Jiong if (rt->dst.error) 1450b55b76b2SDuan Jiong break; 1451b55b76b2SDuan Jiong if (!(rt->rt6i_flags & RTF_GATEWAY)) 1452b55b76b2SDuan Jiong continue; 1453b55b76b2SDuan Jiong if (fl6->flowi6_oif != rt->dst.dev->ifindex) 1454b55b76b2SDuan Jiong continue; 1455b55b76b2SDuan Jiong if (!ipv6_addr_equal(&rdfl->gateway, &rt->rt6i_gateway)) 1456b55b76b2SDuan Jiong continue; 1457b55b76b2SDuan Jiong break; 1458b55b76b2SDuan Jiong } 1459b55b76b2SDuan Jiong 1460b55b76b2SDuan Jiong if (!rt) 1461b55b76b2SDuan Jiong rt = net->ipv6.ip6_null_entry; 1462b55b76b2SDuan Jiong else if (rt->dst.error) { 1463b55b76b2SDuan Jiong rt = net->ipv6.ip6_null_entry; 1464b0a1ba59SMartin KaFai Lau goto out; 1465b0a1ba59SMartin KaFai Lau } 1466b0a1ba59SMartin KaFai Lau 1467b0a1ba59SMartin KaFai Lau if (rt == net->ipv6.ip6_null_entry) { 1468a3c00e46SMartin KaFai Lau fn = fib6_backtrack(fn, &fl6->saddr); 1469a3c00e46SMartin KaFai Lau if (fn) 1470a3c00e46SMartin KaFai Lau goto restart; 1471b55b76b2SDuan Jiong } 1472a3c00e46SMartin KaFai Lau 1473b0a1ba59SMartin KaFai Lau out: 1474b55b76b2SDuan Jiong dst_hold(&rt->dst); 1475b55b76b2SDuan Jiong 1476b55b76b2SDuan Jiong read_unlock_bh(&table->tb6_lock); 1477b55b76b2SDuan Jiong 1478b55b76b2SDuan Jiong return rt; 1479b55b76b2SDuan Jiong }; 1480b55b76b2SDuan Jiong 1481b55b76b2SDuan Jiong static struct dst_entry *ip6_route_redirect(struct net *net, 1482b55b76b2SDuan Jiong const struct flowi6 *fl6, 1483b55b76b2SDuan Jiong const struct in6_addr *gateway) 1484b55b76b2SDuan Jiong { 1485b55b76b2SDuan Jiong int flags = RT6_LOOKUP_F_HAS_SADDR; 1486b55b76b2SDuan Jiong struct ip6rd_flowi rdfl; 1487b55b76b2SDuan Jiong 1488b55b76b2SDuan Jiong rdfl.fl6 = *fl6; 1489b55b76b2SDuan Jiong rdfl.gateway = *gateway; 1490b55b76b2SDuan Jiong 1491b55b76b2SDuan Jiong return fib6_rule_lookup(net, &rdfl.fl6, 1492b55b76b2SDuan Jiong flags, __ip6_route_redirect); 1493b55b76b2SDuan Jiong } 1494b55b76b2SDuan Jiong 14953a5ad2eeSDavid S. Miller void ip6_redirect(struct sk_buff *skb, struct net *net, int oif, u32 mark) 14963a5ad2eeSDavid S. Miller { 14973a5ad2eeSDavid S. Miller const struct ipv6hdr *iph = (struct ipv6hdr *) skb->data; 14983a5ad2eeSDavid S. Miller struct dst_entry *dst; 14993a5ad2eeSDavid S. Miller struct flowi6 fl6; 15003a5ad2eeSDavid S. Miller 15013a5ad2eeSDavid S. Miller memset(&fl6, 0, sizeof(fl6)); 1502e374c618SJulian Anastasov fl6.flowi6_iif = LOOPBACK_IFINDEX; 15033a5ad2eeSDavid S. Miller fl6.flowi6_oif = oif; 15043a5ad2eeSDavid S. Miller fl6.flowi6_mark = mark; 15053a5ad2eeSDavid S. Miller fl6.daddr = iph->daddr; 15063a5ad2eeSDavid S. Miller fl6.saddr = iph->saddr; 15076502ca52SYOSHIFUJI Hideaki / 吉藤英明 fl6.flowlabel = ip6_flowinfo(iph); 15083a5ad2eeSDavid S. Miller 1509b55b76b2SDuan Jiong dst = ip6_route_redirect(net, &fl6, &ipv6_hdr(skb)->saddr); 15106700c270SDavid S. Miller rt6_do_redirect(dst, NULL, skb); 15113a5ad2eeSDavid S. Miller dst_release(dst); 15123a5ad2eeSDavid S. Miller } 15133a5ad2eeSDavid S. Miller EXPORT_SYMBOL_GPL(ip6_redirect); 15143a5ad2eeSDavid S. Miller 1515c92a59ecSDuan Jiong void ip6_redirect_no_header(struct sk_buff *skb, struct net *net, int oif, 1516c92a59ecSDuan Jiong u32 mark) 1517c92a59ecSDuan Jiong { 1518c92a59ecSDuan Jiong const struct ipv6hdr *iph = ipv6_hdr(skb); 1519c92a59ecSDuan Jiong const struct rd_msg *msg = (struct rd_msg *)icmp6_hdr(skb); 1520c92a59ecSDuan Jiong struct dst_entry *dst; 1521c92a59ecSDuan Jiong struct flowi6 fl6; 1522c92a59ecSDuan Jiong 1523c92a59ecSDuan Jiong memset(&fl6, 0, sizeof(fl6)); 1524e374c618SJulian Anastasov fl6.flowi6_iif = LOOPBACK_IFINDEX; 1525c92a59ecSDuan Jiong fl6.flowi6_oif = oif; 1526c92a59ecSDuan Jiong fl6.flowi6_mark = mark; 1527c92a59ecSDuan Jiong fl6.daddr = msg->dest; 1528c92a59ecSDuan Jiong fl6.saddr = iph->daddr; 1529c92a59ecSDuan Jiong 1530b55b76b2SDuan Jiong dst = ip6_route_redirect(net, &fl6, &iph->saddr); 1531c92a59ecSDuan Jiong rt6_do_redirect(dst, NULL, skb); 1532c92a59ecSDuan Jiong dst_release(dst); 1533c92a59ecSDuan Jiong } 1534c92a59ecSDuan Jiong 15353a5ad2eeSDavid S. Miller void ip6_sk_redirect(struct sk_buff *skb, struct sock *sk) 15363a5ad2eeSDavid S. Miller { 15373a5ad2eeSDavid S. Miller ip6_redirect(skb, sock_net(sk), sk->sk_bound_dev_if, sk->sk_mark); 15383a5ad2eeSDavid S. Miller } 15393a5ad2eeSDavid S. Miller EXPORT_SYMBOL_GPL(ip6_sk_redirect); 15403a5ad2eeSDavid S. Miller 15410dbaee3bSDavid S. Miller static unsigned int ip6_default_advmss(const struct dst_entry *dst) 15421da177e4SLinus Torvalds { 15430dbaee3bSDavid S. Miller struct net_device *dev = dst->dev; 15440dbaee3bSDavid S. Miller unsigned int mtu = dst_mtu(dst); 15450dbaee3bSDavid S. Miller struct net *net = dev_net(dev); 15460dbaee3bSDavid S. Miller 15471da177e4SLinus Torvalds mtu -= sizeof(struct ipv6hdr) + sizeof(struct tcphdr); 15481da177e4SLinus Torvalds 15495578689aSDaniel Lezcano if (mtu < net->ipv6.sysctl.ip6_rt_min_advmss) 15505578689aSDaniel Lezcano mtu = net->ipv6.sysctl.ip6_rt_min_advmss; 15511da177e4SLinus Torvalds 15521da177e4SLinus Torvalds /* 15531da177e4SLinus Torvalds * Maximal non-jumbo IPv6 payload is IPV6_MAXPLEN and 15541da177e4SLinus Torvalds * corresponding MSS is IPV6_MAXPLEN - tcp_header_size. 15551da177e4SLinus Torvalds * IPV6_MAXPLEN is also valid and means: "any MSS, 15561da177e4SLinus Torvalds * rely only on pmtu discovery" 15571da177e4SLinus Torvalds */ 15581da177e4SLinus Torvalds if (mtu > IPV6_MAXPLEN - sizeof(struct tcphdr)) 15591da177e4SLinus Torvalds mtu = IPV6_MAXPLEN; 15601da177e4SLinus Torvalds return mtu; 15611da177e4SLinus Torvalds } 15621da177e4SLinus Torvalds 1563ebb762f2SSteffen Klassert static unsigned int ip6_mtu(const struct dst_entry *dst) 1564d33e4553SDavid S. Miller { 15654b32b5adSMartin KaFai Lau const struct rt6_info *rt = (const struct rt6_info *)dst; 15664b32b5adSMartin KaFai Lau unsigned int mtu = rt->rt6i_pmtu; 1567d33e4553SDavid S. Miller struct inet6_dev *idev; 1568618f9bc7SSteffen Klassert 1569618f9bc7SSteffen Klassert if (mtu) 157030f78d8eSEric Dumazet goto out; 1571618f9bc7SSteffen Klassert 15724b32b5adSMartin KaFai Lau mtu = dst_metric_raw(dst, RTAX_MTU); 15734b32b5adSMartin KaFai Lau if (mtu) 15744b32b5adSMartin KaFai Lau goto out; 15754b32b5adSMartin KaFai Lau 1576618f9bc7SSteffen Klassert mtu = IPV6_MIN_MTU; 1577d33e4553SDavid S. Miller 1578d33e4553SDavid S. Miller rcu_read_lock(); 1579d33e4553SDavid S. Miller idev = __in6_dev_get(dst->dev); 1580d33e4553SDavid S. Miller if (idev) 1581d33e4553SDavid S. Miller mtu = idev->cnf.mtu6; 1582d33e4553SDavid S. Miller rcu_read_unlock(); 1583d33e4553SDavid S. Miller 158430f78d8eSEric Dumazet out: 158530f78d8eSEric Dumazet return min_t(unsigned int, mtu, IP6_MAX_MTU); 1586d33e4553SDavid S. Miller } 1587d33e4553SDavid S. Miller 15883b00944cSYOSHIFUJI Hideaki static struct dst_entry *icmp6_dst_gc_list; 15893b00944cSYOSHIFUJI Hideaki static DEFINE_SPINLOCK(icmp6_dst_lock); 15905d0bbeebSThomas Graf 15913b00944cSYOSHIFUJI Hideaki struct dst_entry *icmp6_dst_alloc(struct net_device *dev, 159287a11578SDavid S. Miller struct flowi6 *fl6) 15931da177e4SLinus Torvalds { 159487a11578SDavid S. Miller struct dst_entry *dst; 15951da177e4SLinus Torvalds struct rt6_info *rt; 15961da177e4SLinus Torvalds struct inet6_dev *idev = in6_dev_get(dev); 1597c346dca1SYOSHIFUJI Hideaki struct net *net = dev_net(dev); 15981da177e4SLinus Torvalds 159938308473SDavid S. Miller if (unlikely(!idev)) 1600122bdf67SEric Dumazet return ERR_PTR(-ENODEV); 16011da177e4SLinus Torvalds 1602ad706862SMartin KaFai Lau rt = ip6_dst_alloc(net, dev, 0); 160338308473SDavid S. Miller if (unlikely(!rt)) { 16041da177e4SLinus Torvalds in6_dev_put(idev); 160587a11578SDavid S. Miller dst = ERR_PTR(-ENOMEM); 16061da177e4SLinus Torvalds goto out; 16071da177e4SLinus Torvalds } 16081da177e4SLinus Torvalds 16098e2ec639SYan, Zheng rt->dst.flags |= DST_HOST; 16108e2ec639SYan, Zheng rt->dst.output = ip6_output; 1611d8d1f30bSChangli Gao atomic_set(&rt->dst.__refcnt, 1); 1612550bab42SJulian Anastasov rt->rt6i_gateway = fl6->daddr; 161387a11578SDavid S. Miller rt->rt6i_dst.addr = fl6->daddr; 16148e2ec639SYan, Zheng rt->rt6i_dst.plen = 128; 16158e2ec639SYan, Zheng rt->rt6i_idev = idev; 161614edd87dSLi RongQing dst_metric_set(&rt->dst, RTAX_HOPLIMIT, 0); 16171da177e4SLinus Torvalds 16183b00944cSYOSHIFUJI Hideaki spin_lock_bh(&icmp6_dst_lock); 1619d8d1f30bSChangli Gao rt->dst.next = icmp6_dst_gc_list; 1620d8d1f30bSChangli Gao icmp6_dst_gc_list = &rt->dst; 16213b00944cSYOSHIFUJI Hideaki spin_unlock_bh(&icmp6_dst_lock); 16221da177e4SLinus Torvalds 16235578689aSDaniel Lezcano fib6_force_start_gc(net); 16241da177e4SLinus Torvalds 162587a11578SDavid S. Miller dst = xfrm_lookup(net, &rt->dst, flowi6_to_flowi(fl6), NULL, 0); 162687a11578SDavid S. Miller 16271da177e4SLinus Torvalds out: 162887a11578SDavid S. Miller return dst; 16291da177e4SLinus Torvalds } 16301da177e4SLinus Torvalds 16313d0f24a7SStephen Hemminger int icmp6_dst_gc(void) 16321da177e4SLinus Torvalds { 1633e9476e95SHagen Paul Pfeifer struct dst_entry *dst, **pprev; 16343d0f24a7SStephen Hemminger int more = 0; 16351da177e4SLinus Torvalds 16363b00944cSYOSHIFUJI Hideaki spin_lock_bh(&icmp6_dst_lock); 16373b00944cSYOSHIFUJI Hideaki pprev = &icmp6_dst_gc_list; 16385d0bbeebSThomas Graf 16391da177e4SLinus Torvalds while ((dst = *pprev) != NULL) { 16401da177e4SLinus Torvalds if (!atomic_read(&dst->__refcnt)) { 16411da177e4SLinus Torvalds *pprev = dst->next; 16421da177e4SLinus Torvalds dst_free(dst); 16431da177e4SLinus Torvalds } else { 16441da177e4SLinus Torvalds pprev = &dst->next; 16453d0f24a7SStephen Hemminger ++more; 16461da177e4SLinus Torvalds } 16471da177e4SLinus Torvalds } 16481da177e4SLinus Torvalds 16493b00944cSYOSHIFUJI Hideaki spin_unlock_bh(&icmp6_dst_lock); 16505d0bbeebSThomas Graf 16513d0f24a7SStephen Hemminger return more; 16521da177e4SLinus Torvalds } 16531da177e4SLinus Torvalds 16541e493d19SDavid S. Miller static void icmp6_clean_all(int (*func)(struct rt6_info *rt, void *arg), 16551e493d19SDavid S. Miller void *arg) 16561e493d19SDavid S. Miller { 16571e493d19SDavid S. Miller struct dst_entry *dst, **pprev; 16581e493d19SDavid S. Miller 16591e493d19SDavid S. Miller spin_lock_bh(&icmp6_dst_lock); 16601e493d19SDavid S. Miller pprev = &icmp6_dst_gc_list; 16611e493d19SDavid S. Miller while ((dst = *pprev) != NULL) { 16621e493d19SDavid S. Miller struct rt6_info *rt = (struct rt6_info *) dst; 16631e493d19SDavid S. Miller if (func(rt, arg)) { 16641e493d19SDavid S. Miller *pprev = dst->next; 16651e493d19SDavid S. Miller dst_free(dst); 16661e493d19SDavid S. Miller } else { 16671e493d19SDavid S. Miller pprev = &dst->next; 16681e493d19SDavid S. Miller } 16691e493d19SDavid S. Miller } 16701e493d19SDavid S. Miller spin_unlock_bh(&icmp6_dst_lock); 16711e493d19SDavid S. Miller } 16721e493d19SDavid S. Miller 1673569d3645SDaniel Lezcano static int ip6_dst_gc(struct dst_ops *ops) 16741da177e4SLinus Torvalds { 167586393e52SAlexey Dobriyan struct net *net = container_of(ops, struct net, ipv6.ip6_dst_ops); 16767019b78eSDaniel Lezcano int rt_min_interval = net->ipv6.sysctl.ip6_rt_gc_min_interval; 16777019b78eSDaniel Lezcano int rt_max_size = net->ipv6.sysctl.ip6_rt_max_size; 16787019b78eSDaniel Lezcano int rt_elasticity = net->ipv6.sysctl.ip6_rt_gc_elasticity; 16797019b78eSDaniel Lezcano int rt_gc_timeout = net->ipv6.sysctl.ip6_rt_gc_timeout; 16807019b78eSDaniel Lezcano unsigned long rt_last_gc = net->ipv6.ip6_rt_last_gc; 1681fc66f95cSEric Dumazet int entries; 16821da177e4SLinus Torvalds 1683fc66f95cSEric Dumazet entries = dst_entries_get_fast(ops); 168449a18d86SMichal Kubeček if (time_after(rt_last_gc + rt_min_interval, jiffies) && 1685fc66f95cSEric Dumazet entries <= rt_max_size) 16861da177e4SLinus Torvalds goto out; 16871da177e4SLinus Torvalds 16886891a346SBenjamin Thery net->ipv6.ip6_rt_gc_expire++; 168914956643SLi RongQing fib6_run_gc(net->ipv6.ip6_rt_gc_expire, net, true); 1690fc66f95cSEric Dumazet entries = dst_entries_get_slow(ops); 1691fc66f95cSEric Dumazet if (entries < ops->gc_thresh) 16927019b78eSDaniel Lezcano net->ipv6.ip6_rt_gc_expire = rt_gc_timeout>>1; 16931da177e4SLinus Torvalds out: 16947019b78eSDaniel Lezcano net->ipv6.ip6_rt_gc_expire -= net->ipv6.ip6_rt_gc_expire>>rt_elasticity; 1695fc66f95cSEric Dumazet return entries > rt_max_size; 16961da177e4SLinus Torvalds } 16971da177e4SLinus Torvalds 1698e715b6d3SFlorian Westphal static int ip6_convert_metrics(struct mx6_config *mxc, 1699e715b6d3SFlorian Westphal const struct fib6_config *cfg) 1700e715b6d3SFlorian Westphal { 1701*c3a8d947SDaniel Borkmann bool ecn_ca = false; 1702e715b6d3SFlorian Westphal struct nlattr *nla; 1703e715b6d3SFlorian Westphal int remaining; 1704e715b6d3SFlorian Westphal u32 *mp; 1705e715b6d3SFlorian Westphal 170663159f29SIan Morris if (!cfg->fc_mx) 1707e715b6d3SFlorian Westphal return 0; 1708e715b6d3SFlorian Westphal 1709e715b6d3SFlorian Westphal mp = kzalloc(sizeof(u32) * RTAX_MAX, GFP_KERNEL); 1710e715b6d3SFlorian Westphal if (unlikely(!mp)) 1711e715b6d3SFlorian Westphal return -ENOMEM; 1712e715b6d3SFlorian Westphal 1713e715b6d3SFlorian Westphal nla_for_each_attr(nla, cfg->fc_mx, cfg->fc_mx_len, remaining) { 1714e715b6d3SFlorian Westphal int type = nla_type(nla); 1715ea697639SDaniel Borkmann u32 val; 1716ea697639SDaniel Borkmann 17171bb14807SDaniel Borkmann if (!type) 17181bb14807SDaniel Borkmann continue; 1719e715b6d3SFlorian Westphal if (unlikely(type > RTAX_MAX)) 1720e715b6d3SFlorian Westphal goto err; 17211bb14807SDaniel Borkmann 1722ea697639SDaniel Borkmann if (type == RTAX_CC_ALGO) { 1723ea697639SDaniel Borkmann char tmp[TCP_CA_NAME_MAX]; 1724e715b6d3SFlorian Westphal 1725ea697639SDaniel Borkmann nla_strlcpy(tmp, nla, sizeof(tmp)); 1726*c3a8d947SDaniel Borkmann val = tcp_ca_get_key_by_name(tmp, &ecn_ca); 1727ea697639SDaniel Borkmann if (val == TCP_CA_UNSPEC) 1728ea697639SDaniel Borkmann goto err; 1729ea697639SDaniel Borkmann } else { 1730ea697639SDaniel Borkmann val = nla_get_u32(nla); 1731ea697639SDaniel Borkmann } 1732b8d3e416SDaniel Borkmann if (type == RTAX_FEATURES && (val & ~RTAX_FEATURE_MASK)) 1733b8d3e416SDaniel Borkmann goto err; 1734ea697639SDaniel Borkmann 1735ea697639SDaniel Borkmann mp[type - 1] = val; 1736e715b6d3SFlorian Westphal __set_bit(type - 1, mxc->mx_valid); 1737e715b6d3SFlorian Westphal } 1738e715b6d3SFlorian Westphal 1739*c3a8d947SDaniel Borkmann if (ecn_ca) { 1740*c3a8d947SDaniel Borkmann __set_bit(RTAX_FEATURES - 1, mxc->mx_valid); 1741*c3a8d947SDaniel Borkmann mp[RTAX_FEATURES - 1] |= DST_FEATURE_ECN_CA; 1742*c3a8d947SDaniel Borkmann } 1743e715b6d3SFlorian Westphal 1744*c3a8d947SDaniel Borkmann mxc->mx = mp; 1745e715b6d3SFlorian Westphal return 0; 1746e715b6d3SFlorian Westphal err: 1747e715b6d3SFlorian Westphal kfree(mp); 1748e715b6d3SFlorian Westphal return -EINVAL; 1749e715b6d3SFlorian Westphal } 17501da177e4SLinus Torvalds 175186872cb5SThomas Graf int ip6_route_add(struct fib6_config *cfg) 17521da177e4SLinus Torvalds { 17531da177e4SLinus Torvalds int err; 17545578689aSDaniel Lezcano struct net *net = cfg->fc_nlinfo.nl_net; 17551da177e4SLinus Torvalds struct rt6_info *rt = NULL; 17561da177e4SLinus Torvalds struct net_device *dev = NULL; 17571da177e4SLinus Torvalds struct inet6_dev *idev = NULL; 1758c71099acSThomas Graf struct fib6_table *table; 1759e715b6d3SFlorian Westphal struct mx6_config mxc = { .mx = NULL, }; 17601da177e4SLinus Torvalds int addr_type; 17611da177e4SLinus Torvalds 176286872cb5SThomas Graf if (cfg->fc_dst_len > 128 || cfg->fc_src_len > 128) 17631da177e4SLinus Torvalds return -EINVAL; 17641da177e4SLinus Torvalds #ifndef CONFIG_IPV6_SUBTREES 176586872cb5SThomas Graf if (cfg->fc_src_len) 17661da177e4SLinus Torvalds return -EINVAL; 17671da177e4SLinus Torvalds #endif 176886872cb5SThomas Graf if (cfg->fc_ifindex) { 17691da177e4SLinus Torvalds err = -ENODEV; 17705578689aSDaniel Lezcano dev = dev_get_by_index(net, cfg->fc_ifindex); 17711da177e4SLinus Torvalds if (!dev) 17721da177e4SLinus Torvalds goto out; 17731da177e4SLinus Torvalds idev = in6_dev_get(dev); 17741da177e4SLinus Torvalds if (!idev) 17751da177e4SLinus Torvalds goto out; 17761da177e4SLinus Torvalds } 17771da177e4SLinus Torvalds 177886872cb5SThomas Graf if (cfg->fc_metric == 0) 177986872cb5SThomas Graf cfg->fc_metric = IP6_RT_PRIO_USER; 17801da177e4SLinus Torvalds 1781c71099acSThomas Graf err = -ENOBUFS; 178238308473SDavid S. Miller if (cfg->fc_nlinfo.nlh && 1783d71314b4SMatti Vaittinen !(cfg->fc_nlinfo.nlh->nlmsg_flags & NLM_F_CREATE)) { 1784d71314b4SMatti Vaittinen table = fib6_get_table(net, cfg->fc_table); 178538308473SDavid S. Miller if (!table) { 1786f3213831SJoe Perches pr_warn("NLM_F_CREATE should be specified when creating new route\n"); 1787d71314b4SMatti Vaittinen table = fib6_new_table(net, cfg->fc_table); 1788d71314b4SMatti Vaittinen } 1789d71314b4SMatti Vaittinen } else { 1790d71314b4SMatti Vaittinen table = fib6_new_table(net, cfg->fc_table); 1791d71314b4SMatti Vaittinen } 179238308473SDavid S. Miller 179338308473SDavid S. Miller if (!table) 1794c71099acSThomas Graf goto out; 1795c71099acSThomas Graf 1796ad706862SMartin KaFai Lau rt = ip6_dst_alloc(net, NULL, 1797ad706862SMartin KaFai Lau (cfg->fc_flags & RTF_ADDRCONF) ? 0 : DST_NOCOUNT); 17981da177e4SLinus Torvalds 179938308473SDavid S. Miller if (!rt) { 18001da177e4SLinus Torvalds err = -ENOMEM; 18011da177e4SLinus Torvalds goto out; 18021da177e4SLinus Torvalds } 18031da177e4SLinus Torvalds 18041716a961SGao feng if (cfg->fc_flags & RTF_EXPIRES) 18051716a961SGao feng rt6_set_expires(rt, jiffies + 18061716a961SGao feng clock_t_to_jiffies(cfg->fc_expires)); 18071716a961SGao feng else 18081716a961SGao feng rt6_clean_expires(rt); 18091da177e4SLinus Torvalds 181086872cb5SThomas Graf if (cfg->fc_protocol == RTPROT_UNSPEC) 181186872cb5SThomas Graf cfg->fc_protocol = RTPROT_BOOT; 181286872cb5SThomas Graf rt->rt6i_protocol = cfg->fc_protocol; 181386872cb5SThomas Graf 181486872cb5SThomas Graf addr_type = ipv6_addr_type(&cfg->fc_dst); 18151da177e4SLinus Torvalds 18161da177e4SLinus Torvalds if (addr_type & IPV6_ADDR_MULTICAST) 1817d8d1f30bSChangli Gao rt->dst.input = ip6_mc_input; 1818ab79ad14SMaciej Żenczykowski else if (cfg->fc_flags & RTF_LOCAL) 1819ab79ad14SMaciej Żenczykowski rt->dst.input = ip6_input; 18201da177e4SLinus Torvalds else 1821d8d1f30bSChangli Gao rt->dst.input = ip6_forward; 18221da177e4SLinus Torvalds 1823d8d1f30bSChangli Gao rt->dst.output = ip6_output; 18241da177e4SLinus Torvalds 182519e42e45SRoopa Prabhu if (cfg->fc_encap) { 182619e42e45SRoopa Prabhu struct lwtunnel_state *lwtstate; 182719e42e45SRoopa Prabhu 182819e42e45SRoopa Prabhu err = lwtunnel_build_state(dev, cfg->fc_encap_type, 1829127eb7cdSTom Herbert cfg->fc_encap, AF_INET6, cfg, 1830127eb7cdSTom Herbert &lwtstate); 183119e42e45SRoopa Prabhu if (err) 183219e42e45SRoopa Prabhu goto out; 183361adedf3SJiri Benc rt->dst.lwtstate = lwtstate_get(lwtstate); 183461adedf3SJiri Benc if (lwtunnel_output_redirect(rt->dst.lwtstate)) { 183561adedf3SJiri Benc rt->dst.lwtstate->orig_output = rt->dst.output; 183661adedf3SJiri Benc rt->dst.output = lwtunnel_output; 183719e42e45SRoopa Prabhu } 183861adedf3SJiri Benc if (lwtunnel_input_redirect(rt->dst.lwtstate)) { 183961adedf3SJiri Benc rt->dst.lwtstate->orig_input = rt->dst.input; 184061adedf3SJiri Benc rt->dst.input = lwtunnel_input; 184125368623STom Herbert } 184225368623STom Herbert } 184319e42e45SRoopa Prabhu 184486872cb5SThomas Graf ipv6_addr_prefix(&rt->rt6i_dst.addr, &cfg->fc_dst, cfg->fc_dst_len); 184586872cb5SThomas Graf rt->rt6i_dst.plen = cfg->fc_dst_len; 1846afc4eef8SMartin KaFai Lau if (rt->rt6i_dst.plen == 128) 184711d53b49SDavid S. Miller rt->dst.flags |= DST_HOST; 18481da177e4SLinus Torvalds 18491da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES 185086872cb5SThomas Graf ipv6_addr_prefix(&rt->rt6i_src.addr, &cfg->fc_src, cfg->fc_src_len); 185186872cb5SThomas Graf rt->rt6i_src.plen = cfg->fc_src_len; 18521da177e4SLinus Torvalds #endif 18531da177e4SLinus Torvalds 185486872cb5SThomas Graf rt->rt6i_metric = cfg->fc_metric; 18551da177e4SLinus Torvalds 18561da177e4SLinus Torvalds /* We cannot add true routes via loopback here, 18571da177e4SLinus Torvalds they would result in kernel looping; promote them to reject routes 18581da177e4SLinus Torvalds */ 185986872cb5SThomas Graf if ((cfg->fc_flags & RTF_REJECT) || 186038308473SDavid S. Miller (dev && (dev->flags & IFF_LOOPBACK) && 186138308473SDavid S. Miller !(addr_type & IPV6_ADDR_LOOPBACK) && 186238308473SDavid S. Miller !(cfg->fc_flags & RTF_LOCAL))) { 18631da177e4SLinus Torvalds /* hold loopback dev/idev if we haven't done so. */ 18645578689aSDaniel Lezcano if (dev != net->loopback_dev) { 18651da177e4SLinus Torvalds if (dev) { 18661da177e4SLinus Torvalds dev_put(dev); 18671da177e4SLinus Torvalds in6_dev_put(idev); 18681da177e4SLinus Torvalds } 18695578689aSDaniel Lezcano dev = net->loopback_dev; 18701da177e4SLinus Torvalds dev_hold(dev); 18711da177e4SLinus Torvalds idev = in6_dev_get(dev); 18721da177e4SLinus Torvalds if (!idev) { 18731da177e4SLinus Torvalds err = -ENODEV; 18741da177e4SLinus Torvalds goto out; 18751da177e4SLinus Torvalds } 18761da177e4SLinus Torvalds } 18771da177e4SLinus Torvalds rt->rt6i_flags = RTF_REJECT|RTF_NONEXTHOP; 1878ef2c7d7bSNicolas Dichtel switch (cfg->fc_type) { 1879ef2c7d7bSNicolas Dichtel case RTN_BLACKHOLE: 1880ef2c7d7bSNicolas Dichtel rt->dst.error = -EINVAL; 1881aad88724SEric Dumazet rt->dst.output = dst_discard_sk; 18827150aedeSKamala R rt->dst.input = dst_discard; 1883ef2c7d7bSNicolas Dichtel break; 1884ef2c7d7bSNicolas Dichtel case RTN_PROHIBIT: 1885ef2c7d7bSNicolas Dichtel rt->dst.error = -EACCES; 18867150aedeSKamala R rt->dst.output = ip6_pkt_prohibit_out; 18877150aedeSKamala R rt->dst.input = ip6_pkt_prohibit; 1888ef2c7d7bSNicolas Dichtel break; 1889b4949ab2SNicolas Dichtel case RTN_THROW: 1890ef2c7d7bSNicolas Dichtel default: 18917150aedeSKamala R rt->dst.error = (cfg->fc_type == RTN_THROW) ? -EAGAIN 18927150aedeSKamala R : -ENETUNREACH; 18937150aedeSKamala R rt->dst.output = ip6_pkt_discard_out; 18947150aedeSKamala R rt->dst.input = ip6_pkt_discard; 1895ef2c7d7bSNicolas Dichtel break; 1896ef2c7d7bSNicolas Dichtel } 18971da177e4SLinus Torvalds goto install_route; 18981da177e4SLinus Torvalds } 18991da177e4SLinus Torvalds 190086872cb5SThomas Graf if (cfg->fc_flags & RTF_GATEWAY) { 1901b71d1d42SEric Dumazet const struct in6_addr *gw_addr; 19021da177e4SLinus Torvalds int gwa_type; 19031da177e4SLinus Torvalds 190486872cb5SThomas Graf gw_addr = &cfg->fc_gateway; 1905330567b7SFlorian Westphal gwa_type = ipv6_addr_type(gw_addr); 190648ed7b26SFlorian Westphal 190748ed7b26SFlorian Westphal /* if gw_addr is local we will fail to detect this in case 190848ed7b26SFlorian Westphal * address is still TENTATIVE (DAD in progress). rt6_lookup() 190948ed7b26SFlorian Westphal * will return already-added prefix route via interface that 191048ed7b26SFlorian Westphal * prefix route was assigned to, which might be non-loopback. 191148ed7b26SFlorian Westphal */ 191248ed7b26SFlorian Westphal err = -EINVAL; 1913330567b7SFlorian Westphal if (ipv6_chk_addr_and_flags(net, gw_addr, 1914330567b7SFlorian Westphal gwa_type & IPV6_ADDR_LINKLOCAL ? 1915330567b7SFlorian Westphal dev : NULL, 0, 0)) 191648ed7b26SFlorian Westphal goto out; 191748ed7b26SFlorian Westphal 19184e3fd7a0SAlexey Dobriyan rt->rt6i_gateway = *gw_addr; 19191da177e4SLinus Torvalds 19201da177e4SLinus Torvalds if (gwa_type != (IPV6_ADDR_LINKLOCAL|IPV6_ADDR_UNICAST)) { 19211da177e4SLinus Torvalds struct rt6_info *grt; 19221da177e4SLinus Torvalds 19231da177e4SLinus Torvalds /* IPv6 strictly inhibits using not link-local 19241da177e4SLinus Torvalds addresses as nexthop address. 19251da177e4SLinus Torvalds Otherwise, router will not able to send redirects. 19261da177e4SLinus Torvalds It is very good, but in some (rare!) circumstances 19271da177e4SLinus Torvalds (SIT, PtP, NBMA NOARP links) it is handy to allow 19281da177e4SLinus Torvalds some exceptions. --ANK 19291da177e4SLinus Torvalds */ 19301da177e4SLinus Torvalds if (!(gwa_type & IPV6_ADDR_UNICAST)) 19311da177e4SLinus Torvalds goto out; 19321da177e4SLinus Torvalds 19335578689aSDaniel Lezcano grt = rt6_lookup(net, gw_addr, NULL, cfg->fc_ifindex, 1); 19341da177e4SLinus Torvalds 19351da177e4SLinus Torvalds err = -EHOSTUNREACH; 193638308473SDavid S. Miller if (!grt) 19371da177e4SLinus Torvalds goto out; 19381da177e4SLinus Torvalds if (dev) { 1939d1918542SDavid S. Miller if (dev != grt->dst.dev) { 194094e187c0SAmerigo Wang ip6_rt_put(grt); 19411da177e4SLinus Torvalds goto out; 19421da177e4SLinus Torvalds } 19431da177e4SLinus Torvalds } else { 1944d1918542SDavid S. Miller dev = grt->dst.dev; 19451da177e4SLinus Torvalds idev = grt->rt6i_idev; 19461da177e4SLinus Torvalds dev_hold(dev); 19471da177e4SLinus Torvalds in6_dev_hold(grt->rt6i_idev); 19481da177e4SLinus Torvalds } 19491da177e4SLinus Torvalds if (!(grt->rt6i_flags & RTF_GATEWAY)) 19501da177e4SLinus Torvalds err = 0; 195194e187c0SAmerigo Wang ip6_rt_put(grt); 19521da177e4SLinus Torvalds 19531da177e4SLinus Torvalds if (err) 19541da177e4SLinus Torvalds goto out; 19551da177e4SLinus Torvalds } 19561da177e4SLinus Torvalds err = -EINVAL; 195738308473SDavid S. Miller if (!dev || (dev->flags & IFF_LOOPBACK)) 19581da177e4SLinus Torvalds goto out; 19591da177e4SLinus Torvalds } 19601da177e4SLinus Torvalds 19611da177e4SLinus Torvalds err = -ENODEV; 196238308473SDavid S. Miller if (!dev) 19631da177e4SLinus Torvalds goto out; 19641da177e4SLinus Torvalds 1965c3968a85SDaniel Walter if (!ipv6_addr_any(&cfg->fc_prefsrc)) { 1966c3968a85SDaniel Walter if (!ipv6_chk_addr(net, &cfg->fc_prefsrc, dev, 0)) { 1967c3968a85SDaniel Walter err = -EINVAL; 1968c3968a85SDaniel Walter goto out; 1969c3968a85SDaniel Walter } 19704e3fd7a0SAlexey Dobriyan rt->rt6i_prefsrc.addr = cfg->fc_prefsrc; 1971c3968a85SDaniel Walter rt->rt6i_prefsrc.plen = 128; 1972c3968a85SDaniel Walter } else 1973c3968a85SDaniel Walter rt->rt6i_prefsrc.plen = 0; 1974c3968a85SDaniel Walter 197586872cb5SThomas Graf rt->rt6i_flags = cfg->fc_flags; 19761da177e4SLinus Torvalds 19771da177e4SLinus Torvalds install_route: 1978d8d1f30bSChangli Gao rt->dst.dev = dev; 19791da177e4SLinus Torvalds rt->rt6i_idev = idev; 1980c71099acSThomas Graf rt->rt6i_table = table; 198163152fc0SDaniel Lezcano 1982c346dca1SYOSHIFUJI Hideaki cfg->fc_nlinfo.nl_net = dev_net(dev); 198363152fc0SDaniel Lezcano 1984e715b6d3SFlorian Westphal err = ip6_convert_metrics(&mxc, cfg); 1985e715b6d3SFlorian Westphal if (err) 1986e715b6d3SFlorian Westphal goto out; 19871da177e4SLinus Torvalds 1988e715b6d3SFlorian Westphal err = __ip6_ins_rt(rt, &cfg->fc_nlinfo, &mxc); 1989e715b6d3SFlorian Westphal 1990e715b6d3SFlorian Westphal kfree(mxc.mx); 1991e715b6d3SFlorian Westphal return err; 19921da177e4SLinus Torvalds out: 19931da177e4SLinus Torvalds if (dev) 19941da177e4SLinus Torvalds dev_put(dev); 19951da177e4SLinus Torvalds if (idev) 19961da177e4SLinus Torvalds in6_dev_put(idev); 19971da177e4SLinus Torvalds if (rt) 1998d8d1f30bSChangli Gao dst_free(&rt->dst); 19991da177e4SLinus Torvalds return err; 20001da177e4SLinus Torvalds } 20011da177e4SLinus Torvalds 200286872cb5SThomas Graf static int __ip6_del_rt(struct rt6_info *rt, struct nl_info *info) 20031da177e4SLinus Torvalds { 20041da177e4SLinus Torvalds int err; 2005c71099acSThomas Graf struct fib6_table *table; 2006d1918542SDavid S. Miller struct net *net = dev_net(rt->dst.dev); 20071da177e4SLinus Torvalds 20086825a26cSGao feng if (rt == net->ipv6.ip6_null_entry) { 20096825a26cSGao feng err = -ENOENT; 20106825a26cSGao feng goto out; 20116825a26cSGao feng } 20126c813a72SPatrick McHardy 2013c71099acSThomas Graf table = rt->rt6i_table; 2014c71099acSThomas Graf write_lock_bh(&table->tb6_lock); 201586872cb5SThomas Graf err = fib6_del(rt, info); 2016c71099acSThomas Graf write_unlock_bh(&table->tb6_lock); 20171da177e4SLinus Torvalds 20186825a26cSGao feng out: 201994e187c0SAmerigo Wang ip6_rt_put(rt); 20201da177e4SLinus Torvalds return err; 20211da177e4SLinus Torvalds } 20221da177e4SLinus Torvalds 2023e0a1ad73SThomas Graf int ip6_del_rt(struct rt6_info *rt) 2024e0a1ad73SThomas Graf { 20254d1169c1SDenis V. Lunev struct nl_info info = { 2026d1918542SDavid S. Miller .nl_net = dev_net(rt->dst.dev), 20274d1169c1SDenis V. Lunev }; 2028528c4cebSDenis V. Lunev return __ip6_del_rt(rt, &info); 2029e0a1ad73SThomas Graf } 2030e0a1ad73SThomas Graf 203186872cb5SThomas Graf static int ip6_route_del(struct fib6_config *cfg) 20321da177e4SLinus Torvalds { 2033c71099acSThomas Graf struct fib6_table *table; 20341da177e4SLinus Torvalds struct fib6_node *fn; 20351da177e4SLinus Torvalds struct rt6_info *rt; 20361da177e4SLinus Torvalds int err = -ESRCH; 20371da177e4SLinus Torvalds 20385578689aSDaniel Lezcano table = fib6_get_table(cfg->fc_nlinfo.nl_net, cfg->fc_table); 203938308473SDavid S. Miller if (!table) 2040c71099acSThomas Graf return err; 20411da177e4SLinus Torvalds 2042c71099acSThomas Graf read_lock_bh(&table->tb6_lock); 2043c71099acSThomas Graf 2044c71099acSThomas Graf fn = fib6_locate(&table->tb6_root, 204586872cb5SThomas Graf &cfg->fc_dst, cfg->fc_dst_len, 204686872cb5SThomas Graf &cfg->fc_src, cfg->fc_src_len); 20471da177e4SLinus Torvalds 20481da177e4SLinus Torvalds if (fn) { 2049d8d1f30bSChangli Gao for (rt = fn->leaf; rt; rt = rt->dst.rt6_next) { 20501f56a01fSMartin KaFai Lau if ((rt->rt6i_flags & RTF_CACHE) && 20511f56a01fSMartin KaFai Lau !(cfg->fc_flags & RTF_CACHE)) 20521f56a01fSMartin KaFai Lau continue; 205386872cb5SThomas Graf if (cfg->fc_ifindex && 2054d1918542SDavid S. Miller (!rt->dst.dev || 2055d1918542SDavid S. Miller rt->dst.dev->ifindex != cfg->fc_ifindex)) 20561da177e4SLinus Torvalds continue; 205786872cb5SThomas Graf if (cfg->fc_flags & RTF_GATEWAY && 205886872cb5SThomas Graf !ipv6_addr_equal(&cfg->fc_gateway, &rt->rt6i_gateway)) 20591da177e4SLinus Torvalds continue; 206086872cb5SThomas Graf if (cfg->fc_metric && cfg->fc_metric != rt->rt6i_metric) 20611da177e4SLinus Torvalds continue; 2062d8d1f30bSChangli Gao dst_hold(&rt->dst); 2063c71099acSThomas Graf read_unlock_bh(&table->tb6_lock); 20641da177e4SLinus Torvalds 206586872cb5SThomas Graf return __ip6_del_rt(rt, &cfg->fc_nlinfo); 20661da177e4SLinus Torvalds } 20671da177e4SLinus Torvalds } 2068c71099acSThomas Graf read_unlock_bh(&table->tb6_lock); 20691da177e4SLinus Torvalds 20701da177e4SLinus Torvalds return err; 20711da177e4SLinus Torvalds } 20721da177e4SLinus Torvalds 20736700c270SDavid S. Miller static void rt6_do_redirect(struct dst_entry *dst, struct sock *sk, struct sk_buff *skb) 2074a6279458SYOSHIFUJI Hideaki { 2075e8599ff4SDavid S. Miller struct net *net = dev_net(skb->dev); 2076a6279458SYOSHIFUJI Hideaki struct netevent_redirect netevent; 2077e8599ff4SDavid S. Miller struct rt6_info *rt, *nrt = NULL; 2078e8599ff4SDavid S. Miller struct ndisc_options ndopts; 2079e8599ff4SDavid S. Miller struct inet6_dev *in6_dev; 2080e8599ff4SDavid S. Miller struct neighbour *neigh; 208171bcdba0SYOSHIFUJI Hideaki / 吉藤英明 struct rd_msg *msg; 20826e157b6aSDavid S. Miller int optlen, on_link; 20836e157b6aSDavid S. Miller u8 *lladdr; 2084e8599ff4SDavid S. Miller 208529a3cad5SSimon Horman optlen = skb_tail_pointer(skb) - skb_transport_header(skb); 208671bcdba0SYOSHIFUJI Hideaki / 吉藤英明 optlen -= sizeof(*msg); 2087e8599ff4SDavid S. Miller 2088e8599ff4SDavid S. Miller if (optlen < 0) { 20896e157b6aSDavid S. Miller net_dbg_ratelimited("rt6_do_redirect: packet too short\n"); 2090e8599ff4SDavid S. Miller return; 2091e8599ff4SDavid S. Miller } 2092e8599ff4SDavid S. Miller 209371bcdba0SYOSHIFUJI Hideaki / 吉藤英明 msg = (struct rd_msg *)icmp6_hdr(skb); 2094e8599ff4SDavid S. Miller 209571bcdba0SYOSHIFUJI Hideaki / 吉藤英明 if (ipv6_addr_is_multicast(&msg->dest)) { 20966e157b6aSDavid S. Miller net_dbg_ratelimited("rt6_do_redirect: destination address is multicast\n"); 2097e8599ff4SDavid S. Miller return; 2098e8599ff4SDavid S. Miller } 2099e8599ff4SDavid S. Miller 21006e157b6aSDavid S. Miller on_link = 0; 210171bcdba0SYOSHIFUJI Hideaki / 吉藤英明 if (ipv6_addr_equal(&msg->dest, &msg->target)) { 2102e8599ff4SDavid S. Miller on_link = 1; 210371bcdba0SYOSHIFUJI Hideaki / 吉藤英明 } else if (ipv6_addr_type(&msg->target) != 2104e8599ff4SDavid S. Miller (IPV6_ADDR_UNICAST|IPV6_ADDR_LINKLOCAL)) { 21056e157b6aSDavid S. Miller net_dbg_ratelimited("rt6_do_redirect: target address is not link-local unicast\n"); 2106e8599ff4SDavid S. Miller return; 2107e8599ff4SDavid S. Miller } 2108e8599ff4SDavid S. Miller 2109e8599ff4SDavid S. Miller in6_dev = __in6_dev_get(skb->dev); 2110e8599ff4SDavid S. Miller if (!in6_dev) 2111e8599ff4SDavid S. Miller return; 2112e8599ff4SDavid S. Miller if (in6_dev->cnf.forwarding || !in6_dev->cnf.accept_redirects) 2113e8599ff4SDavid S. Miller return; 2114e8599ff4SDavid S. Miller 2115e8599ff4SDavid S. Miller /* RFC2461 8.1: 2116e8599ff4SDavid S. Miller * The IP source address of the Redirect MUST be the same as the current 2117e8599ff4SDavid S. Miller * first-hop router for the specified ICMP Destination Address. 2118e8599ff4SDavid S. Miller */ 2119e8599ff4SDavid S. Miller 212071bcdba0SYOSHIFUJI Hideaki / 吉藤英明 if (!ndisc_parse_options(msg->opt, optlen, &ndopts)) { 2121e8599ff4SDavid S. Miller net_dbg_ratelimited("rt6_redirect: invalid ND options\n"); 2122e8599ff4SDavid S. Miller return; 2123e8599ff4SDavid S. Miller } 21246e157b6aSDavid S. Miller 21256e157b6aSDavid S. Miller lladdr = NULL; 2126e8599ff4SDavid S. Miller if (ndopts.nd_opts_tgt_lladdr) { 2127e8599ff4SDavid S. Miller lladdr = ndisc_opt_addr_data(ndopts.nd_opts_tgt_lladdr, 2128e8599ff4SDavid S. Miller skb->dev); 2129e8599ff4SDavid S. Miller if (!lladdr) { 2130e8599ff4SDavid S. Miller net_dbg_ratelimited("rt6_redirect: invalid link-layer address length\n"); 2131e8599ff4SDavid S. Miller return; 2132e8599ff4SDavid S. Miller } 2133e8599ff4SDavid S. Miller } 2134e8599ff4SDavid S. Miller 21356e157b6aSDavid S. Miller rt = (struct rt6_info *) dst; 21366e157b6aSDavid S. Miller if (rt == net->ipv6.ip6_null_entry) { 21376e157b6aSDavid S. Miller net_dbg_ratelimited("rt6_redirect: source isn't a valid nexthop for redirect target\n"); 21386e157b6aSDavid S. Miller return; 21396e157b6aSDavid S. Miller } 21406e157b6aSDavid S. Miller 21416e157b6aSDavid S. Miller /* Redirect received -> path was valid. 21426e157b6aSDavid S. Miller * Look, redirects are sent only in response to data packets, 21436e157b6aSDavid S. Miller * so that this nexthop apparently is reachable. --ANK 21446e157b6aSDavid S. Miller */ 21456e157b6aSDavid S. Miller dst_confirm(&rt->dst); 21466e157b6aSDavid S. Miller 214771bcdba0SYOSHIFUJI Hideaki / 吉藤英明 neigh = __neigh_lookup(&nd_tbl, &msg->target, skb->dev, 1); 2148e8599ff4SDavid S. Miller if (!neigh) 2149e8599ff4SDavid S. Miller return; 2150e8599ff4SDavid S. Miller 21511da177e4SLinus Torvalds /* 21521da177e4SLinus Torvalds * We have finally decided to accept it. 21531da177e4SLinus Torvalds */ 21541da177e4SLinus Torvalds 21551da177e4SLinus Torvalds neigh_update(neigh, lladdr, NUD_STALE, 21561da177e4SLinus Torvalds NEIGH_UPDATE_F_WEAK_OVERRIDE| 21571da177e4SLinus Torvalds NEIGH_UPDATE_F_OVERRIDE| 21581da177e4SLinus Torvalds (on_link ? 0 : (NEIGH_UPDATE_F_OVERRIDE_ISROUTER| 21591da177e4SLinus Torvalds NEIGH_UPDATE_F_ISROUTER)) 21601da177e4SLinus Torvalds ); 21611da177e4SLinus Torvalds 216283a09abdSMartin KaFai Lau nrt = ip6_rt_cache_alloc(rt, &msg->dest, NULL); 216338308473SDavid S. Miller if (!nrt) 21641da177e4SLinus Torvalds goto out; 21651da177e4SLinus Torvalds 21661da177e4SLinus Torvalds nrt->rt6i_flags = RTF_GATEWAY|RTF_UP|RTF_DYNAMIC|RTF_CACHE; 21671da177e4SLinus Torvalds if (on_link) 21681da177e4SLinus Torvalds nrt->rt6i_flags &= ~RTF_GATEWAY; 21691da177e4SLinus Torvalds 21704e3fd7a0SAlexey Dobriyan nrt->rt6i_gateway = *(struct in6_addr *)neigh->primary_key; 21711da177e4SLinus Torvalds 217240e22e8fSThomas Graf if (ip6_ins_rt(nrt)) 21731da177e4SLinus Torvalds goto out; 21741da177e4SLinus Torvalds 2175d8d1f30bSChangli Gao netevent.old = &rt->dst; 2176d8d1f30bSChangli Gao netevent.new = &nrt->dst; 217771bcdba0SYOSHIFUJI Hideaki / 吉藤英明 netevent.daddr = &msg->dest; 217860592833SYOSHIFUJI Hideaki / 吉藤英明 netevent.neigh = neigh; 21798d71740cSTom Tucker call_netevent_notifiers(NETEVENT_REDIRECT, &netevent); 21808d71740cSTom Tucker 21811da177e4SLinus Torvalds if (rt->rt6i_flags & RTF_CACHE) { 21826e157b6aSDavid S. Miller rt = (struct rt6_info *) dst_clone(&rt->dst); 2183e0a1ad73SThomas Graf ip6_del_rt(rt); 21841da177e4SLinus Torvalds } 21851da177e4SLinus Torvalds 21861da177e4SLinus Torvalds out: 2187e8599ff4SDavid S. Miller neigh_release(neigh); 21886e157b6aSDavid S. Miller } 21896e157b6aSDavid S. Miller 21901da177e4SLinus Torvalds /* 21911da177e4SLinus Torvalds * Misc support functions 21921da177e4SLinus Torvalds */ 21931da177e4SLinus Torvalds 21944b32b5adSMartin KaFai Lau static void rt6_set_from(struct rt6_info *rt, struct rt6_info *from) 21954b32b5adSMartin KaFai Lau { 21964b32b5adSMartin KaFai Lau BUG_ON(from->dst.from); 21974b32b5adSMartin KaFai Lau 21984b32b5adSMartin KaFai Lau rt->rt6i_flags &= ~RTF_EXPIRES; 21994b32b5adSMartin KaFai Lau dst_hold(&from->dst); 22004b32b5adSMartin KaFai Lau rt->dst.from = &from->dst; 22014b32b5adSMartin KaFai Lau dst_init_metrics(&rt->dst, dst_metrics_ptr(&from->dst), true); 22024b32b5adSMartin KaFai Lau } 22034b32b5adSMartin KaFai Lau 220483a09abdSMartin KaFai Lau static void ip6_rt_copy_init(struct rt6_info *rt, struct rt6_info *ort) 22051da177e4SLinus Torvalds { 2206d8d1f30bSChangli Gao rt->dst.input = ort->dst.input; 2207d8d1f30bSChangli Gao rt->dst.output = ort->dst.output; 220883a09abdSMartin KaFai Lau rt->rt6i_dst = ort->rt6i_dst; 2209d8d1f30bSChangli Gao rt->dst.error = ort->dst.error; 22101da177e4SLinus Torvalds rt->rt6i_idev = ort->rt6i_idev; 22111da177e4SLinus Torvalds if (rt->rt6i_idev) 22121da177e4SLinus Torvalds in6_dev_hold(rt->rt6i_idev); 2213d8d1f30bSChangli Gao rt->dst.lastuse = jiffies; 22144e3fd7a0SAlexey Dobriyan rt->rt6i_gateway = ort->rt6i_gateway; 22151716a961SGao feng rt->rt6i_flags = ort->rt6i_flags; 22161716a961SGao feng rt6_set_from(rt, ort); 221783a09abdSMartin KaFai Lau rt->rt6i_metric = ort->rt6i_metric; 22181da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES 221983a09abdSMartin KaFai Lau rt->rt6i_src = ort->rt6i_src; 22201da177e4SLinus Torvalds #endif 222183a09abdSMartin KaFai Lau rt->rt6i_prefsrc = ort->rt6i_prefsrc; 2222c71099acSThomas Graf rt->rt6i_table = ort->rt6i_table; 222361adedf3SJiri Benc rt->dst.lwtstate = lwtstate_get(ort->dst.lwtstate); 22241da177e4SLinus Torvalds } 22251da177e4SLinus Torvalds 222670ceb4f5SYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_ROUTE_INFO 2227efa2cea0SDaniel Lezcano static struct rt6_info *rt6_get_route_info(struct net *net, 2228b71d1d42SEric Dumazet const struct in6_addr *prefix, int prefixlen, 2229b71d1d42SEric Dumazet const struct in6_addr *gwaddr, int ifindex) 223070ceb4f5SYOSHIFUJI Hideaki { 223170ceb4f5SYOSHIFUJI Hideaki struct fib6_node *fn; 223270ceb4f5SYOSHIFUJI Hideaki struct rt6_info *rt = NULL; 2233c71099acSThomas Graf struct fib6_table *table; 223470ceb4f5SYOSHIFUJI Hideaki 2235efa2cea0SDaniel Lezcano table = fib6_get_table(net, RT6_TABLE_INFO); 223638308473SDavid S. Miller if (!table) 2237c71099acSThomas Graf return NULL; 2238c71099acSThomas Graf 22395744dd9bSLi RongQing read_lock_bh(&table->tb6_lock); 2240c71099acSThomas Graf fn = fib6_locate(&table->tb6_root, prefix, prefixlen, NULL, 0); 224170ceb4f5SYOSHIFUJI Hideaki if (!fn) 224270ceb4f5SYOSHIFUJI Hideaki goto out; 224370ceb4f5SYOSHIFUJI Hideaki 2244d8d1f30bSChangli Gao for (rt = fn->leaf; rt; rt = rt->dst.rt6_next) { 2245d1918542SDavid S. Miller if (rt->dst.dev->ifindex != ifindex) 224670ceb4f5SYOSHIFUJI Hideaki continue; 224770ceb4f5SYOSHIFUJI Hideaki if ((rt->rt6i_flags & (RTF_ROUTEINFO|RTF_GATEWAY)) != (RTF_ROUTEINFO|RTF_GATEWAY)) 224870ceb4f5SYOSHIFUJI Hideaki continue; 224970ceb4f5SYOSHIFUJI Hideaki if (!ipv6_addr_equal(&rt->rt6i_gateway, gwaddr)) 225070ceb4f5SYOSHIFUJI Hideaki continue; 2251d8d1f30bSChangli Gao dst_hold(&rt->dst); 225270ceb4f5SYOSHIFUJI Hideaki break; 225370ceb4f5SYOSHIFUJI Hideaki } 225470ceb4f5SYOSHIFUJI Hideaki out: 22555744dd9bSLi RongQing read_unlock_bh(&table->tb6_lock); 225670ceb4f5SYOSHIFUJI Hideaki return rt; 225770ceb4f5SYOSHIFUJI Hideaki } 225870ceb4f5SYOSHIFUJI Hideaki 2259efa2cea0SDaniel Lezcano static struct rt6_info *rt6_add_route_info(struct net *net, 2260b71d1d42SEric Dumazet const struct in6_addr *prefix, int prefixlen, 2261b71d1d42SEric Dumazet const struct in6_addr *gwaddr, int ifindex, 226295c96174SEric Dumazet unsigned int pref) 226370ceb4f5SYOSHIFUJI Hideaki { 226486872cb5SThomas Graf struct fib6_config cfg = { 226586872cb5SThomas Graf .fc_table = RT6_TABLE_INFO, 2266238fc7eaSRami Rosen .fc_metric = IP6_RT_PRIO_USER, 226786872cb5SThomas Graf .fc_ifindex = ifindex, 226886872cb5SThomas Graf .fc_dst_len = prefixlen, 226986872cb5SThomas Graf .fc_flags = RTF_GATEWAY | RTF_ADDRCONF | RTF_ROUTEINFO | 227086872cb5SThomas Graf RTF_UP | RTF_PREF(pref), 227115e47304SEric W. Biederman .fc_nlinfo.portid = 0, 2272efa2cea0SDaniel Lezcano .fc_nlinfo.nlh = NULL, 2273efa2cea0SDaniel Lezcano .fc_nlinfo.nl_net = net, 227486872cb5SThomas Graf }; 227570ceb4f5SYOSHIFUJI Hideaki 22764e3fd7a0SAlexey Dobriyan cfg.fc_dst = *prefix; 22774e3fd7a0SAlexey Dobriyan cfg.fc_gateway = *gwaddr; 227886872cb5SThomas Graf 2279e317da96SYOSHIFUJI Hideaki /* We should treat it as a default route if prefix length is 0. */ 2280e317da96SYOSHIFUJI Hideaki if (!prefixlen) 228186872cb5SThomas Graf cfg.fc_flags |= RTF_DEFAULT; 228270ceb4f5SYOSHIFUJI Hideaki 228386872cb5SThomas Graf ip6_route_add(&cfg); 228470ceb4f5SYOSHIFUJI Hideaki 2285efa2cea0SDaniel Lezcano return rt6_get_route_info(net, prefix, prefixlen, gwaddr, ifindex); 228670ceb4f5SYOSHIFUJI Hideaki } 228770ceb4f5SYOSHIFUJI Hideaki #endif 228870ceb4f5SYOSHIFUJI Hideaki 2289b71d1d42SEric Dumazet struct rt6_info *rt6_get_dflt_router(const struct in6_addr *addr, struct net_device *dev) 22901da177e4SLinus Torvalds { 22911da177e4SLinus Torvalds struct rt6_info *rt; 2292c71099acSThomas Graf struct fib6_table *table; 22931da177e4SLinus Torvalds 2294c346dca1SYOSHIFUJI Hideaki table = fib6_get_table(dev_net(dev), RT6_TABLE_DFLT); 229538308473SDavid S. Miller if (!table) 2296c71099acSThomas Graf return NULL; 22971da177e4SLinus Torvalds 22985744dd9bSLi RongQing read_lock_bh(&table->tb6_lock); 2299d8d1f30bSChangli Gao for (rt = table->tb6_root.leaf; rt; rt = rt->dst.rt6_next) { 2300d1918542SDavid S. Miller if (dev == rt->dst.dev && 2301045927ffSYOSHIFUJI Hideaki ((rt->rt6i_flags & (RTF_ADDRCONF | RTF_DEFAULT)) == (RTF_ADDRCONF | RTF_DEFAULT)) && 23021da177e4SLinus Torvalds ipv6_addr_equal(&rt->rt6i_gateway, addr)) 23031da177e4SLinus Torvalds break; 23041da177e4SLinus Torvalds } 23051da177e4SLinus Torvalds if (rt) 2306d8d1f30bSChangli Gao dst_hold(&rt->dst); 23075744dd9bSLi RongQing read_unlock_bh(&table->tb6_lock); 23081da177e4SLinus Torvalds return rt; 23091da177e4SLinus Torvalds } 23101da177e4SLinus Torvalds 2311b71d1d42SEric Dumazet struct rt6_info *rt6_add_dflt_router(const struct in6_addr *gwaddr, 2312ebacaaa0SYOSHIFUJI Hideaki struct net_device *dev, 2313ebacaaa0SYOSHIFUJI Hideaki unsigned int pref) 23141da177e4SLinus Torvalds { 231586872cb5SThomas Graf struct fib6_config cfg = { 231686872cb5SThomas Graf .fc_table = RT6_TABLE_DFLT, 2317238fc7eaSRami Rosen .fc_metric = IP6_RT_PRIO_USER, 231886872cb5SThomas Graf .fc_ifindex = dev->ifindex, 231986872cb5SThomas Graf .fc_flags = RTF_GATEWAY | RTF_ADDRCONF | RTF_DEFAULT | 232086872cb5SThomas Graf RTF_UP | RTF_EXPIRES | RTF_PREF(pref), 232115e47304SEric W. Biederman .fc_nlinfo.portid = 0, 23225578689aSDaniel Lezcano .fc_nlinfo.nlh = NULL, 2323c346dca1SYOSHIFUJI Hideaki .fc_nlinfo.nl_net = dev_net(dev), 232486872cb5SThomas Graf }; 23251da177e4SLinus Torvalds 23264e3fd7a0SAlexey Dobriyan cfg.fc_gateway = *gwaddr; 23271da177e4SLinus Torvalds 232886872cb5SThomas Graf ip6_route_add(&cfg); 23291da177e4SLinus Torvalds 23301da177e4SLinus Torvalds return rt6_get_dflt_router(gwaddr, dev); 23311da177e4SLinus Torvalds } 23321da177e4SLinus Torvalds 23337b4da532SDaniel Lezcano void rt6_purge_dflt_routers(struct net *net) 23341da177e4SLinus Torvalds { 23351da177e4SLinus Torvalds struct rt6_info *rt; 2336c71099acSThomas Graf struct fib6_table *table; 2337c71099acSThomas Graf 2338c71099acSThomas Graf /* NOTE: Keep consistent with rt6_get_dflt_router */ 23397b4da532SDaniel Lezcano table = fib6_get_table(net, RT6_TABLE_DFLT); 234038308473SDavid S. Miller if (!table) 2341c71099acSThomas Graf return; 23421da177e4SLinus Torvalds 23431da177e4SLinus Torvalds restart: 2344c71099acSThomas Graf read_lock_bh(&table->tb6_lock); 2345d8d1f30bSChangli Gao for (rt = table->tb6_root.leaf; rt; rt = rt->dst.rt6_next) { 23463e8b0ac3SLorenzo Colitti if (rt->rt6i_flags & (RTF_DEFAULT | RTF_ADDRCONF) && 23473e8b0ac3SLorenzo Colitti (!rt->rt6i_idev || rt->rt6i_idev->cnf.accept_ra != 2)) { 2348d8d1f30bSChangli Gao dst_hold(&rt->dst); 2349c71099acSThomas Graf read_unlock_bh(&table->tb6_lock); 2350e0a1ad73SThomas Graf ip6_del_rt(rt); 23511da177e4SLinus Torvalds goto restart; 23521da177e4SLinus Torvalds } 23531da177e4SLinus Torvalds } 2354c71099acSThomas Graf read_unlock_bh(&table->tb6_lock); 23551da177e4SLinus Torvalds } 23561da177e4SLinus Torvalds 23575578689aSDaniel Lezcano static void rtmsg_to_fib6_config(struct net *net, 23585578689aSDaniel Lezcano struct in6_rtmsg *rtmsg, 235986872cb5SThomas Graf struct fib6_config *cfg) 236086872cb5SThomas Graf { 236186872cb5SThomas Graf memset(cfg, 0, sizeof(*cfg)); 236286872cb5SThomas Graf 236386872cb5SThomas Graf cfg->fc_table = RT6_TABLE_MAIN; 236486872cb5SThomas Graf cfg->fc_ifindex = rtmsg->rtmsg_ifindex; 236586872cb5SThomas Graf cfg->fc_metric = rtmsg->rtmsg_metric; 236686872cb5SThomas Graf cfg->fc_expires = rtmsg->rtmsg_info; 236786872cb5SThomas Graf cfg->fc_dst_len = rtmsg->rtmsg_dst_len; 236886872cb5SThomas Graf cfg->fc_src_len = rtmsg->rtmsg_src_len; 236986872cb5SThomas Graf cfg->fc_flags = rtmsg->rtmsg_flags; 237086872cb5SThomas Graf 23715578689aSDaniel Lezcano cfg->fc_nlinfo.nl_net = net; 2372f1243c2dSBenjamin Thery 23734e3fd7a0SAlexey Dobriyan cfg->fc_dst = rtmsg->rtmsg_dst; 23744e3fd7a0SAlexey Dobriyan cfg->fc_src = rtmsg->rtmsg_src; 23754e3fd7a0SAlexey Dobriyan cfg->fc_gateway = rtmsg->rtmsg_gateway; 237686872cb5SThomas Graf } 237786872cb5SThomas Graf 23785578689aSDaniel Lezcano int ipv6_route_ioctl(struct net *net, unsigned int cmd, void __user *arg) 23791da177e4SLinus Torvalds { 238086872cb5SThomas Graf struct fib6_config cfg; 23811da177e4SLinus Torvalds struct in6_rtmsg rtmsg; 23821da177e4SLinus Torvalds int err; 23831da177e4SLinus Torvalds 23841da177e4SLinus Torvalds switch (cmd) { 23851da177e4SLinus Torvalds case SIOCADDRT: /* Add a route */ 23861da177e4SLinus Torvalds case SIOCDELRT: /* Delete a route */ 2387af31f412SEric W. Biederman if (!ns_capable(net->user_ns, CAP_NET_ADMIN)) 23881da177e4SLinus Torvalds return -EPERM; 23891da177e4SLinus Torvalds err = copy_from_user(&rtmsg, arg, 23901da177e4SLinus Torvalds sizeof(struct in6_rtmsg)); 23911da177e4SLinus Torvalds if (err) 23921da177e4SLinus Torvalds return -EFAULT; 23931da177e4SLinus Torvalds 23945578689aSDaniel Lezcano rtmsg_to_fib6_config(net, &rtmsg, &cfg); 239586872cb5SThomas Graf 23961da177e4SLinus Torvalds rtnl_lock(); 23971da177e4SLinus Torvalds switch (cmd) { 23981da177e4SLinus Torvalds case SIOCADDRT: 239986872cb5SThomas Graf err = ip6_route_add(&cfg); 24001da177e4SLinus Torvalds break; 24011da177e4SLinus Torvalds case SIOCDELRT: 240286872cb5SThomas Graf err = ip6_route_del(&cfg); 24031da177e4SLinus Torvalds break; 24041da177e4SLinus Torvalds default: 24051da177e4SLinus Torvalds err = -EINVAL; 24061da177e4SLinus Torvalds } 24071da177e4SLinus Torvalds rtnl_unlock(); 24081da177e4SLinus Torvalds 24091da177e4SLinus Torvalds return err; 24103ff50b79SStephen Hemminger } 24111da177e4SLinus Torvalds 24121da177e4SLinus Torvalds return -EINVAL; 24131da177e4SLinus Torvalds } 24141da177e4SLinus Torvalds 24151da177e4SLinus Torvalds /* 24161da177e4SLinus Torvalds * Drop the packet on the floor 24171da177e4SLinus Torvalds */ 24181da177e4SLinus Torvalds 2419d5fdd6baSBrian Haley static int ip6_pkt_drop(struct sk_buff *skb, u8 code, int ipstats_mib_noroutes) 24201da177e4SLinus Torvalds { 2421612f09e8SYOSHIFUJI Hideaki int type; 2422adf30907SEric Dumazet struct dst_entry *dst = skb_dst(skb); 2423612f09e8SYOSHIFUJI Hideaki switch (ipstats_mib_noroutes) { 2424612f09e8SYOSHIFUJI Hideaki case IPSTATS_MIB_INNOROUTES: 24250660e03fSArnaldo Carvalho de Melo type = ipv6_addr_type(&ipv6_hdr(skb)->daddr); 242645bb0060SUlrich Weber if (type == IPV6_ADDR_ANY) { 24273bd653c8SDenis V. Lunev IP6_INC_STATS(dev_net(dst->dev), ip6_dst_idev(dst), 24283bd653c8SDenis V. Lunev IPSTATS_MIB_INADDRERRORS); 2429612f09e8SYOSHIFUJI Hideaki break; 2430612f09e8SYOSHIFUJI Hideaki } 2431612f09e8SYOSHIFUJI Hideaki /* FALLTHROUGH */ 2432612f09e8SYOSHIFUJI Hideaki case IPSTATS_MIB_OUTNOROUTES: 24333bd653c8SDenis V. Lunev IP6_INC_STATS(dev_net(dst->dev), ip6_dst_idev(dst), 24343bd653c8SDenis V. Lunev ipstats_mib_noroutes); 2435612f09e8SYOSHIFUJI Hideaki break; 2436612f09e8SYOSHIFUJI Hideaki } 24373ffe533cSAlexey Dobriyan icmpv6_send(skb, ICMPV6_DEST_UNREACH, code, 0); 24381da177e4SLinus Torvalds kfree_skb(skb); 24391da177e4SLinus Torvalds return 0; 24401da177e4SLinus Torvalds } 24411da177e4SLinus Torvalds 24429ce8ade0SThomas Graf static int ip6_pkt_discard(struct sk_buff *skb) 24439ce8ade0SThomas Graf { 2444612f09e8SYOSHIFUJI Hideaki return ip6_pkt_drop(skb, ICMPV6_NOROUTE, IPSTATS_MIB_INNOROUTES); 24459ce8ade0SThomas Graf } 24469ce8ade0SThomas Graf 2447aad88724SEric Dumazet static int ip6_pkt_discard_out(struct sock *sk, struct sk_buff *skb) 24481da177e4SLinus Torvalds { 2449adf30907SEric Dumazet skb->dev = skb_dst(skb)->dev; 2450612f09e8SYOSHIFUJI Hideaki return ip6_pkt_drop(skb, ICMPV6_NOROUTE, IPSTATS_MIB_OUTNOROUTES); 24511da177e4SLinus Torvalds } 24521da177e4SLinus Torvalds 24539ce8ade0SThomas Graf static int ip6_pkt_prohibit(struct sk_buff *skb) 24549ce8ade0SThomas Graf { 2455612f09e8SYOSHIFUJI Hideaki return ip6_pkt_drop(skb, ICMPV6_ADM_PROHIBITED, IPSTATS_MIB_INNOROUTES); 24569ce8ade0SThomas Graf } 24579ce8ade0SThomas Graf 2458aad88724SEric Dumazet static int ip6_pkt_prohibit_out(struct sock *sk, struct sk_buff *skb) 24599ce8ade0SThomas Graf { 2460adf30907SEric Dumazet skb->dev = skb_dst(skb)->dev; 2461612f09e8SYOSHIFUJI Hideaki return ip6_pkt_drop(skb, ICMPV6_ADM_PROHIBITED, IPSTATS_MIB_OUTNOROUTES); 24629ce8ade0SThomas Graf } 24639ce8ade0SThomas Graf 24641da177e4SLinus Torvalds /* 24651da177e4SLinus Torvalds * Allocate a dst for local (unicast / anycast) address. 24661da177e4SLinus Torvalds */ 24671da177e4SLinus Torvalds 24681da177e4SLinus Torvalds struct rt6_info *addrconf_dst_alloc(struct inet6_dev *idev, 24691da177e4SLinus Torvalds const struct in6_addr *addr, 24708f031519SDavid S. Miller bool anycast) 24711da177e4SLinus Torvalds { 2472c346dca1SYOSHIFUJI Hideaki struct net *net = dev_net(idev->dev); 2473a3300ef4SHannes Frederic Sowa struct rt6_info *rt = ip6_dst_alloc(net, net->loopback_dev, 2474ad706862SMartin KaFai Lau DST_NOCOUNT); 2475a3300ef4SHannes Frederic Sowa if (!rt) 24761da177e4SLinus Torvalds return ERR_PTR(-ENOMEM); 24771da177e4SLinus Torvalds 24781da177e4SLinus Torvalds in6_dev_hold(idev); 24791da177e4SLinus Torvalds 248011d53b49SDavid S. Miller rt->dst.flags |= DST_HOST; 2481d8d1f30bSChangli Gao rt->dst.input = ip6_input; 2482d8d1f30bSChangli Gao rt->dst.output = ip6_output; 24831da177e4SLinus Torvalds rt->rt6i_idev = idev; 24841da177e4SLinus Torvalds 24851da177e4SLinus Torvalds rt->rt6i_flags = RTF_UP | RTF_NONEXTHOP; 248658c4fb86SYOSHIFUJI Hideaki if (anycast) 248758c4fb86SYOSHIFUJI Hideaki rt->rt6i_flags |= RTF_ANYCAST; 248858c4fb86SYOSHIFUJI Hideaki else 24891da177e4SLinus Torvalds rt->rt6i_flags |= RTF_LOCAL; 24901da177e4SLinus Torvalds 2491550bab42SJulian Anastasov rt->rt6i_gateway = *addr; 24924e3fd7a0SAlexey Dobriyan rt->rt6i_dst.addr = *addr; 24931da177e4SLinus Torvalds rt->rt6i_dst.plen = 128; 24945578689aSDaniel Lezcano rt->rt6i_table = fib6_get_table(net, RT6_TABLE_LOCAL); 24951da177e4SLinus Torvalds 2496d8d1f30bSChangli Gao atomic_set(&rt->dst.__refcnt, 1); 24971da177e4SLinus Torvalds 24981da177e4SLinus Torvalds return rt; 24991da177e4SLinus Torvalds } 25001da177e4SLinus Torvalds 2501c3968a85SDaniel Walter int ip6_route_get_saddr(struct net *net, 2502c3968a85SDaniel Walter struct rt6_info *rt, 2503b71d1d42SEric Dumazet const struct in6_addr *daddr, 2504c3968a85SDaniel Walter unsigned int prefs, 2505c3968a85SDaniel Walter struct in6_addr *saddr) 2506c3968a85SDaniel Walter { 2507e16e888bSMarkus Stenberg struct inet6_dev *idev = 2508e16e888bSMarkus Stenberg rt ? ip6_dst_idev((struct dst_entry *)rt) : NULL; 2509c3968a85SDaniel Walter int err = 0; 2510e16e888bSMarkus Stenberg if (rt && rt->rt6i_prefsrc.plen) 25114e3fd7a0SAlexey Dobriyan *saddr = rt->rt6i_prefsrc.addr; 2512c3968a85SDaniel Walter else 2513c3968a85SDaniel Walter err = ipv6_dev_get_saddr(net, idev ? idev->dev : NULL, 2514c3968a85SDaniel Walter daddr, prefs, saddr); 2515c3968a85SDaniel Walter return err; 2516c3968a85SDaniel Walter } 2517c3968a85SDaniel Walter 2518c3968a85SDaniel Walter /* remove deleted ip from prefsrc entries */ 2519c3968a85SDaniel Walter struct arg_dev_net_ip { 2520c3968a85SDaniel Walter struct net_device *dev; 2521c3968a85SDaniel Walter struct net *net; 2522c3968a85SDaniel Walter struct in6_addr *addr; 2523c3968a85SDaniel Walter }; 2524c3968a85SDaniel Walter 2525c3968a85SDaniel Walter static int fib6_remove_prefsrc(struct rt6_info *rt, void *arg) 2526c3968a85SDaniel Walter { 2527c3968a85SDaniel Walter struct net_device *dev = ((struct arg_dev_net_ip *)arg)->dev; 2528c3968a85SDaniel Walter struct net *net = ((struct arg_dev_net_ip *)arg)->net; 2529c3968a85SDaniel Walter struct in6_addr *addr = ((struct arg_dev_net_ip *)arg)->addr; 2530c3968a85SDaniel Walter 2531d1918542SDavid S. Miller if (((void *)rt->dst.dev == dev || !dev) && 2532c3968a85SDaniel Walter rt != net->ipv6.ip6_null_entry && 2533c3968a85SDaniel Walter ipv6_addr_equal(addr, &rt->rt6i_prefsrc.addr)) { 2534c3968a85SDaniel Walter /* remove prefsrc entry */ 2535c3968a85SDaniel Walter rt->rt6i_prefsrc.plen = 0; 2536c3968a85SDaniel Walter } 2537c3968a85SDaniel Walter return 0; 2538c3968a85SDaniel Walter } 2539c3968a85SDaniel Walter 2540c3968a85SDaniel Walter void rt6_remove_prefsrc(struct inet6_ifaddr *ifp) 2541c3968a85SDaniel Walter { 2542c3968a85SDaniel Walter struct net *net = dev_net(ifp->idev->dev); 2543c3968a85SDaniel Walter struct arg_dev_net_ip adni = { 2544c3968a85SDaniel Walter .dev = ifp->idev->dev, 2545c3968a85SDaniel Walter .net = net, 2546c3968a85SDaniel Walter .addr = &ifp->addr, 2547c3968a85SDaniel Walter }; 25480c3584d5SLi RongQing fib6_clean_all(net, fib6_remove_prefsrc, &adni); 2549c3968a85SDaniel Walter } 2550c3968a85SDaniel Walter 2551be7a010dSDuan Jiong #define RTF_RA_ROUTER (RTF_ADDRCONF | RTF_DEFAULT | RTF_GATEWAY) 2552be7a010dSDuan Jiong #define RTF_CACHE_GATEWAY (RTF_GATEWAY | RTF_CACHE) 2553be7a010dSDuan Jiong 2554be7a010dSDuan Jiong /* Remove routers and update dst entries when gateway turn into host. */ 2555be7a010dSDuan Jiong static int fib6_clean_tohost(struct rt6_info *rt, void *arg) 2556be7a010dSDuan Jiong { 2557be7a010dSDuan Jiong struct in6_addr *gateway = (struct in6_addr *)arg; 2558be7a010dSDuan Jiong 2559be7a010dSDuan Jiong if ((((rt->rt6i_flags & RTF_RA_ROUTER) == RTF_RA_ROUTER) || 2560be7a010dSDuan Jiong ((rt->rt6i_flags & RTF_CACHE_GATEWAY) == RTF_CACHE_GATEWAY)) && 2561be7a010dSDuan Jiong ipv6_addr_equal(gateway, &rt->rt6i_gateway)) { 2562be7a010dSDuan Jiong return -1; 2563be7a010dSDuan Jiong } 2564be7a010dSDuan Jiong return 0; 2565be7a010dSDuan Jiong } 2566be7a010dSDuan Jiong 2567be7a010dSDuan Jiong void rt6_clean_tohost(struct net *net, struct in6_addr *gateway) 2568be7a010dSDuan Jiong { 2569be7a010dSDuan Jiong fib6_clean_all(net, fib6_clean_tohost, gateway); 2570be7a010dSDuan Jiong } 2571be7a010dSDuan Jiong 25728ed67789SDaniel Lezcano struct arg_dev_net { 25738ed67789SDaniel Lezcano struct net_device *dev; 25748ed67789SDaniel Lezcano struct net *net; 25758ed67789SDaniel Lezcano }; 25768ed67789SDaniel Lezcano 25771da177e4SLinus Torvalds static int fib6_ifdown(struct rt6_info *rt, void *arg) 25781da177e4SLinus Torvalds { 2579bc3ef660Sstephen hemminger const struct arg_dev_net *adn = arg; 2580bc3ef660Sstephen hemminger const struct net_device *dev = adn->dev; 25818ed67789SDaniel Lezcano 2582d1918542SDavid S. Miller if ((rt->dst.dev == dev || !dev) && 2583c159d30cSDavid S. Miller rt != adn->net->ipv6.ip6_null_entry) 25841da177e4SLinus Torvalds return -1; 2585c159d30cSDavid S. Miller 25861da177e4SLinus Torvalds return 0; 25871da177e4SLinus Torvalds } 25881da177e4SLinus Torvalds 2589f3db4851SDaniel Lezcano void rt6_ifdown(struct net *net, struct net_device *dev) 25901da177e4SLinus Torvalds { 25918ed67789SDaniel Lezcano struct arg_dev_net adn = { 25928ed67789SDaniel Lezcano .dev = dev, 25938ed67789SDaniel Lezcano .net = net, 25948ed67789SDaniel Lezcano }; 25958ed67789SDaniel Lezcano 25960c3584d5SLi RongQing fib6_clean_all(net, fib6_ifdown, &adn); 25971e493d19SDavid S. Miller icmp6_clean_all(fib6_ifdown, &adn); 25988d0b94afSMartin KaFai Lau rt6_uncached_list_flush_dev(net, dev); 25991da177e4SLinus Torvalds } 26001da177e4SLinus Torvalds 260195c96174SEric Dumazet struct rt6_mtu_change_arg { 26021da177e4SLinus Torvalds struct net_device *dev; 260395c96174SEric Dumazet unsigned int mtu; 26041da177e4SLinus Torvalds }; 26051da177e4SLinus Torvalds 26061da177e4SLinus Torvalds static int rt6_mtu_change_route(struct rt6_info *rt, void *p_arg) 26071da177e4SLinus Torvalds { 26081da177e4SLinus Torvalds struct rt6_mtu_change_arg *arg = (struct rt6_mtu_change_arg *) p_arg; 26091da177e4SLinus Torvalds struct inet6_dev *idev; 26101da177e4SLinus Torvalds 26111da177e4SLinus Torvalds /* In IPv6 pmtu discovery is not optional, 26121da177e4SLinus Torvalds so that RTAX_MTU lock cannot disable it. 26131da177e4SLinus Torvalds We still use this lock to block changes 26141da177e4SLinus Torvalds caused by addrconf/ndisc. 26151da177e4SLinus Torvalds */ 26161da177e4SLinus Torvalds 26171da177e4SLinus Torvalds idev = __in6_dev_get(arg->dev); 261838308473SDavid S. Miller if (!idev) 26191da177e4SLinus Torvalds return 0; 26201da177e4SLinus Torvalds 26211da177e4SLinus Torvalds /* For administrative MTU increase, there is no way to discover 26221da177e4SLinus Torvalds IPv6 PMTU increase, so PMTU increase should be updated here. 26231da177e4SLinus Torvalds Since RFC 1981 doesn't include administrative MTU increase 26241da177e4SLinus Torvalds update PMTU increase is a MUST. (i.e. jumbo frame) 26251da177e4SLinus Torvalds */ 26261da177e4SLinus Torvalds /* 26271da177e4SLinus Torvalds If new MTU is less than route PMTU, this new MTU will be the 26281da177e4SLinus Torvalds lowest MTU in the path, update the route PMTU to reflect PMTU 26291da177e4SLinus Torvalds decreases; if new MTU is greater than route PMTU, and the 26301da177e4SLinus Torvalds old MTU is the lowest MTU in the path, update the route PMTU 26311da177e4SLinus Torvalds to reflect the increase. In this case if the other nodes' MTU 26321da177e4SLinus Torvalds also have the lowest MTU, TOO BIG MESSAGE will be lead to 26331da177e4SLinus Torvalds PMTU discouvery. 26341da177e4SLinus Torvalds */ 2635d1918542SDavid S. Miller if (rt->dst.dev == arg->dev && 26364b32b5adSMartin KaFai Lau !dst_metric_locked(&rt->dst, RTAX_MTU)) { 26374b32b5adSMartin KaFai Lau if (rt->rt6i_flags & RTF_CACHE) { 26384b32b5adSMartin KaFai Lau /* For RTF_CACHE with rt6i_pmtu == 0 26394b32b5adSMartin KaFai Lau * (i.e. a redirected route), 26404b32b5adSMartin KaFai Lau * the metrics of its rt->dst.from has already 26414b32b5adSMartin KaFai Lau * been updated. 26424b32b5adSMartin KaFai Lau */ 26434b32b5adSMartin KaFai Lau if (rt->rt6i_pmtu && rt->rt6i_pmtu > arg->mtu) 26444b32b5adSMartin KaFai Lau rt->rt6i_pmtu = arg->mtu; 26454b32b5adSMartin KaFai Lau } else if (dst_mtu(&rt->dst) >= arg->mtu || 2646d8d1f30bSChangli Gao (dst_mtu(&rt->dst) < arg->mtu && 26474b32b5adSMartin KaFai Lau dst_mtu(&rt->dst) == idev->cnf.mtu6)) { 2648defb3519SDavid S. Miller dst_metric_set(&rt->dst, RTAX_MTU, arg->mtu); 2649566cfd8fSSimon Arlott } 26504b32b5adSMartin KaFai Lau } 26511da177e4SLinus Torvalds return 0; 26521da177e4SLinus Torvalds } 26531da177e4SLinus Torvalds 265495c96174SEric Dumazet void rt6_mtu_change(struct net_device *dev, unsigned int mtu) 26551da177e4SLinus Torvalds { 2656c71099acSThomas Graf struct rt6_mtu_change_arg arg = { 2657c71099acSThomas Graf .dev = dev, 2658c71099acSThomas Graf .mtu = mtu, 2659c71099acSThomas Graf }; 26601da177e4SLinus Torvalds 26610c3584d5SLi RongQing fib6_clean_all(dev_net(dev), rt6_mtu_change_route, &arg); 26621da177e4SLinus Torvalds } 26631da177e4SLinus Torvalds 2664ef7c79edSPatrick McHardy static const struct nla_policy rtm_ipv6_policy[RTA_MAX+1] = { 26655176f91eSThomas Graf [RTA_GATEWAY] = { .len = sizeof(struct in6_addr) }, 266686872cb5SThomas Graf [RTA_OIF] = { .type = NLA_U32 }, 2667ab364a6fSThomas Graf [RTA_IIF] = { .type = NLA_U32 }, 266886872cb5SThomas Graf [RTA_PRIORITY] = { .type = NLA_U32 }, 266986872cb5SThomas Graf [RTA_METRICS] = { .type = NLA_NESTED }, 267051ebd318SNicolas Dichtel [RTA_MULTIPATH] = { .len = sizeof(struct rtnexthop) }, 2671c78ba6d6SLubomir Rintel [RTA_PREF] = { .type = NLA_U8 }, 267219e42e45SRoopa Prabhu [RTA_ENCAP_TYPE] = { .type = NLA_U16 }, 267319e42e45SRoopa Prabhu [RTA_ENCAP] = { .type = NLA_NESTED }, 267486872cb5SThomas Graf }; 267586872cb5SThomas Graf 267686872cb5SThomas Graf static int rtm_to_fib6_config(struct sk_buff *skb, struct nlmsghdr *nlh, 267786872cb5SThomas Graf struct fib6_config *cfg) 26781da177e4SLinus Torvalds { 267986872cb5SThomas Graf struct rtmsg *rtm; 268086872cb5SThomas Graf struct nlattr *tb[RTA_MAX+1]; 2681c78ba6d6SLubomir Rintel unsigned int pref; 268286872cb5SThomas Graf int err; 26831da177e4SLinus Torvalds 268486872cb5SThomas Graf err = nlmsg_parse(nlh, sizeof(*rtm), tb, RTA_MAX, rtm_ipv6_policy); 268586872cb5SThomas Graf if (err < 0) 268686872cb5SThomas Graf goto errout; 26871da177e4SLinus Torvalds 268886872cb5SThomas Graf err = -EINVAL; 268986872cb5SThomas Graf rtm = nlmsg_data(nlh); 269086872cb5SThomas Graf memset(cfg, 0, sizeof(*cfg)); 269186872cb5SThomas Graf 269286872cb5SThomas Graf cfg->fc_table = rtm->rtm_table; 269386872cb5SThomas Graf cfg->fc_dst_len = rtm->rtm_dst_len; 269486872cb5SThomas Graf cfg->fc_src_len = rtm->rtm_src_len; 269586872cb5SThomas Graf cfg->fc_flags = RTF_UP; 269686872cb5SThomas Graf cfg->fc_protocol = rtm->rtm_protocol; 2697ef2c7d7bSNicolas Dichtel cfg->fc_type = rtm->rtm_type; 269886872cb5SThomas Graf 2699ef2c7d7bSNicolas Dichtel if (rtm->rtm_type == RTN_UNREACHABLE || 2700ef2c7d7bSNicolas Dichtel rtm->rtm_type == RTN_BLACKHOLE || 2701b4949ab2SNicolas Dichtel rtm->rtm_type == RTN_PROHIBIT || 2702b4949ab2SNicolas Dichtel rtm->rtm_type == RTN_THROW) 270386872cb5SThomas Graf cfg->fc_flags |= RTF_REJECT; 270486872cb5SThomas Graf 2705ab79ad14SMaciej Żenczykowski if (rtm->rtm_type == RTN_LOCAL) 2706ab79ad14SMaciej Żenczykowski cfg->fc_flags |= RTF_LOCAL; 2707ab79ad14SMaciej Żenczykowski 27081f56a01fSMartin KaFai Lau if (rtm->rtm_flags & RTM_F_CLONED) 27091f56a01fSMartin KaFai Lau cfg->fc_flags |= RTF_CACHE; 27101f56a01fSMartin KaFai Lau 271115e47304SEric W. Biederman cfg->fc_nlinfo.portid = NETLINK_CB(skb).portid; 271286872cb5SThomas Graf cfg->fc_nlinfo.nlh = nlh; 27133b1e0a65SYOSHIFUJI Hideaki cfg->fc_nlinfo.nl_net = sock_net(skb->sk); 271486872cb5SThomas Graf 271586872cb5SThomas Graf if (tb[RTA_GATEWAY]) { 271667b61f6cSJiri Benc cfg->fc_gateway = nla_get_in6_addr(tb[RTA_GATEWAY]); 271786872cb5SThomas Graf cfg->fc_flags |= RTF_GATEWAY; 27181da177e4SLinus Torvalds } 271986872cb5SThomas Graf 272086872cb5SThomas Graf if (tb[RTA_DST]) { 272186872cb5SThomas Graf int plen = (rtm->rtm_dst_len + 7) >> 3; 272286872cb5SThomas Graf 272386872cb5SThomas Graf if (nla_len(tb[RTA_DST]) < plen) 272486872cb5SThomas Graf goto errout; 272586872cb5SThomas Graf 272686872cb5SThomas Graf nla_memcpy(&cfg->fc_dst, tb[RTA_DST], plen); 27271da177e4SLinus Torvalds } 272886872cb5SThomas Graf 272986872cb5SThomas Graf if (tb[RTA_SRC]) { 273086872cb5SThomas Graf int plen = (rtm->rtm_src_len + 7) >> 3; 273186872cb5SThomas Graf 273286872cb5SThomas Graf if (nla_len(tb[RTA_SRC]) < plen) 273386872cb5SThomas Graf goto errout; 273486872cb5SThomas Graf 273586872cb5SThomas Graf nla_memcpy(&cfg->fc_src, tb[RTA_SRC], plen); 27361da177e4SLinus Torvalds } 273786872cb5SThomas Graf 2738c3968a85SDaniel Walter if (tb[RTA_PREFSRC]) 273967b61f6cSJiri Benc cfg->fc_prefsrc = nla_get_in6_addr(tb[RTA_PREFSRC]); 2740c3968a85SDaniel Walter 274186872cb5SThomas Graf if (tb[RTA_OIF]) 274286872cb5SThomas Graf cfg->fc_ifindex = nla_get_u32(tb[RTA_OIF]); 274386872cb5SThomas Graf 274486872cb5SThomas Graf if (tb[RTA_PRIORITY]) 274586872cb5SThomas Graf cfg->fc_metric = nla_get_u32(tb[RTA_PRIORITY]); 274686872cb5SThomas Graf 274786872cb5SThomas Graf if (tb[RTA_METRICS]) { 274886872cb5SThomas Graf cfg->fc_mx = nla_data(tb[RTA_METRICS]); 274986872cb5SThomas Graf cfg->fc_mx_len = nla_len(tb[RTA_METRICS]); 27501da177e4SLinus Torvalds } 275186872cb5SThomas Graf 275286872cb5SThomas Graf if (tb[RTA_TABLE]) 275386872cb5SThomas Graf cfg->fc_table = nla_get_u32(tb[RTA_TABLE]); 275486872cb5SThomas Graf 275551ebd318SNicolas Dichtel if (tb[RTA_MULTIPATH]) { 275651ebd318SNicolas Dichtel cfg->fc_mp = nla_data(tb[RTA_MULTIPATH]); 275751ebd318SNicolas Dichtel cfg->fc_mp_len = nla_len(tb[RTA_MULTIPATH]); 275851ebd318SNicolas Dichtel } 275951ebd318SNicolas Dichtel 2760c78ba6d6SLubomir Rintel if (tb[RTA_PREF]) { 2761c78ba6d6SLubomir Rintel pref = nla_get_u8(tb[RTA_PREF]); 2762c78ba6d6SLubomir Rintel if (pref != ICMPV6_ROUTER_PREF_LOW && 2763c78ba6d6SLubomir Rintel pref != ICMPV6_ROUTER_PREF_HIGH) 2764c78ba6d6SLubomir Rintel pref = ICMPV6_ROUTER_PREF_MEDIUM; 2765c78ba6d6SLubomir Rintel cfg->fc_flags |= RTF_PREF(pref); 2766c78ba6d6SLubomir Rintel } 2767c78ba6d6SLubomir Rintel 276819e42e45SRoopa Prabhu if (tb[RTA_ENCAP]) 276919e42e45SRoopa Prabhu cfg->fc_encap = tb[RTA_ENCAP]; 277019e42e45SRoopa Prabhu 277119e42e45SRoopa Prabhu if (tb[RTA_ENCAP_TYPE]) 277219e42e45SRoopa Prabhu cfg->fc_encap_type = nla_get_u16(tb[RTA_ENCAP_TYPE]); 277319e42e45SRoopa Prabhu 277486872cb5SThomas Graf err = 0; 277586872cb5SThomas Graf errout: 277686872cb5SThomas Graf return err; 27771da177e4SLinus Torvalds } 27781da177e4SLinus Torvalds 277951ebd318SNicolas Dichtel static int ip6_route_multipath(struct fib6_config *cfg, int add) 278051ebd318SNicolas Dichtel { 278151ebd318SNicolas Dichtel struct fib6_config r_cfg; 278251ebd318SNicolas Dichtel struct rtnexthop *rtnh; 278351ebd318SNicolas Dichtel int remaining; 278451ebd318SNicolas Dichtel int attrlen; 278551ebd318SNicolas Dichtel int err = 0, last_err = 0; 278651ebd318SNicolas Dichtel 278735f1b4e9SMichal Kubeček remaining = cfg->fc_mp_len; 278851ebd318SNicolas Dichtel beginning: 278951ebd318SNicolas Dichtel rtnh = (struct rtnexthop *)cfg->fc_mp; 279051ebd318SNicolas Dichtel 279151ebd318SNicolas Dichtel /* Parse a Multipath Entry */ 279251ebd318SNicolas Dichtel while (rtnh_ok(rtnh, remaining)) { 279351ebd318SNicolas Dichtel memcpy(&r_cfg, cfg, sizeof(*cfg)); 279451ebd318SNicolas Dichtel if (rtnh->rtnh_ifindex) 279551ebd318SNicolas Dichtel r_cfg.fc_ifindex = rtnh->rtnh_ifindex; 279651ebd318SNicolas Dichtel 279751ebd318SNicolas Dichtel attrlen = rtnh_attrlen(rtnh); 279851ebd318SNicolas Dichtel if (attrlen > 0) { 279951ebd318SNicolas Dichtel struct nlattr *nla, *attrs = rtnh_attrs(rtnh); 280051ebd318SNicolas Dichtel 280151ebd318SNicolas Dichtel nla = nla_find(attrs, attrlen, RTA_GATEWAY); 280251ebd318SNicolas Dichtel if (nla) { 280367b61f6cSJiri Benc r_cfg.fc_gateway = nla_get_in6_addr(nla); 280451ebd318SNicolas Dichtel r_cfg.fc_flags |= RTF_GATEWAY; 280551ebd318SNicolas Dichtel } 280619e42e45SRoopa Prabhu r_cfg.fc_encap = nla_find(attrs, attrlen, RTA_ENCAP); 280719e42e45SRoopa Prabhu nla = nla_find(attrs, attrlen, RTA_ENCAP_TYPE); 280819e42e45SRoopa Prabhu if (nla) 280919e42e45SRoopa Prabhu r_cfg.fc_encap_type = nla_get_u16(nla); 281051ebd318SNicolas Dichtel } 281151ebd318SNicolas Dichtel err = add ? ip6_route_add(&r_cfg) : ip6_route_del(&r_cfg); 281251ebd318SNicolas Dichtel if (err) { 281351ebd318SNicolas Dichtel last_err = err; 281451ebd318SNicolas Dichtel /* If we are trying to remove a route, do not stop the 281551ebd318SNicolas Dichtel * loop when ip6_route_del() fails (because next hop is 281651ebd318SNicolas Dichtel * already gone), we should try to remove all next hops. 281751ebd318SNicolas Dichtel */ 281851ebd318SNicolas Dichtel if (add) { 281951ebd318SNicolas Dichtel /* If add fails, we should try to delete all 282051ebd318SNicolas Dichtel * next hops that have been already added. 282151ebd318SNicolas Dichtel */ 282251ebd318SNicolas Dichtel add = 0; 282335f1b4e9SMichal Kubeček remaining = cfg->fc_mp_len - remaining; 282451ebd318SNicolas Dichtel goto beginning; 282551ebd318SNicolas Dichtel } 282651ebd318SNicolas Dichtel } 28271a72418bSNicolas Dichtel /* Because each route is added like a single route we remove 282827596472SMichal Kubeček * these flags after the first nexthop: if there is a collision, 282927596472SMichal Kubeček * we have already failed to add the first nexthop: 283027596472SMichal Kubeček * fib6_add_rt2node() has rejected it; when replacing, old 283127596472SMichal Kubeček * nexthops have been replaced by first new, the rest should 283227596472SMichal Kubeček * be added to it. 28331a72418bSNicolas Dichtel */ 283427596472SMichal Kubeček cfg->fc_nlinfo.nlh->nlmsg_flags &= ~(NLM_F_EXCL | 283527596472SMichal Kubeček NLM_F_REPLACE); 283651ebd318SNicolas Dichtel rtnh = rtnh_next(rtnh, &remaining); 283751ebd318SNicolas Dichtel } 283851ebd318SNicolas Dichtel 283951ebd318SNicolas Dichtel return last_err; 284051ebd318SNicolas Dichtel } 284151ebd318SNicolas Dichtel 2842661d2967SThomas Graf static int inet6_rtm_delroute(struct sk_buff *skb, struct nlmsghdr *nlh) 28431da177e4SLinus Torvalds { 284486872cb5SThomas Graf struct fib6_config cfg; 284586872cb5SThomas Graf int err; 28461da177e4SLinus Torvalds 284786872cb5SThomas Graf err = rtm_to_fib6_config(skb, nlh, &cfg); 284886872cb5SThomas Graf if (err < 0) 284986872cb5SThomas Graf return err; 285086872cb5SThomas Graf 285151ebd318SNicolas Dichtel if (cfg.fc_mp) 285251ebd318SNicolas Dichtel return ip6_route_multipath(&cfg, 0); 285351ebd318SNicolas Dichtel else 285486872cb5SThomas Graf return ip6_route_del(&cfg); 28551da177e4SLinus Torvalds } 28561da177e4SLinus Torvalds 2857661d2967SThomas Graf static int inet6_rtm_newroute(struct sk_buff *skb, struct nlmsghdr *nlh) 28581da177e4SLinus Torvalds { 285986872cb5SThomas Graf struct fib6_config cfg; 286086872cb5SThomas Graf int err; 28611da177e4SLinus Torvalds 286286872cb5SThomas Graf err = rtm_to_fib6_config(skb, nlh, &cfg); 286386872cb5SThomas Graf if (err < 0) 286486872cb5SThomas Graf return err; 286586872cb5SThomas Graf 286651ebd318SNicolas Dichtel if (cfg.fc_mp) 286751ebd318SNicolas Dichtel return ip6_route_multipath(&cfg, 1); 286851ebd318SNicolas Dichtel else 286986872cb5SThomas Graf return ip6_route_add(&cfg); 28701da177e4SLinus Torvalds } 28711da177e4SLinus Torvalds 287219e42e45SRoopa Prabhu static inline size_t rt6_nlmsg_size(struct rt6_info *rt) 2873339bf98fSThomas Graf { 2874339bf98fSThomas Graf return NLMSG_ALIGN(sizeof(struct rtmsg)) 2875339bf98fSThomas Graf + nla_total_size(16) /* RTA_SRC */ 2876339bf98fSThomas Graf + nla_total_size(16) /* RTA_DST */ 2877339bf98fSThomas Graf + nla_total_size(16) /* RTA_GATEWAY */ 2878339bf98fSThomas Graf + nla_total_size(16) /* RTA_PREFSRC */ 2879339bf98fSThomas Graf + nla_total_size(4) /* RTA_TABLE */ 2880339bf98fSThomas Graf + nla_total_size(4) /* RTA_IIF */ 2881339bf98fSThomas Graf + nla_total_size(4) /* RTA_OIF */ 2882339bf98fSThomas Graf + nla_total_size(4) /* RTA_PRIORITY */ 28836a2b9ce0SNoriaki TAKAMIYA + RTAX_MAX * nla_total_size(4) /* RTA_METRICS */ 2884ea697639SDaniel Borkmann + nla_total_size(sizeof(struct rta_cacheinfo)) 2885c78ba6d6SLubomir Rintel + nla_total_size(TCP_CA_NAME_MAX) /* RTAX_CC_ALGO */ 288619e42e45SRoopa Prabhu + nla_total_size(1) /* RTA_PREF */ 288761adedf3SJiri Benc + lwtunnel_get_encap_size(rt->dst.lwtstate); 2888339bf98fSThomas Graf } 2889339bf98fSThomas Graf 2890191cd582SBrian Haley static int rt6_fill_node(struct net *net, 2891191cd582SBrian Haley struct sk_buff *skb, struct rt6_info *rt, 28920d51aa80SJamal Hadi Salim struct in6_addr *dst, struct in6_addr *src, 289315e47304SEric W. Biederman int iif, int type, u32 portid, u32 seq, 28947bc570c8SYOSHIFUJI Hideaki int prefix, int nowait, unsigned int flags) 28951da177e4SLinus Torvalds { 28964b32b5adSMartin KaFai Lau u32 metrics[RTAX_MAX]; 28971da177e4SLinus Torvalds struct rtmsg *rtm; 28981da177e4SLinus Torvalds struct nlmsghdr *nlh; 2899e3703b3dSThomas Graf long expires; 29009e762a4aSPatrick McHardy u32 table; 29011da177e4SLinus Torvalds 29021da177e4SLinus Torvalds if (prefix) { /* user wants prefix routes only */ 29031da177e4SLinus Torvalds if (!(rt->rt6i_flags & RTF_PREFIX_RT)) { 29041da177e4SLinus Torvalds /* success since this is not a prefix route */ 29051da177e4SLinus Torvalds return 1; 29061da177e4SLinus Torvalds } 29071da177e4SLinus Torvalds } 29081da177e4SLinus Torvalds 290915e47304SEric W. Biederman nlh = nlmsg_put(skb, portid, seq, type, sizeof(*rtm), flags); 291038308473SDavid S. Miller if (!nlh) 291126932566SPatrick McHardy return -EMSGSIZE; 29122d7202bfSThomas Graf 29132d7202bfSThomas Graf rtm = nlmsg_data(nlh); 29141da177e4SLinus Torvalds rtm->rtm_family = AF_INET6; 29151da177e4SLinus Torvalds rtm->rtm_dst_len = rt->rt6i_dst.plen; 29161da177e4SLinus Torvalds rtm->rtm_src_len = rt->rt6i_src.plen; 29171da177e4SLinus Torvalds rtm->rtm_tos = 0; 2918c71099acSThomas Graf if (rt->rt6i_table) 29199e762a4aSPatrick McHardy table = rt->rt6i_table->tb6_id; 2920c71099acSThomas Graf else 29219e762a4aSPatrick McHardy table = RT6_TABLE_UNSPEC; 29229e762a4aSPatrick McHardy rtm->rtm_table = table; 2923c78679e8SDavid S. Miller if (nla_put_u32(skb, RTA_TABLE, table)) 2924c78679e8SDavid S. Miller goto nla_put_failure; 2925ef2c7d7bSNicolas Dichtel if (rt->rt6i_flags & RTF_REJECT) { 2926ef2c7d7bSNicolas Dichtel switch (rt->dst.error) { 2927ef2c7d7bSNicolas Dichtel case -EINVAL: 2928ef2c7d7bSNicolas Dichtel rtm->rtm_type = RTN_BLACKHOLE; 2929ef2c7d7bSNicolas Dichtel break; 2930ef2c7d7bSNicolas Dichtel case -EACCES: 2931ef2c7d7bSNicolas Dichtel rtm->rtm_type = RTN_PROHIBIT; 2932ef2c7d7bSNicolas Dichtel break; 2933b4949ab2SNicolas Dichtel case -EAGAIN: 2934b4949ab2SNicolas Dichtel rtm->rtm_type = RTN_THROW; 2935b4949ab2SNicolas Dichtel break; 2936ef2c7d7bSNicolas Dichtel default: 29371da177e4SLinus Torvalds rtm->rtm_type = RTN_UNREACHABLE; 2938ef2c7d7bSNicolas Dichtel break; 2939ef2c7d7bSNicolas Dichtel } 2940ef2c7d7bSNicolas Dichtel } 2941ab79ad14SMaciej Żenczykowski else if (rt->rt6i_flags & RTF_LOCAL) 2942ab79ad14SMaciej Żenczykowski rtm->rtm_type = RTN_LOCAL; 2943d1918542SDavid S. Miller else if (rt->dst.dev && (rt->dst.dev->flags & IFF_LOOPBACK)) 29441da177e4SLinus Torvalds rtm->rtm_type = RTN_LOCAL; 29451da177e4SLinus Torvalds else 29461da177e4SLinus Torvalds rtm->rtm_type = RTN_UNICAST; 29471da177e4SLinus Torvalds rtm->rtm_flags = 0; 294835103d11SAndy Gospodarek if (!netif_carrier_ok(rt->dst.dev)) { 2949cea45e20SAndy Gospodarek rtm->rtm_flags |= RTNH_F_LINKDOWN; 295035103d11SAndy Gospodarek if (rt->rt6i_idev->cnf.ignore_routes_with_linkdown) 295135103d11SAndy Gospodarek rtm->rtm_flags |= RTNH_F_DEAD; 295235103d11SAndy Gospodarek } 29531da177e4SLinus Torvalds rtm->rtm_scope = RT_SCOPE_UNIVERSE; 29541da177e4SLinus Torvalds rtm->rtm_protocol = rt->rt6i_protocol; 29551da177e4SLinus Torvalds if (rt->rt6i_flags & RTF_DYNAMIC) 29561da177e4SLinus Torvalds rtm->rtm_protocol = RTPROT_REDIRECT; 2957f0396f60SDenis Ovsienko else if (rt->rt6i_flags & RTF_ADDRCONF) { 2958f0396f60SDenis Ovsienko if (rt->rt6i_flags & (RTF_DEFAULT | RTF_ROUTEINFO)) 29591da177e4SLinus Torvalds rtm->rtm_protocol = RTPROT_RA; 2960f0396f60SDenis Ovsienko else 2961f0396f60SDenis Ovsienko rtm->rtm_protocol = RTPROT_KERNEL; 2962f0396f60SDenis Ovsienko } 29631da177e4SLinus Torvalds 29641da177e4SLinus Torvalds if (rt->rt6i_flags & RTF_CACHE) 29651da177e4SLinus Torvalds rtm->rtm_flags |= RTM_F_CLONED; 29661da177e4SLinus Torvalds 29671da177e4SLinus Torvalds if (dst) { 2968930345eaSJiri Benc if (nla_put_in6_addr(skb, RTA_DST, dst)) 2969c78679e8SDavid S. Miller goto nla_put_failure; 29701da177e4SLinus Torvalds rtm->rtm_dst_len = 128; 29711da177e4SLinus Torvalds } else if (rtm->rtm_dst_len) 2972930345eaSJiri Benc if (nla_put_in6_addr(skb, RTA_DST, &rt->rt6i_dst.addr)) 2973c78679e8SDavid S. Miller goto nla_put_failure; 29741da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES 29751da177e4SLinus Torvalds if (src) { 2976930345eaSJiri Benc if (nla_put_in6_addr(skb, RTA_SRC, src)) 2977c78679e8SDavid S. Miller goto nla_put_failure; 29781da177e4SLinus Torvalds rtm->rtm_src_len = 128; 2979c78679e8SDavid S. Miller } else if (rtm->rtm_src_len && 2980930345eaSJiri Benc nla_put_in6_addr(skb, RTA_SRC, &rt->rt6i_src.addr)) 2981c78679e8SDavid S. Miller goto nla_put_failure; 29821da177e4SLinus Torvalds #endif 29837bc570c8SYOSHIFUJI Hideaki if (iif) { 29847bc570c8SYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_MROUTE 29857bc570c8SYOSHIFUJI Hideaki if (ipv6_addr_is_multicast(&rt->rt6i_dst.addr)) { 29868229efdaSBenjamin Thery int err = ip6mr_get_route(net, skb, rtm, nowait); 29877bc570c8SYOSHIFUJI Hideaki if (err <= 0) { 29887bc570c8SYOSHIFUJI Hideaki if (!nowait) { 29897bc570c8SYOSHIFUJI Hideaki if (err == 0) 29907bc570c8SYOSHIFUJI Hideaki return 0; 29917bc570c8SYOSHIFUJI Hideaki goto nla_put_failure; 29927bc570c8SYOSHIFUJI Hideaki } else { 29937bc570c8SYOSHIFUJI Hideaki if (err == -EMSGSIZE) 29947bc570c8SYOSHIFUJI Hideaki goto nla_put_failure; 29957bc570c8SYOSHIFUJI Hideaki } 29967bc570c8SYOSHIFUJI Hideaki } 29977bc570c8SYOSHIFUJI Hideaki } else 29987bc570c8SYOSHIFUJI Hideaki #endif 2999c78679e8SDavid S. Miller if (nla_put_u32(skb, RTA_IIF, iif)) 3000c78679e8SDavid S. Miller goto nla_put_failure; 30017bc570c8SYOSHIFUJI Hideaki } else if (dst) { 30021da177e4SLinus Torvalds struct in6_addr saddr_buf; 3003c78679e8SDavid S. Miller if (ip6_route_get_saddr(net, rt, dst, 0, &saddr_buf) == 0 && 3004930345eaSJiri Benc nla_put_in6_addr(skb, RTA_PREFSRC, &saddr_buf)) 3005c78679e8SDavid S. Miller goto nla_put_failure; 3006c3968a85SDaniel Walter } 3007c3968a85SDaniel Walter 3008c3968a85SDaniel Walter if (rt->rt6i_prefsrc.plen) { 3009c3968a85SDaniel Walter struct in6_addr saddr_buf; 30104e3fd7a0SAlexey Dobriyan saddr_buf = rt->rt6i_prefsrc.addr; 3011930345eaSJiri Benc if (nla_put_in6_addr(skb, RTA_PREFSRC, &saddr_buf)) 3012c78679e8SDavid S. Miller goto nla_put_failure; 30131da177e4SLinus Torvalds } 30142d7202bfSThomas Graf 30154b32b5adSMartin KaFai Lau memcpy(metrics, dst_metrics_ptr(&rt->dst), sizeof(metrics)); 30164b32b5adSMartin KaFai Lau if (rt->rt6i_pmtu) 30174b32b5adSMartin KaFai Lau metrics[RTAX_MTU - 1] = rt->rt6i_pmtu; 30184b32b5adSMartin KaFai Lau if (rtnetlink_put_metrics(skb, metrics) < 0) 30192d7202bfSThomas Graf goto nla_put_failure; 30202d7202bfSThomas Graf 3021dd0cbf29SYOSHIFUJI Hideaki / 吉藤英明 if (rt->rt6i_flags & RTF_GATEWAY) { 3022930345eaSJiri Benc if (nla_put_in6_addr(skb, RTA_GATEWAY, &rt->rt6i_gateway) < 0) 302394f826b8SEric Dumazet goto nla_put_failure; 302494f826b8SEric Dumazet } 30252d7202bfSThomas Graf 3026c78679e8SDavid S. Miller if (rt->dst.dev && 3027c78679e8SDavid S. Miller nla_put_u32(skb, RTA_OIF, rt->dst.dev->ifindex)) 3028c78679e8SDavid S. Miller goto nla_put_failure; 3029c78679e8SDavid S. Miller if (nla_put_u32(skb, RTA_PRIORITY, rt->rt6i_metric)) 3030c78679e8SDavid S. Miller goto nla_put_failure; 30318253947eSLi Wei 30328253947eSLi Wei expires = (rt->rt6i_flags & RTF_EXPIRES) ? rt->dst.expires - jiffies : 0; 303369cdf8f9SYOSHIFUJI Hideaki 303487a50699SDavid S. Miller if (rtnl_put_cacheinfo(skb, &rt->dst, 0, expires, rt->dst.error) < 0) 3035e3703b3dSThomas Graf goto nla_put_failure; 30361da177e4SLinus Torvalds 3037c78ba6d6SLubomir Rintel if (nla_put_u8(skb, RTA_PREF, IPV6_EXTRACT_PREF(rt->rt6i_flags))) 3038c78ba6d6SLubomir Rintel goto nla_put_failure; 3039c78ba6d6SLubomir Rintel 304061adedf3SJiri Benc lwtunnel_fill_encap(skb, rt->dst.lwtstate); 304119e42e45SRoopa Prabhu 3042053c095aSJohannes Berg nlmsg_end(skb, nlh); 3043053c095aSJohannes Berg return 0; 30442d7202bfSThomas Graf 30452d7202bfSThomas Graf nla_put_failure: 304626932566SPatrick McHardy nlmsg_cancel(skb, nlh); 304726932566SPatrick McHardy return -EMSGSIZE; 30481da177e4SLinus Torvalds } 30491da177e4SLinus Torvalds 30501b43af54SPatrick McHardy int rt6_dump_route(struct rt6_info *rt, void *p_arg) 30511da177e4SLinus Torvalds { 30521da177e4SLinus Torvalds struct rt6_rtnl_dump_arg *arg = (struct rt6_rtnl_dump_arg *) p_arg; 30531da177e4SLinus Torvalds int prefix; 30541da177e4SLinus Torvalds 30552d7202bfSThomas Graf if (nlmsg_len(arg->cb->nlh) >= sizeof(struct rtmsg)) { 30562d7202bfSThomas Graf struct rtmsg *rtm = nlmsg_data(arg->cb->nlh); 30571da177e4SLinus Torvalds prefix = (rtm->rtm_flags & RTM_F_PREFIX) != 0; 30581da177e4SLinus Torvalds } else 30591da177e4SLinus Torvalds prefix = 0; 30601da177e4SLinus Torvalds 3061191cd582SBrian Haley return rt6_fill_node(arg->net, 3062191cd582SBrian Haley arg->skb, rt, NULL, NULL, 0, RTM_NEWROUTE, 306315e47304SEric W. Biederman NETLINK_CB(arg->cb->skb).portid, arg->cb->nlh->nlmsg_seq, 30647bc570c8SYOSHIFUJI Hideaki prefix, 0, NLM_F_MULTI); 30651da177e4SLinus Torvalds } 30661da177e4SLinus Torvalds 3067661d2967SThomas Graf static int inet6_rtm_getroute(struct sk_buff *in_skb, struct nlmsghdr *nlh) 30681da177e4SLinus Torvalds { 30693b1e0a65SYOSHIFUJI Hideaki struct net *net = sock_net(in_skb->sk); 3070ab364a6fSThomas Graf struct nlattr *tb[RTA_MAX+1]; 30711da177e4SLinus Torvalds struct rt6_info *rt; 3072ab364a6fSThomas Graf struct sk_buff *skb; 3073ab364a6fSThomas Graf struct rtmsg *rtm; 30744c9483b2SDavid S. Miller struct flowi6 fl6; 307572331bc0SShmulik Ladkani int err, iif = 0, oif = 0; 3076ab364a6fSThomas Graf 3077ab364a6fSThomas Graf err = nlmsg_parse(nlh, sizeof(*rtm), tb, RTA_MAX, rtm_ipv6_policy); 3078ab364a6fSThomas Graf if (err < 0) 3079ab364a6fSThomas Graf goto errout; 3080ab364a6fSThomas Graf 3081ab364a6fSThomas Graf err = -EINVAL; 30824c9483b2SDavid S. Miller memset(&fl6, 0, sizeof(fl6)); 3083ab364a6fSThomas Graf 3084ab364a6fSThomas Graf if (tb[RTA_SRC]) { 3085ab364a6fSThomas Graf if (nla_len(tb[RTA_SRC]) < sizeof(struct in6_addr)) 3086ab364a6fSThomas Graf goto errout; 3087ab364a6fSThomas Graf 30884e3fd7a0SAlexey Dobriyan fl6.saddr = *(struct in6_addr *)nla_data(tb[RTA_SRC]); 3089ab364a6fSThomas Graf } 3090ab364a6fSThomas Graf 3091ab364a6fSThomas Graf if (tb[RTA_DST]) { 3092ab364a6fSThomas Graf if (nla_len(tb[RTA_DST]) < sizeof(struct in6_addr)) 3093ab364a6fSThomas Graf goto errout; 3094ab364a6fSThomas Graf 30954e3fd7a0SAlexey Dobriyan fl6.daddr = *(struct in6_addr *)nla_data(tb[RTA_DST]); 3096ab364a6fSThomas Graf } 3097ab364a6fSThomas Graf 3098ab364a6fSThomas Graf if (tb[RTA_IIF]) 3099ab364a6fSThomas Graf iif = nla_get_u32(tb[RTA_IIF]); 3100ab364a6fSThomas Graf 3101ab364a6fSThomas Graf if (tb[RTA_OIF]) 310272331bc0SShmulik Ladkani oif = nla_get_u32(tb[RTA_OIF]); 3103ab364a6fSThomas Graf 31042e47b291SLorenzo Colitti if (tb[RTA_MARK]) 31052e47b291SLorenzo Colitti fl6.flowi6_mark = nla_get_u32(tb[RTA_MARK]); 31062e47b291SLorenzo Colitti 3107ab364a6fSThomas Graf if (iif) { 3108ab364a6fSThomas Graf struct net_device *dev; 310972331bc0SShmulik Ladkani int flags = 0; 311072331bc0SShmulik Ladkani 31115578689aSDaniel Lezcano dev = __dev_get_by_index(net, iif); 3112ab364a6fSThomas Graf if (!dev) { 3113ab364a6fSThomas Graf err = -ENODEV; 3114ab364a6fSThomas Graf goto errout; 3115ab364a6fSThomas Graf } 311672331bc0SShmulik Ladkani 311772331bc0SShmulik Ladkani fl6.flowi6_iif = iif; 311872331bc0SShmulik Ladkani 311972331bc0SShmulik Ladkani if (!ipv6_addr_any(&fl6.saddr)) 312072331bc0SShmulik Ladkani flags |= RT6_LOOKUP_F_HAS_SADDR; 312172331bc0SShmulik Ladkani 312272331bc0SShmulik Ladkani rt = (struct rt6_info *)ip6_route_input_lookup(net, dev, &fl6, 312372331bc0SShmulik Ladkani flags); 312472331bc0SShmulik Ladkani } else { 312572331bc0SShmulik Ladkani fl6.flowi6_oif = oif; 312672331bc0SShmulik Ladkani 312772331bc0SShmulik Ladkani rt = (struct rt6_info *)ip6_route_output(net, NULL, &fl6); 3128ab364a6fSThomas Graf } 31291da177e4SLinus Torvalds 31301da177e4SLinus Torvalds skb = alloc_skb(NLMSG_GOODSIZE, GFP_KERNEL); 313138308473SDavid S. Miller if (!skb) { 313294e187c0SAmerigo Wang ip6_rt_put(rt); 3133ab364a6fSThomas Graf err = -ENOBUFS; 3134ab364a6fSThomas Graf goto errout; 3135ab364a6fSThomas Graf } 31361da177e4SLinus Torvalds 31371da177e4SLinus Torvalds /* Reserve room for dummy headers, this skb can pass 31381da177e4SLinus Torvalds through good chunk of routing engine. 31391da177e4SLinus Torvalds */ 3140459a98edSArnaldo Carvalho de Melo skb_reset_mac_header(skb); 31411da177e4SLinus Torvalds skb_reserve(skb, MAX_HEADER + sizeof(struct ipv6hdr)); 31421da177e4SLinus Torvalds 3143d8d1f30bSChangli Gao skb_dst_set(skb, &rt->dst); 31441da177e4SLinus Torvalds 31454c9483b2SDavid S. Miller err = rt6_fill_node(net, skb, rt, &fl6.daddr, &fl6.saddr, iif, 314615e47304SEric W. Biederman RTM_NEWROUTE, NETLINK_CB(in_skb).portid, 31477bc570c8SYOSHIFUJI Hideaki nlh->nlmsg_seq, 0, 0, 0); 31481da177e4SLinus Torvalds if (err < 0) { 3149ab364a6fSThomas Graf kfree_skb(skb); 3150ab364a6fSThomas Graf goto errout; 31511da177e4SLinus Torvalds } 31521da177e4SLinus Torvalds 315315e47304SEric W. Biederman err = rtnl_unicast(skb, net, NETLINK_CB(in_skb).portid); 3154ab364a6fSThomas Graf errout: 31551da177e4SLinus Torvalds return err; 31561da177e4SLinus Torvalds } 31571da177e4SLinus Torvalds 315886872cb5SThomas Graf void inet6_rt_notify(int event, struct rt6_info *rt, struct nl_info *info) 31591da177e4SLinus Torvalds { 31601da177e4SLinus Torvalds struct sk_buff *skb; 31615578689aSDaniel Lezcano struct net *net = info->nl_net; 3162528c4cebSDenis V. Lunev u32 seq; 3163528c4cebSDenis V. Lunev int err; 31640d51aa80SJamal Hadi Salim 3165528c4cebSDenis V. Lunev err = -ENOBUFS; 316638308473SDavid S. Miller seq = info->nlh ? info->nlh->nlmsg_seq : 0; 316786872cb5SThomas Graf 316819e42e45SRoopa Prabhu skb = nlmsg_new(rt6_nlmsg_size(rt), gfp_any()); 316938308473SDavid S. Miller if (!skb) 317021713ebcSThomas Graf goto errout; 31711da177e4SLinus Torvalds 3172191cd582SBrian Haley err = rt6_fill_node(net, skb, rt, NULL, NULL, 0, 317315e47304SEric W. Biederman event, info->portid, seq, 0, 0, 0); 317426932566SPatrick McHardy if (err < 0) { 317526932566SPatrick McHardy /* -EMSGSIZE implies BUG in rt6_nlmsg_size() */ 317626932566SPatrick McHardy WARN_ON(err == -EMSGSIZE); 317726932566SPatrick McHardy kfree_skb(skb); 317826932566SPatrick McHardy goto errout; 317926932566SPatrick McHardy } 318015e47304SEric W. Biederman rtnl_notify(skb, net, info->portid, RTNLGRP_IPV6_ROUTE, 31815578689aSDaniel Lezcano info->nlh, gfp_any()); 31821ce85fe4SPablo Neira Ayuso return; 318321713ebcSThomas Graf errout: 318421713ebcSThomas Graf if (err < 0) 31855578689aSDaniel Lezcano rtnl_set_sk_err(net, RTNLGRP_IPV6_ROUTE, err); 31861da177e4SLinus Torvalds } 31871da177e4SLinus Torvalds 31888ed67789SDaniel Lezcano static int ip6_route_dev_notify(struct notifier_block *this, 3189351638e7SJiri Pirko unsigned long event, void *ptr) 31908ed67789SDaniel Lezcano { 3191351638e7SJiri Pirko struct net_device *dev = netdev_notifier_info_to_dev(ptr); 3192c346dca1SYOSHIFUJI Hideaki struct net *net = dev_net(dev); 31938ed67789SDaniel Lezcano 31948ed67789SDaniel Lezcano if (event == NETDEV_REGISTER && (dev->flags & IFF_LOOPBACK)) { 3195d8d1f30bSChangli Gao net->ipv6.ip6_null_entry->dst.dev = dev; 31968ed67789SDaniel Lezcano net->ipv6.ip6_null_entry->rt6i_idev = in6_dev_get(dev); 31978ed67789SDaniel Lezcano #ifdef CONFIG_IPV6_MULTIPLE_TABLES 3198d8d1f30bSChangli Gao net->ipv6.ip6_prohibit_entry->dst.dev = dev; 31998ed67789SDaniel Lezcano net->ipv6.ip6_prohibit_entry->rt6i_idev = in6_dev_get(dev); 3200d8d1f30bSChangli Gao net->ipv6.ip6_blk_hole_entry->dst.dev = dev; 32018ed67789SDaniel Lezcano net->ipv6.ip6_blk_hole_entry->rt6i_idev = in6_dev_get(dev); 32028ed67789SDaniel Lezcano #endif 32038ed67789SDaniel Lezcano } 32048ed67789SDaniel Lezcano 32058ed67789SDaniel Lezcano return NOTIFY_OK; 32068ed67789SDaniel Lezcano } 32078ed67789SDaniel Lezcano 32081da177e4SLinus Torvalds /* 32091da177e4SLinus Torvalds * /proc 32101da177e4SLinus Torvalds */ 32111da177e4SLinus Torvalds 32121da177e4SLinus Torvalds #ifdef CONFIG_PROC_FS 32131da177e4SLinus Torvalds 321433120b30SAlexey Dobriyan static const struct file_operations ipv6_route_proc_fops = { 321533120b30SAlexey Dobriyan .owner = THIS_MODULE, 321633120b30SAlexey Dobriyan .open = ipv6_route_open, 321733120b30SAlexey Dobriyan .read = seq_read, 321833120b30SAlexey Dobriyan .llseek = seq_lseek, 32198d2ca1d7SHannes Frederic Sowa .release = seq_release_net, 322033120b30SAlexey Dobriyan }; 322133120b30SAlexey Dobriyan 32221da177e4SLinus Torvalds static int rt6_stats_seq_show(struct seq_file *seq, void *v) 32231da177e4SLinus Torvalds { 322469ddb805SDaniel Lezcano struct net *net = (struct net *)seq->private; 32251da177e4SLinus Torvalds seq_printf(seq, "%04x %04x %04x %04x %04x %04x %04x\n", 322669ddb805SDaniel Lezcano net->ipv6.rt6_stats->fib_nodes, 322769ddb805SDaniel Lezcano net->ipv6.rt6_stats->fib_route_nodes, 322869ddb805SDaniel Lezcano net->ipv6.rt6_stats->fib_rt_alloc, 322969ddb805SDaniel Lezcano net->ipv6.rt6_stats->fib_rt_entries, 323069ddb805SDaniel Lezcano net->ipv6.rt6_stats->fib_rt_cache, 3231fc66f95cSEric Dumazet dst_entries_get_slow(&net->ipv6.ip6_dst_ops), 323269ddb805SDaniel Lezcano net->ipv6.rt6_stats->fib_discarded_routes); 32331da177e4SLinus Torvalds 32341da177e4SLinus Torvalds return 0; 32351da177e4SLinus Torvalds } 32361da177e4SLinus Torvalds 32371da177e4SLinus Torvalds static int rt6_stats_seq_open(struct inode *inode, struct file *file) 32381da177e4SLinus Torvalds { 3239de05c557SPavel Emelyanov return single_open_net(inode, file, rt6_stats_seq_show); 324069ddb805SDaniel Lezcano } 324169ddb805SDaniel Lezcano 32429a32144eSArjan van de Ven static const struct file_operations rt6_stats_seq_fops = { 32431da177e4SLinus Torvalds .owner = THIS_MODULE, 32441da177e4SLinus Torvalds .open = rt6_stats_seq_open, 32451da177e4SLinus Torvalds .read = seq_read, 32461da177e4SLinus Torvalds .llseek = seq_lseek, 3247b6fcbdb4SPavel Emelyanov .release = single_release_net, 32481da177e4SLinus Torvalds }; 32491da177e4SLinus Torvalds #endif /* CONFIG_PROC_FS */ 32501da177e4SLinus Torvalds 32511da177e4SLinus Torvalds #ifdef CONFIG_SYSCTL 32521da177e4SLinus Torvalds 32531da177e4SLinus Torvalds static 3254fe2c6338SJoe Perches int ipv6_sysctl_rtcache_flush(struct ctl_table *ctl, int write, 32551da177e4SLinus Torvalds void __user *buffer, size_t *lenp, loff_t *ppos) 32561da177e4SLinus Torvalds { 3257c486da34SLucian Adrian Grijincu struct net *net; 3258c486da34SLucian Adrian Grijincu int delay; 3259c486da34SLucian Adrian Grijincu if (!write) 3260c486da34SLucian Adrian Grijincu return -EINVAL; 3261c486da34SLucian Adrian Grijincu 3262c486da34SLucian Adrian Grijincu net = (struct net *)ctl->extra1; 3263c486da34SLucian Adrian Grijincu delay = net->ipv6.sysctl.flush_delay; 32648d65af78SAlexey Dobriyan proc_dointvec(ctl, write, buffer, lenp, ppos); 32652ac3ac8fSMichal Kubeček fib6_run_gc(delay <= 0 ? 0 : (unsigned long)delay, net, delay > 0); 32661da177e4SLinus Torvalds return 0; 32671da177e4SLinus Torvalds } 32681da177e4SLinus Torvalds 3269fe2c6338SJoe Perches struct ctl_table ipv6_route_table_template[] = { 32701da177e4SLinus Torvalds { 32711da177e4SLinus Torvalds .procname = "flush", 32724990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.flush_delay, 32731da177e4SLinus Torvalds .maxlen = sizeof(int), 327489c8b3a1SDave Jones .mode = 0200, 32756d9f239aSAlexey Dobriyan .proc_handler = ipv6_sysctl_rtcache_flush 32761da177e4SLinus Torvalds }, 32771da177e4SLinus Torvalds { 32781da177e4SLinus Torvalds .procname = "gc_thresh", 32799a7ec3a9SDaniel Lezcano .data = &ip6_dst_ops_template.gc_thresh, 32801da177e4SLinus Torvalds .maxlen = sizeof(int), 32811da177e4SLinus Torvalds .mode = 0644, 32826d9f239aSAlexey Dobriyan .proc_handler = proc_dointvec, 32831da177e4SLinus Torvalds }, 32841da177e4SLinus Torvalds { 32851da177e4SLinus Torvalds .procname = "max_size", 32864990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.ip6_rt_max_size, 32871da177e4SLinus Torvalds .maxlen = sizeof(int), 32881da177e4SLinus Torvalds .mode = 0644, 32896d9f239aSAlexey Dobriyan .proc_handler = proc_dointvec, 32901da177e4SLinus Torvalds }, 32911da177e4SLinus Torvalds { 32921da177e4SLinus Torvalds .procname = "gc_min_interval", 32934990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.ip6_rt_gc_min_interval, 32941da177e4SLinus Torvalds .maxlen = sizeof(int), 32951da177e4SLinus Torvalds .mode = 0644, 32966d9f239aSAlexey Dobriyan .proc_handler = proc_dointvec_jiffies, 32971da177e4SLinus Torvalds }, 32981da177e4SLinus Torvalds { 32991da177e4SLinus Torvalds .procname = "gc_timeout", 33004990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.ip6_rt_gc_timeout, 33011da177e4SLinus Torvalds .maxlen = sizeof(int), 33021da177e4SLinus Torvalds .mode = 0644, 33036d9f239aSAlexey Dobriyan .proc_handler = proc_dointvec_jiffies, 33041da177e4SLinus Torvalds }, 33051da177e4SLinus Torvalds { 33061da177e4SLinus Torvalds .procname = "gc_interval", 33074990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.ip6_rt_gc_interval, 33081da177e4SLinus Torvalds .maxlen = sizeof(int), 33091da177e4SLinus Torvalds .mode = 0644, 33106d9f239aSAlexey Dobriyan .proc_handler = proc_dointvec_jiffies, 33111da177e4SLinus Torvalds }, 33121da177e4SLinus Torvalds { 33131da177e4SLinus Torvalds .procname = "gc_elasticity", 33144990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.ip6_rt_gc_elasticity, 33151da177e4SLinus Torvalds .maxlen = sizeof(int), 33161da177e4SLinus Torvalds .mode = 0644, 3317f3d3f616SMin Zhang .proc_handler = proc_dointvec, 33181da177e4SLinus Torvalds }, 33191da177e4SLinus Torvalds { 33201da177e4SLinus Torvalds .procname = "mtu_expires", 33214990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.ip6_rt_mtu_expires, 33221da177e4SLinus Torvalds .maxlen = sizeof(int), 33231da177e4SLinus Torvalds .mode = 0644, 33246d9f239aSAlexey Dobriyan .proc_handler = proc_dointvec_jiffies, 33251da177e4SLinus Torvalds }, 33261da177e4SLinus Torvalds { 33271da177e4SLinus Torvalds .procname = "min_adv_mss", 33284990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.ip6_rt_min_advmss, 33291da177e4SLinus Torvalds .maxlen = sizeof(int), 33301da177e4SLinus Torvalds .mode = 0644, 3331f3d3f616SMin Zhang .proc_handler = proc_dointvec, 33321da177e4SLinus Torvalds }, 33331da177e4SLinus Torvalds { 33341da177e4SLinus Torvalds .procname = "gc_min_interval_ms", 33354990509fSDaniel Lezcano .data = &init_net.ipv6.sysctl.ip6_rt_gc_min_interval, 33361da177e4SLinus Torvalds .maxlen = sizeof(int), 33371da177e4SLinus Torvalds .mode = 0644, 33386d9f239aSAlexey Dobriyan .proc_handler = proc_dointvec_ms_jiffies, 33391da177e4SLinus Torvalds }, 3340f8572d8fSEric W. Biederman { } 33411da177e4SLinus Torvalds }; 33421da177e4SLinus Torvalds 33432c8c1e72SAlexey Dobriyan struct ctl_table * __net_init ipv6_route_sysctl_init(struct net *net) 3344760f2d01SDaniel Lezcano { 3345760f2d01SDaniel Lezcano struct ctl_table *table; 3346760f2d01SDaniel Lezcano 3347760f2d01SDaniel Lezcano table = kmemdup(ipv6_route_table_template, 3348760f2d01SDaniel Lezcano sizeof(ipv6_route_table_template), 3349760f2d01SDaniel Lezcano GFP_KERNEL); 33505ee09105SYOSHIFUJI Hideaki 33515ee09105SYOSHIFUJI Hideaki if (table) { 33525ee09105SYOSHIFUJI Hideaki table[0].data = &net->ipv6.sysctl.flush_delay; 3353c486da34SLucian Adrian Grijincu table[0].extra1 = net; 335486393e52SAlexey Dobriyan table[1].data = &net->ipv6.ip6_dst_ops.gc_thresh; 33555ee09105SYOSHIFUJI Hideaki table[2].data = &net->ipv6.sysctl.ip6_rt_max_size; 33565ee09105SYOSHIFUJI Hideaki table[3].data = &net->ipv6.sysctl.ip6_rt_gc_min_interval; 33575ee09105SYOSHIFUJI Hideaki table[4].data = &net->ipv6.sysctl.ip6_rt_gc_timeout; 33585ee09105SYOSHIFUJI Hideaki table[5].data = &net->ipv6.sysctl.ip6_rt_gc_interval; 33595ee09105SYOSHIFUJI Hideaki table[6].data = &net->ipv6.sysctl.ip6_rt_gc_elasticity; 33605ee09105SYOSHIFUJI Hideaki table[7].data = &net->ipv6.sysctl.ip6_rt_mtu_expires; 33615ee09105SYOSHIFUJI Hideaki table[8].data = &net->ipv6.sysctl.ip6_rt_min_advmss; 33629c69fabeSAlexey Dobriyan table[9].data = &net->ipv6.sysctl.ip6_rt_gc_min_interval; 3363464dc801SEric W. Biederman 3364464dc801SEric W. Biederman /* Don't export sysctls to unprivileged users */ 3365464dc801SEric W. Biederman if (net->user_ns != &init_user_ns) 3366464dc801SEric W. Biederman table[0].procname = NULL; 33675ee09105SYOSHIFUJI Hideaki } 33685ee09105SYOSHIFUJI Hideaki 3369760f2d01SDaniel Lezcano return table; 3370760f2d01SDaniel Lezcano } 33711da177e4SLinus Torvalds #endif 33721da177e4SLinus Torvalds 33732c8c1e72SAlexey Dobriyan static int __net_init ip6_route_net_init(struct net *net) 3374cdb18761SDaniel Lezcano { 3375633d424bSPavel Emelyanov int ret = -ENOMEM; 33768ed67789SDaniel Lezcano 337786393e52SAlexey Dobriyan memcpy(&net->ipv6.ip6_dst_ops, &ip6_dst_ops_template, 337886393e52SAlexey Dobriyan sizeof(net->ipv6.ip6_dst_ops)); 3379f2fc6a54SBenjamin Thery 3380fc66f95cSEric Dumazet if (dst_entries_init(&net->ipv6.ip6_dst_ops) < 0) 3381fc66f95cSEric Dumazet goto out_ip6_dst_ops; 3382fc66f95cSEric Dumazet 33838ed67789SDaniel Lezcano net->ipv6.ip6_null_entry = kmemdup(&ip6_null_entry_template, 33848ed67789SDaniel Lezcano sizeof(*net->ipv6.ip6_null_entry), 33858ed67789SDaniel Lezcano GFP_KERNEL); 33868ed67789SDaniel Lezcano if (!net->ipv6.ip6_null_entry) 3387fc66f95cSEric Dumazet goto out_ip6_dst_entries; 3388d8d1f30bSChangli Gao net->ipv6.ip6_null_entry->dst.path = 33898ed67789SDaniel Lezcano (struct dst_entry *)net->ipv6.ip6_null_entry; 3390d8d1f30bSChangli Gao net->ipv6.ip6_null_entry->dst.ops = &net->ipv6.ip6_dst_ops; 339162fa8a84SDavid S. Miller dst_init_metrics(&net->ipv6.ip6_null_entry->dst, 339262fa8a84SDavid S. Miller ip6_template_metrics, true); 33938ed67789SDaniel Lezcano 33948ed67789SDaniel Lezcano #ifdef CONFIG_IPV6_MULTIPLE_TABLES 33958ed67789SDaniel Lezcano net->ipv6.ip6_prohibit_entry = kmemdup(&ip6_prohibit_entry_template, 33968ed67789SDaniel Lezcano sizeof(*net->ipv6.ip6_prohibit_entry), 33978ed67789SDaniel Lezcano GFP_KERNEL); 339868fffc67SPeter Zijlstra if (!net->ipv6.ip6_prohibit_entry) 339968fffc67SPeter Zijlstra goto out_ip6_null_entry; 3400d8d1f30bSChangli Gao net->ipv6.ip6_prohibit_entry->dst.path = 34018ed67789SDaniel Lezcano (struct dst_entry *)net->ipv6.ip6_prohibit_entry; 3402d8d1f30bSChangli Gao net->ipv6.ip6_prohibit_entry->dst.ops = &net->ipv6.ip6_dst_ops; 340362fa8a84SDavid S. Miller dst_init_metrics(&net->ipv6.ip6_prohibit_entry->dst, 340462fa8a84SDavid S. Miller ip6_template_metrics, true); 34058ed67789SDaniel Lezcano 34068ed67789SDaniel Lezcano net->ipv6.ip6_blk_hole_entry = kmemdup(&ip6_blk_hole_entry_template, 34078ed67789SDaniel Lezcano sizeof(*net->ipv6.ip6_blk_hole_entry), 34088ed67789SDaniel Lezcano GFP_KERNEL); 340968fffc67SPeter Zijlstra if (!net->ipv6.ip6_blk_hole_entry) 341068fffc67SPeter Zijlstra goto out_ip6_prohibit_entry; 3411d8d1f30bSChangli Gao net->ipv6.ip6_blk_hole_entry->dst.path = 34128ed67789SDaniel Lezcano (struct dst_entry *)net->ipv6.ip6_blk_hole_entry; 3413d8d1f30bSChangli Gao net->ipv6.ip6_blk_hole_entry->dst.ops = &net->ipv6.ip6_dst_ops; 341462fa8a84SDavid S. Miller dst_init_metrics(&net->ipv6.ip6_blk_hole_entry->dst, 341562fa8a84SDavid S. Miller ip6_template_metrics, true); 34168ed67789SDaniel Lezcano #endif 34178ed67789SDaniel Lezcano 3418b339a47cSPeter Zijlstra net->ipv6.sysctl.flush_delay = 0; 3419b339a47cSPeter Zijlstra net->ipv6.sysctl.ip6_rt_max_size = 4096; 3420b339a47cSPeter Zijlstra net->ipv6.sysctl.ip6_rt_gc_min_interval = HZ / 2; 3421b339a47cSPeter Zijlstra net->ipv6.sysctl.ip6_rt_gc_timeout = 60*HZ; 3422b339a47cSPeter Zijlstra net->ipv6.sysctl.ip6_rt_gc_interval = 30*HZ; 3423b339a47cSPeter Zijlstra net->ipv6.sysctl.ip6_rt_gc_elasticity = 9; 3424b339a47cSPeter Zijlstra net->ipv6.sysctl.ip6_rt_mtu_expires = 10*60*HZ; 3425b339a47cSPeter Zijlstra net->ipv6.sysctl.ip6_rt_min_advmss = IPV6_MIN_MTU - 20 - 40; 3426b339a47cSPeter Zijlstra 34276891a346SBenjamin Thery net->ipv6.ip6_rt_gc_expire = 30*HZ; 34286891a346SBenjamin Thery 34298ed67789SDaniel Lezcano ret = 0; 34308ed67789SDaniel Lezcano out: 34318ed67789SDaniel Lezcano return ret; 3432f2fc6a54SBenjamin Thery 343368fffc67SPeter Zijlstra #ifdef CONFIG_IPV6_MULTIPLE_TABLES 343468fffc67SPeter Zijlstra out_ip6_prohibit_entry: 343568fffc67SPeter Zijlstra kfree(net->ipv6.ip6_prohibit_entry); 343668fffc67SPeter Zijlstra out_ip6_null_entry: 343768fffc67SPeter Zijlstra kfree(net->ipv6.ip6_null_entry); 343868fffc67SPeter Zijlstra #endif 3439fc66f95cSEric Dumazet out_ip6_dst_entries: 3440fc66f95cSEric Dumazet dst_entries_destroy(&net->ipv6.ip6_dst_ops); 3441f2fc6a54SBenjamin Thery out_ip6_dst_ops: 3442f2fc6a54SBenjamin Thery goto out; 3443cdb18761SDaniel Lezcano } 3444cdb18761SDaniel Lezcano 34452c8c1e72SAlexey Dobriyan static void __net_exit ip6_route_net_exit(struct net *net) 3446cdb18761SDaniel Lezcano { 34478ed67789SDaniel Lezcano kfree(net->ipv6.ip6_null_entry); 34488ed67789SDaniel Lezcano #ifdef CONFIG_IPV6_MULTIPLE_TABLES 34498ed67789SDaniel Lezcano kfree(net->ipv6.ip6_prohibit_entry); 34508ed67789SDaniel Lezcano kfree(net->ipv6.ip6_blk_hole_entry); 34518ed67789SDaniel Lezcano #endif 345241bb78b4SXiaotian Feng dst_entries_destroy(&net->ipv6.ip6_dst_ops); 3453cdb18761SDaniel Lezcano } 3454cdb18761SDaniel Lezcano 3455d189634eSThomas Graf static int __net_init ip6_route_net_init_late(struct net *net) 3456d189634eSThomas Graf { 3457d189634eSThomas Graf #ifdef CONFIG_PROC_FS 3458d4beaa66SGao feng proc_create("ipv6_route", 0, net->proc_net, &ipv6_route_proc_fops); 3459d4beaa66SGao feng proc_create("rt6_stats", S_IRUGO, net->proc_net, &rt6_stats_seq_fops); 3460d189634eSThomas Graf #endif 3461d189634eSThomas Graf return 0; 3462d189634eSThomas Graf } 3463d189634eSThomas Graf 3464d189634eSThomas Graf static void __net_exit ip6_route_net_exit_late(struct net *net) 3465d189634eSThomas Graf { 3466d189634eSThomas Graf #ifdef CONFIG_PROC_FS 3467ece31ffdSGao feng remove_proc_entry("ipv6_route", net->proc_net); 3468ece31ffdSGao feng remove_proc_entry("rt6_stats", net->proc_net); 3469d189634eSThomas Graf #endif 3470d189634eSThomas Graf } 3471d189634eSThomas Graf 3472cdb18761SDaniel Lezcano static struct pernet_operations ip6_route_net_ops = { 3473cdb18761SDaniel Lezcano .init = ip6_route_net_init, 3474cdb18761SDaniel Lezcano .exit = ip6_route_net_exit, 3475cdb18761SDaniel Lezcano }; 3476cdb18761SDaniel Lezcano 3477c3426b47SDavid S. Miller static int __net_init ipv6_inetpeer_init(struct net *net) 3478c3426b47SDavid S. Miller { 3479c3426b47SDavid S. Miller struct inet_peer_base *bp = kmalloc(sizeof(*bp), GFP_KERNEL); 3480c3426b47SDavid S. Miller 3481c3426b47SDavid S. Miller if (!bp) 3482c3426b47SDavid S. Miller return -ENOMEM; 3483c3426b47SDavid S. Miller inet_peer_base_init(bp); 3484c3426b47SDavid S. Miller net->ipv6.peers = bp; 3485c3426b47SDavid S. Miller return 0; 3486c3426b47SDavid S. Miller } 3487c3426b47SDavid S. Miller 3488c3426b47SDavid S. Miller static void __net_exit ipv6_inetpeer_exit(struct net *net) 3489c3426b47SDavid S. Miller { 3490c3426b47SDavid S. Miller struct inet_peer_base *bp = net->ipv6.peers; 3491c3426b47SDavid S. Miller 3492c3426b47SDavid S. Miller net->ipv6.peers = NULL; 349356a6b248SDavid S. Miller inetpeer_invalidate_tree(bp); 3494c3426b47SDavid S. Miller kfree(bp); 3495c3426b47SDavid S. Miller } 3496c3426b47SDavid S. Miller 34972b823f72SDavid S. Miller static struct pernet_operations ipv6_inetpeer_ops = { 3498c3426b47SDavid S. Miller .init = ipv6_inetpeer_init, 3499c3426b47SDavid S. Miller .exit = ipv6_inetpeer_exit, 3500c3426b47SDavid S. Miller }; 3501c3426b47SDavid S. Miller 3502d189634eSThomas Graf static struct pernet_operations ip6_route_net_late_ops = { 3503d189634eSThomas Graf .init = ip6_route_net_init_late, 3504d189634eSThomas Graf .exit = ip6_route_net_exit_late, 3505d189634eSThomas Graf }; 3506d189634eSThomas Graf 35078ed67789SDaniel Lezcano static struct notifier_block ip6_route_dev_notifier = { 35088ed67789SDaniel Lezcano .notifier_call = ip6_route_dev_notify, 35098ed67789SDaniel Lezcano .priority = 0, 35108ed67789SDaniel Lezcano }; 35118ed67789SDaniel Lezcano 3512433d49c3SDaniel Lezcano int __init ip6_route_init(void) 35131da177e4SLinus Torvalds { 3514433d49c3SDaniel Lezcano int ret; 35158d0b94afSMartin KaFai Lau int cpu; 3516433d49c3SDaniel Lezcano 35179a7ec3a9SDaniel Lezcano ret = -ENOMEM; 35189a7ec3a9SDaniel Lezcano ip6_dst_ops_template.kmem_cachep = 35199a7ec3a9SDaniel Lezcano kmem_cache_create("ip6_dst_cache", sizeof(struct rt6_info), 0, 35209a7ec3a9SDaniel Lezcano SLAB_HWCACHE_ALIGN, NULL); 35219a7ec3a9SDaniel Lezcano if (!ip6_dst_ops_template.kmem_cachep) 3522c19a28e1SFernando Carrijo goto out; 352314e50e57SDavid S. Miller 3524fc66f95cSEric Dumazet ret = dst_entries_init(&ip6_dst_blackhole_ops); 35258ed67789SDaniel Lezcano if (ret) 3526bdb3289fSDaniel Lezcano goto out_kmem_cache; 3527bdb3289fSDaniel Lezcano 3528c3426b47SDavid S. Miller ret = register_pernet_subsys(&ipv6_inetpeer_ops); 3529c3426b47SDavid S. Miller if (ret) 3530e8803b6cSDavid S. Miller goto out_dst_entries; 35312a0c451aSThomas Graf 35327e52b33bSDavid S. Miller ret = register_pernet_subsys(&ip6_route_net_ops); 35337e52b33bSDavid S. Miller if (ret) 35347e52b33bSDavid S. Miller goto out_register_inetpeer; 3535c3426b47SDavid S. Miller 35365dc121e9SArnaud Ebalard ip6_dst_blackhole_ops.kmem_cachep = ip6_dst_ops_template.kmem_cachep; 35375dc121e9SArnaud Ebalard 35388ed67789SDaniel Lezcano /* Registering of the loopback is done before this portion of code, 35398ed67789SDaniel Lezcano * the loopback reference in rt6_info will not be taken, do it 35408ed67789SDaniel Lezcano * manually for init_net */ 3541d8d1f30bSChangli Gao init_net.ipv6.ip6_null_entry->dst.dev = init_net.loopback_dev; 35428ed67789SDaniel Lezcano init_net.ipv6.ip6_null_entry->rt6i_idev = in6_dev_get(init_net.loopback_dev); 3543bdb3289fSDaniel Lezcano #ifdef CONFIG_IPV6_MULTIPLE_TABLES 3544d8d1f30bSChangli Gao init_net.ipv6.ip6_prohibit_entry->dst.dev = init_net.loopback_dev; 35458ed67789SDaniel Lezcano init_net.ipv6.ip6_prohibit_entry->rt6i_idev = in6_dev_get(init_net.loopback_dev); 3546d8d1f30bSChangli Gao init_net.ipv6.ip6_blk_hole_entry->dst.dev = init_net.loopback_dev; 35478ed67789SDaniel Lezcano init_net.ipv6.ip6_blk_hole_entry->rt6i_idev = in6_dev_get(init_net.loopback_dev); 3548bdb3289fSDaniel Lezcano #endif 3549e8803b6cSDavid S. Miller ret = fib6_init(); 3550433d49c3SDaniel Lezcano if (ret) 35518ed67789SDaniel Lezcano goto out_register_subsys; 3552433d49c3SDaniel Lezcano 3553433d49c3SDaniel Lezcano ret = xfrm6_init(); 3554433d49c3SDaniel Lezcano if (ret) 3555e8803b6cSDavid S. Miller goto out_fib6_init; 3556c35b7e72SDaniel Lezcano 3557433d49c3SDaniel Lezcano ret = fib6_rules_init(); 3558433d49c3SDaniel Lezcano if (ret) 3559433d49c3SDaniel Lezcano goto xfrm6_init; 35607e5449c2SDaniel Lezcano 3561d189634eSThomas Graf ret = register_pernet_subsys(&ip6_route_net_late_ops); 3562d189634eSThomas Graf if (ret) 3563d189634eSThomas Graf goto fib6_rules_init; 3564d189634eSThomas Graf 3565433d49c3SDaniel Lezcano ret = -ENOBUFS; 3566c7ac8679SGreg Rose if (__rtnl_register(PF_INET6, RTM_NEWROUTE, inet6_rtm_newroute, NULL, NULL) || 3567c7ac8679SGreg Rose __rtnl_register(PF_INET6, RTM_DELROUTE, inet6_rtm_delroute, NULL, NULL) || 3568c7ac8679SGreg Rose __rtnl_register(PF_INET6, RTM_GETROUTE, inet6_rtm_getroute, NULL, NULL)) 3569d189634eSThomas Graf goto out_register_late_subsys; 3570433d49c3SDaniel Lezcano 35718ed67789SDaniel Lezcano ret = register_netdevice_notifier(&ip6_route_dev_notifier); 3572cdb18761SDaniel Lezcano if (ret) 3573d189634eSThomas Graf goto out_register_late_subsys; 35748ed67789SDaniel Lezcano 35758d0b94afSMartin KaFai Lau for_each_possible_cpu(cpu) { 35768d0b94afSMartin KaFai Lau struct uncached_list *ul = per_cpu_ptr(&rt6_uncached_list, cpu); 35778d0b94afSMartin KaFai Lau 35788d0b94afSMartin KaFai Lau INIT_LIST_HEAD(&ul->head); 35798d0b94afSMartin KaFai Lau spin_lock_init(&ul->lock); 35808d0b94afSMartin KaFai Lau } 35818d0b94afSMartin KaFai Lau 3582433d49c3SDaniel Lezcano out: 3583433d49c3SDaniel Lezcano return ret; 3584433d49c3SDaniel Lezcano 3585d189634eSThomas Graf out_register_late_subsys: 3586d189634eSThomas Graf unregister_pernet_subsys(&ip6_route_net_late_ops); 3587433d49c3SDaniel Lezcano fib6_rules_init: 3588433d49c3SDaniel Lezcano fib6_rules_cleanup(); 3589433d49c3SDaniel Lezcano xfrm6_init: 3590433d49c3SDaniel Lezcano xfrm6_fini(); 35912a0c451aSThomas Graf out_fib6_init: 35922a0c451aSThomas Graf fib6_gc_cleanup(); 35938ed67789SDaniel Lezcano out_register_subsys: 35948ed67789SDaniel Lezcano unregister_pernet_subsys(&ip6_route_net_ops); 35957e52b33bSDavid S. Miller out_register_inetpeer: 35967e52b33bSDavid S. Miller unregister_pernet_subsys(&ipv6_inetpeer_ops); 3597fc66f95cSEric Dumazet out_dst_entries: 3598fc66f95cSEric Dumazet dst_entries_destroy(&ip6_dst_blackhole_ops); 3599433d49c3SDaniel Lezcano out_kmem_cache: 3600f2fc6a54SBenjamin Thery kmem_cache_destroy(ip6_dst_ops_template.kmem_cachep); 3601433d49c3SDaniel Lezcano goto out; 36021da177e4SLinus Torvalds } 36031da177e4SLinus Torvalds 36041da177e4SLinus Torvalds void ip6_route_cleanup(void) 36051da177e4SLinus Torvalds { 36068ed67789SDaniel Lezcano unregister_netdevice_notifier(&ip6_route_dev_notifier); 3607d189634eSThomas Graf unregister_pernet_subsys(&ip6_route_net_late_ops); 3608101367c2SThomas Graf fib6_rules_cleanup(); 36091da177e4SLinus Torvalds xfrm6_fini(); 36101da177e4SLinus Torvalds fib6_gc_cleanup(); 3611c3426b47SDavid S. Miller unregister_pernet_subsys(&ipv6_inetpeer_ops); 36128ed67789SDaniel Lezcano unregister_pernet_subsys(&ip6_route_net_ops); 361341bb78b4SXiaotian Feng dst_entries_destroy(&ip6_dst_blackhole_ops); 3614f2fc6a54SBenjamin Thery kmem_cache_destroy(ip6_dst_ops_template.kmem_cachep); 36151da177e4SLinus Torvalds } 3616