// SPDX-License-Identifier: GPL-2.0-or-later
/*
 *	Linux INET6 implementation
 *	Forwarding Information Database
 *
 *	Authors:
 *	Pedro Roque		<roque@di.fc.ul.pt>
 *
 *	Changes:
 *	Yuji SEKIYA @USAGI:	Support default route on router node;
 *				remove ip6_null_entry from the top of
 *				routing table.
 *	Ville Nuorvala:		Fixed routing subtrees.
 */
15f3213831SJoe Perches
/* Prefix prepended to the format string of this file's pr_*() messages. */
#define pr_fmt(fmt) "IPv6: " fmt
17f3213831SJoe Perches
18b6459415SJakub Kicinski #include <linux/bpf.h>
191da177e4SLinus Torvalds #include <linux/errno.h>
201da177e4SLinus Torvalds #include <linux/types.h>
211da177e4SLinus Torvalds #include <linux/net.h>
221da177e4SLinus Torvalds #include <linux/route.h>
231da177e4SLinus Torvalds #include <linux/netdevice.h>
241da177e4SLinus Torvalds #include <linux/in6.h>
251da177e4SLinus Torvalds #include <linux/init.h>
26c71099acSThomas Graf #include <linux/list.h>
275a0e3ad6STejun Heo #include <linux/slab.h>
281da177e4SLinus Torvalds
29cc5f0eb2SDavid Ahern #include <net/ip.h>
301da177e4SLinus Torvalds #include <net/ipv6.h>
311da177e4SLinus Torvalds #include <net/ndisc.h>
321da177e4SLinus Torvalds #include <net/addrconf.h>
3319e42e45SRoopa Prabhu #include <net/lwtunnel.h>
34df77fe4dSIdo Schimmel #include <net/fib_notifier.h>
351da177e4SLinus Torvalds
36ed13923fSIdo Schimmel #include <net/ip_fib.h>
371da177e4SLinus Torvalds #include <net/ip6_fib.h>
381da177e4SLinus Torvalds #include <net/ip6_route.h>
391da177e4SLinus Torvalds
40e18b890bSChristoph Lameter static struct kmem_cache *fib6_node_kmem __read_mostly;
411da177e4SLinus Torvalds
4294b2cfe0SHannes Frederic Sowa struct fib6_cleaner {
4394b2cfe0SHannes Frederic Sowa struct fib6_walker w;
44ec7d43c2SBenjamin Thery struct net *net;
458d1c802bSDavid Ahern int (*func)(struct fib6_info *, void *arg);
46327571cbSHannes Frederic Sowa int sernum;
471da177e4SLinus Torvalds void *arg;
487c6bb7d2SDavid Ahern bool skip_notify;
491da177e4SLinus Torvalds };
501da177e4SLinus Torvalds
/*
 * Walker state used when a tree walk is (re)started: FWS_S when subtree
 * support is compiled in, FWS_L otherwise.
 */
#ifndef CONFIG_IPV6_SUBTREES
#define FWS_INIT FWS_L
#else
#define FWS_INIT FWS_S
#endif
561da177e4SLinus Torvalds
/* Forward declarations for helpers defined later in this file. */
static struct fib6_info *fib6_find_prefix(struct net *net,
					  struct fib6_table *table,
					  struct fib6_node *fn);
static struct fib6_node *fib6_repair_tree(struct net *net,
					  struct fib6_table *table,
					  struct fib6_node *fn);
static int fib6_walk(struct net *net, struct fib6_walker *w);
static int fib6_walk_continue(struct fib6_walker *w);
651da177e4SLinus Torvalds
/*
 *	A routing update causes an increase of the serial number on the
 *	affected subtree. This allows for cached routes to be asynchronously
 *	tested when modifications are made to the destination cache as a
 *	result of redirects, path MTU changes, etc.
 */
721da177e4SLinus Torvalds
static void fib6_gc_timer_cb(struct timer_list *t);

/* Iterate @w over every walker linked on @net's fib6_walkers list. */
#define FOR_WALKERS(net, w) \
	list_for_each_entry(w, &(net)->ipv6.fib6_walkers, lh)
771da177e4SLinus Torvalds
fib6_walker_link(struct net * net,struct fib6_walker * w)789a03cd8fSMichal Kubeček static void fib6_walker_link(struct net *net, struct fib6_walker *w)
7990d41122SAdrian Bunk {
809a03cd8fSMichal Kubeček write_lock_bh(&net->ipv6.fib6_walker_lock);
819a03cd8fSMichal Kubeček list_add(&w->lh, &net->ipv6.fib6_walkers);
829a03cd8fSMichal Kubeček write_unlock_bh(&net->ipv6.fib6_walker_lock);
8390d41122SAdrian Bunk }
8490d41122SAdrian Bunk
fib6_walker_unlink(struct net * net,struct fib6_walker * w)859a03cd8fSMichal Kubeček static void fib6_walker_unlink(struct net *net, struct fib6_walker *w)
8690d41122SAdrian Bunk {
879a03cd8fSMichal Kubeček write_lock_bh(&net->ipv6.fib6_walker_lock);
88bbef49daSAlexey Dobriyan list_del(&w->lh);
899a03cd8fSMichal Kubeček write_unlock_bh(&net->ipv6.fib6_walker_lock);
9090d41122SAdrian Bunk }
9194b2cfe0SHannes Frederic Sowa
fib6_new_sernum(struct net * net)92812918c4SHannes Frederic Sowa static int fib6_new_sernum(struct net *net)
931da177e4SLinus Torvalds {
9430189806SEric Dumazet int new, old = atomic_read(&net->ipv6.fib6_sernum);
9542b18706SHannes Frederic Sowa
9642b18706SHannes Frederic Sowa do {
9742b18706SHannes Frederic Sowa new = old < INT_MAX ? old + 1 : 1;
9830189806SEric Dumazet } while (!atomic_try_cmpxchg(&net->ipv6.fib6_sernum, &old, new));
9930189806SEric Dumazet
10042b18706SHannes Frederic Sowa return new;
1011da177e4SLinus Torvalds }
1021da177e4SLinus Torvalds
/*
 * Serial-number sentinel. fib6_new_sernum() wraps to 1 rather than 0,
 * presumably so that this value is never handed out as a real serial
 * number -- TODO confirm against the users further down the file.
 */
enum {
	FIB6_NO_SERNUM_CHANGE = 0,
};
106327571cbSHannes Frederic Sowa
fib6_update_sernum(struct net * net,struct fib6_info * f6i)10793c2fb25SDavid Ahern void fib6_update_sernum(struct net *net, struct fib6_info *f6i)
108180ca444SWei Wang {
109180ca444SWei Wang struct fib6_node *fn;
110180ca444SWei Wang
11193c2fb25SDavid Ahern fn = rcu_dereference_protected(f6i->fib6_node,
11293c2fb25SDavid Ahern lockdep_is_held(&f6i->fib6_table->tb6_lock));
113180ca444SWei Wang if (fn)
114aafc2e32SEric Dumazet WRITE_ONCE(fn->fn_sernum, fib6_new_sernum(net));
115180ca444SWei Wang }
116180ca444SWei Wang
/*
 *	Auxiliary address test functions for the radix tree.
 *
 *	These assume a 32bit processor (although it will work on
 *	64bit processors)
 */

/*
 *	test bit
 */
/*
 * XOR mask applied to a bit index inside a 32-bit word by addr_bit_set():
 * (0x1F & ~7) on little-endian builds, 0 otherwise.
 */
#ifdef __LITTLE_ENDIAN
# define BITOP_BE32_SWIZZLE	(0x1F & ~7)
#else
# define BITOP_BE32_SWIZZLE	0
#endif
1321da177e4SLinus Torvalds
addr_bit_set(const void * token,int fn_bit)13394b2cfe0SHannes Frederic Sowa static __be32 addr_bit_set(const void *token, int fn_bit)
1341da177e4SLinus Torvalds {
135b71d1d42SEric Dumazet const __be32 *addr = token;
13602cdce53SYOSHIFUJI Hideaki / 吉藤英明 /*
13702cdce53SYOSHIFUJI Hideaki / 吉藤英明 * Here,
13802cdce53SYOSHIFUJI Hideaki / 吉藤英明 * 1 << ((~fn_bit ^ BITOP_BE32_SWIZZLE) & 0x1f)
13902cdce53SYOSHIFUJI Hideaki / 吉藤英明 * is optimized version of
14002cdce53SYOSHIFUJI Hideaki / 吉藤英明 * htonl(1 << ((~fn_bit)&0x1F))
14102cdce53SYOSHIFUJI Hideaki / 吉藤英明 * See include/asm-generic/bitops/le.h.
14202cdce53SYOSHIFUJI Hideaki / 吉藤英明 */
1430eae88f3SEric Dumazet return (__force __be32)(1 << ((~fn_bit ^ BITOP_BE32_SWIZZLE) & 0x1f)) &
1440eae88f3SEric Dumazet addr[fn_bit >> 5];
1451da177e4SLinus Torvalds }
1461da177e4SLinus Torvalds
/*
 * Allocate a zeroed fib6_info.
 *
 * @gfp_flags:    allocation flags passed to kzalloc()
 * @with_fib6_nh: when true, extra room for one struct fib6_nh is allocated
 *                along with the fib6_info
 *
 * Returns the new entry with its sibling list initialised and a reference
 * count of 1, or NULL if the allocation fails.
 */
struct fib6_info *fib6_info_alloc(gfp_t gfp_flags, bool with_fib6_nh)
{
	struct fib6_info *f6i;
	size_t alloc_len;

	alloc_len = sizeof(*f6i) + (with_fib6_nh ? sizeof(struct fib6_nh) : 0);

	f6i = kzalloc(alloc_len, gfp_flags);
	if (f6i) {
		/* fib6_siblings is a union with nh_list, so this initializes both */
		INIT_LIST_HEAD(&f6i->fib6_siblings);
		refcount_set(&f6i->fib6_ref, 1);
	}

	return f6i;
}
165a64efe14SDavid Ahern
fib6_info_destroy_rcu(struct rcu_head * head)1669b0a8da8SEric Dumazet void fib6_info_destroy_rcu(struct rcu_head *head)
167a64efe14SDavid Ahern {
1689b0a8da8SEric Dumazet struct fib6_info *f6i = container_of(head, struct fib6_info, rcu);
169a64efe14SDavid Ahern
17093c2fb25SDavid Ahern WARN_ON(f6i->fib6_node);
171a64efe14SDavid Ahern
172f88d8ea6SDavid Ahern if (f6i->nh)
173f88d8ea6SDavid Ahern nexthop_put(f6i->nh);
174f88d8ea6SDavid Ahern else
1751cf844c7SDavid Ahern fib6_nh_release(f6i->fib6_nh);
176f88d8ea6SDavid Ahern
177cc5f0eb2SDavid Ahern ip_fib_metrics_put(f6i->fib6_metrics);
178a64efe14SDavid Ahern kfree(f6i);
179a64efe14SDavid Ahern }
1809b0a8da8SEric Dumazet EXPORT_SYMBOL_GPL(fib6_info_destroy_rcu);
181a64efe14SDavid Ahern
node_alloc(struct net * net)18281eb8447SWei Wang static struct fib6_node *node_alloc(struct net *net)
1831da177e4SLinus Torvalds {
1841da177e4SLinus Torvalds struct fib6_node *fn;
1851da177e4SLinus Torvalds
186c3762229SRobert P. J. Day fn = kmem_cache_zalloc(fib6_node_kmem, GFP_ATOMIC);
18781eb8447SWei Wang if (fn)
18881eb8447SWei Wang net->ipv6.rt6_stats->fib_nodes++;
1891da177e4SLinus Torvalds
1901da177e4SLinus Torvalds return fn;
1911da177e4SLinus Torvalds }
1921da177e4SLinus Torvalds
node_free_immediate(struct net * net,struct fib6_node * fn)19381eb8447SWei Wang static void node_free_immediate(struct net *net, struct fib6_node *fn)
1941da177e4SLinus Torvalds {
1951da177e4SLinus Torvalds kmem_cache_free(fib6_node_kmem, fn);
19681eb8447SWei Wang net->ipv6.rt6_stats->fib_nodes--;
1971da177e4SLinus Torvalds }
1981da177e4SLinus Torvalds
node_free_rcu(struct rcu_head * head)199c5cff856SWei Wang static void node_free_rcu(struct rcu_head *head)
200c5cff856SWei Wang {
201c5cff856SWei Wang struct fib6_node *fn = container_of(head, struct fib6_node, rcu);
202c5cff856SWei Wang
203c5cff856SWei Wang kmem_cache_free(fib6_node_kmem, fn);
204c5cff856SWei Wang }
205c5cff856SWei Wang
node_free(struct net * net,struct fib6_node * fn)20681eb8447SWei Wang static void node_free(struct net *net, struct fib6_node *fn)
207c5cff856SWei Wang {
208c5cff856SWei Wang call_rcu(&fn->rcu, node_free_rcu);
20981eb8447SWei Wang net->ipv6.rt6_stats->fib_nodes--;
210c5cff856SWei Wang }
211c5cff856SWei Wang
fib6_free_table(struct fib6_table * table)212ba1cc08dSSabrina Dubroca static void fib6_free_table(struct fib6_table *table)
213ba1cc08dSSabrina Dubroca {
214ba1cc08dSSabrina Dubroca inetpeer_invalidate_tree(&table->tb6_peers);
215ba1cc08dSSabrina Dubroca kfree(table);
216ba1cc08dSSabrina Dubroca }
217ba1cc08dSSabrina Dubroca
fib6_link_table(struct net * net,struct fib6_table * tb)21858f09b78SDaniel Lezcano static void fib6_link_table(struct net *net, struct fib6_table *tb)
2191b43af54SPatrick McHardy {
2201b43af54SPatrick McHardy unsigned int h;
2211b43af54SPatrick McHardy
222375216adSThomas Graf /*
223375216adSThomas Graf * Initialize table lock at a single place to give lockdep a key,
224375216adSThomas Graf * tables aren't visible prior to being linked to the list.
225375216adSThomas Graf */
22666f5d6ceSWei Wang spin_lock_init(&tb->tb6_lock);
227a33bc5c1SNeil Horman h = tb->tb6_id & (FIB6_TABLE_HASHSZ - 1);
2281b43af54SPatrick McHardy
2291b43af54SPatrick McHardy /*
2301b43af54SPatrick McHardy * No protection necessary, this is the only list mutatation
2311b43af54SPatrick McHardy * operation, tables never disappear once they exist.
2321b43af54SPatrick McHardy */
23358f09b78SDaniel Lezcano hlist_add_head_rcu(&tb->tb6_hlist, &net->ipv6.fib_table_hash[h]);
2341b43af54SPatrick McHardy }
2351b43af54SPatrick McHardy
2361b43af54SPatrick McHardy #ifdef CONFIG_IPV6_MULTIPLE_TABLES
237e0b85590SDaniel Lezcano
/*
 * Allocate (GFP_ATOMIC) and initialise a routing table with id @id.
 *
 * The root node's leaf is pointed at @net's fib6_null_entry, the root
 * flags are set, and the table's inet peer base is initialised.
 * Returns NULL if the allocation fails. The table is not linked here.
 */
static struct fib6_table *fib6_alloc_table(struct net *net, u32 id)
{
	struct fib6_table *table = kzalloc(sizeof(*table), GFP_ATOMIC);

	if (!table)
		return NULL;

	table->tb6_id = id;
	rcu_assign_pointer(table->tb6_root.leaf,
			   net->ipv6.fib6_null_entry);
	table->tb6_root.fn_flags = RTN_ROOT | RTN_TL_ROOT | RTN_RTINFO;
	inet_peer_base_init(&table->tb6_peers);

	return table;
}
253c71099acSThomas Graf
/*
 * Return the table with id @id, creating and linking it if it does not
 * exist yet. An @id of 0 selects RT6_TABLE_MAIN.
 * Returns NULL only when a new table could not be allocated.
 */
struct fib6_table *fib6_new_table(struct net *net, u32 id)
{
	struct fib6_table *tb;

	if (!id)
		id = RT6_TABLE_MAIN;

	tb = fib6_get_table(net, id);
	if (!tb) {
		tb = fib6_alloc_table(net, id);
		if (tb)
			fib6_link_table(net, tb);
	}

	return tb;
}
EXPORT_SYMBOL_GPL(fib6_new_table);
271c71099acSThomas Graf
/*
 * Look up the table with id @id in @net's table hash.
 * An @id of 0 selects RT6_TABLE_MAIN. The bucket is searched under
 * rcu_read_lock(). Returns the table, or NULL when there is no match.
 */
struct fib6_table *fib6_get_table(struct net *net, u32 id)
{
	struct fib6_table *found = NULL;
	struct fib6_table *tb;
	struct hlist_head *head;

	if (!id)
		id = RT6_TABLE_MAIN;

	head = &net->ipv6.fib_table_hash[id & (FIB6_TABLE_HASHSZ - 1)];

	rcu_read_lock();
	hlist_for_each_entry_rcu(tb, head, tb6_hlist) {
		if (tb->tb6_id == id) {
			found = tb;
			break;
		}
	}
	rcu_read_unlock();

	return found;
}
EXPORT_SYMBOL_GPL(fib6_get_table);
294c71099acSThomas Graf
fib6_tables_init(struct net * net)2952c8c1e72SAlexey Dobriyan static void __net_init fib6_tables_init(struct net *net)
296c71099acSThomas Graf {
29758f09b78SDaniel Lezcano fib6_link_table(net, net->ipv6.fib6_main_tbl);
29858f09b78SDaniel Lezcano fib6_link_table(net, net->ipv6.fib6_local_tbl);
299c71099acSThomas Graf }
300c71099acSThomas Graf #else
301c71099acSThomas Graf
/*
 * Single-table build: no table is ever created; this simply forwards to
 * fib6_get_table().
 */
struct fib6_table *fib6_new_table(struct net *net, u32 id)
{
	return fib6_get_table(net, id);
}
306c71099acSThomas Graf
/* Single-table build: @id is ignored and @net's main table is returned. */
struct fib6_table *fib6_get_table(struct net *net, u32 id)
{
	return net->ipv6.fib6_main_tbl;
}
311c71099acSThomas Graf
/*
 * Single-table build: run @lookup against @net's main table.
 *
 * If the lookup result carries -EAGAIN, it is released and replaced by
 * @net's ip6_null_entry. A reference is taken on that entry unless the
 * caller passed RT6_LOOKUP_F_DST_NOREF.
 * Returns the dst_entry embedded in the selected route.
 */
struct dst_entry *fib6_rule_lookup(struct net *net, struct flowi6 *fl6,
				   const struct sk_buff *skb,
				   int flags, pol_lookup_t lookup)
{
	struct rt6_info *rt;

	rt = pol_lookup_func(lookup,
			net, net->ipv6.fib6_main_tbl, fl6, skb, flags);
	if (rt->dst.error != -EAGAIN)
		return &rt->dst;

	ip6_rt_put_flags(rt, flags);
	rt = net->ipv6.ip6_null_entry;
	if (!(flags & RT6_LOOKUP_F_DST_NOREF))
		dst_hold(&rt->dst);

	return &rt->dst;
}
329c71099acSThomas Graf
330138118ecSDavid Ahern /* called with rcu lock held; no reference taken on fib6_info */
fib6_lookup(struct net * net,int oif,struct flowi6 * fl6,struct fib6_result * res,int flags)331effda4ddSDavid Ahern int fib6_lookup(struct net *net, int oif, struct flowi6 *fl6,
332effda4ddSDavid Ahern struct fib6_result *res, int flags)
333138118ecSDavid Ahern {
334effda4ddSDavid Ahern return fib6_table_lookup(net, net->ipv6.fib6_main_tbl, oif, fl6,
335effda4ddSDavid Ahern res, flags);
336138118ecSDavid Ahern }
337138118ecSDavid Ahern
fib6_tables_init(struct net * net)3382c8c1e72SAlexey Dobriyan static void __net_init fib6_tables_init(struct net *net)
339c71099acSThomas Graf {
34058f09b78SDaniel Lezcano fib6_link_table(net, net->ipv6.fib6_main_tbl);
341c71099acSThomas Graf }
342c71099acSThomas Graf
343c71099acSThomas Graf #endif
344c71099acSThomas Graf
fib6_tables_seq_read(struct net * net)345e1ee0a5bSIdo Schimmel unsigned int fib6_tables_seq_read(struct net *net)
346e1ee0a5bSIdo Schimmel {
347e1ee0a5bSIdo Schimmel unsigned int h, fib_seq = 0;
348e1ee0a5bSIdo Schimmel
349e1ee0a5bSIdo Schimmel rcu_read_lock();
350e1ee0a5bSIdo Schimmel for (h = 0; h < FIB6_TABLE_HASHSZ; h++) {
351e1ee0a5bSIdo Schimmel struct hlist_head *head = &net->ipv6.fib_table_hash[h];
352e1ee0a5bSIdo Schimmel struct fib6_table *tb;
353e1ee0a5bSIdo Schimmel
35466f5d6ceSWei Wang hlist_for_each_entry_rcu(tb, head, tb6_hlist)
355e1ee0a5bSIdo Schimmel fib_seq += tb->fib_seq;
356e1ee0a5bSIdo Schimmel }
357e1ee0a5bSIdo Schimmel rcu_read_unlock();
358e1ee0a5bSIdo Schimmel
359e1ee0a5bSIdo Schimmel return fib_seq;
360e1ee0a5bSIdo Schimmel }
361e1ee0a5bSIdo Schimmel
call_fib6_entry_notifier(struct notifier_block * nb,enum fib_event_type event_type,struct fib6_info * rt,struct netlink_ext_ack * extack)3627c550dafSJiri Pirko static int call_fib6_entry_notifier(struct notifier_block *nb,
363e1ee0a5bSIdo Schimmel enum fib_event_type event_type,
364b7a59557SJiri Pirko struct fib6_info *rt,
365b7a59557SJiri Pirko struct netlink_ext_ack *extack)
366e1ee0a5bSIdo Schimmel {
367e1ee0a5bSIdo Schimmel struct fib6_entry_notifier_info info = {
368b7a59557SJiri Pirko .info.extack = extack,
369e1ee0a5bSIdo Schimmel .rt = rt,
370e1ee0a5bSIdo Schimmel };
371e1ee0a5bSIdo Schimmel
3727c550dafSJiri Pirko return call_fib6_notifier(nb, event_type, &info.info);
373e1ee0a5bSIdo Schimmel }
374e1ee0a5bSIdo Schimmel
call_fib6_multipath_entry_notifier(struct notifier_block * nb,enum fib_event_type event_type,struct fib6_info * rt,unsigned int nsiblings,struct netlink_ext_ack * extack)3759c6ecd3cSIdo Schimmel static int call_fib6_multipath_entry_notifier(struct notifier_block *nb,
3769c6ecd3cSIdo Schimmel enum fib_event_type event_type,
3779c6ecd3cSIdo Schimmel struct fib6_info *rt,
3789c6ecd3cSIdo Schimmel unsigned int nsiblings,
3799c6ecd3cSIdo Schimmel struct netlink_ext_ack *extack)
3809c6ecd3cSIdo Schimmel {
3819c6ecd3cSIdo Schimmel struct fib6_entry_notifier_info info = {
3829c6ecd3cSIdo Schimmel .info.extack = extack,
3839c6ecd3cSIdo Schimmel .rt = rt,
3849c6ecd3cSIdo Schimmel .nsiblings = nsiblings,
3859c6ecd3cSIdo Schimmel };
3869c6ecd3cSIdo Schimmel
3879c6ecd3cSIdo Schimmel return call_fib6_notifier(nb, event_type, &info.info);
3889c6ecd3cSIdo Schimmel }
3899c6ecd3cSIdo Schimmel
call_fib6_entry_notifiers(struct net * net,enum fib_event_type event_type,struct fib6_info * rt,struct netlink_ext_ack * extack)39019a3b7eeSDavid Ahern int call_fib6_entry_notifiers(struct net *net,
391df77fe4dSIdo Schimmel enum fib_event_type event_type,
3928d1c802bSDavid Ahern struct fib6_info *rt,
3936c31e5a9SDavid Ahern struct netlink_ext_ack *extack)
394df77fe4dSIdo Schimmel {
395df77fe4dSIdo Schimmel struct fib6_entry_notifier_info info = {
3966c31e5a9SDavid Ahern .info.extack = extack,
397df77fe4dSIdo Schimmel .rt = rt,
398df77fe4dSIdo Schimmel };
399df77fe4dSIdo Schimmel
40093c2fb25SDavid Ahern rt->fib6_table->fib_seq++;
401df77fe4dSIdo Schimmel return call_fib6_notifiers(net, event_type, &info.info);
402df77fe4dSIdo Schimmel }
403df77fe4dSIdo Schimmel
call_fib6_multipath_entry_notifiers(struct net * net,enum fib_event_type event_type,struct fib6_info * rt,unsigned int nsiblings,struct netlink_ext_ack * extack)404d4b96c7bSIdo Schimmel int call_fib6_multipath_entry_notifiers(struct net *net,
405d4b96c7bSIdo Schimmel enum fib_event_type event_type,
406d4b96c7bSIdo Schimmel struct fib6_info *rt,
407d4b96c7bSIdo Schimmel unsigned int nsiblings,
408d4b96c7bSIdo Schimmel struct netlink_ext_ack *extack)
409d4b96c7bSIdo Schimmel {
410d4b96c7bSIdo Schimmel struct fib6_entry_notifier_info info = {
411d4b96c7bSIdo Schimmel .info.extack = extack,
412d4b96c7bSIdo Schimmel .rt = rt,
413d4b96c7bSIdo Schimmel .nsiblings = nsiblings,
414d4b96c7bSIdo Schimmel };
415d4b96c7bSIdo Schimmel
416d4b96c7bSIdo Schimmel rt->fib6_table->fib_seq++;
417d4b96c7bSIdo Schimmel return call_fib6_notifiers(net, event_type, &info.info);
418d4b96c7bSIdo Schimmel }
419d4b96c7bSIdo Schimmel
call_fib6_entry_notifiers_replace(struct net * net,struct fib6_info * rt)420d2f0c9b1SIdo Schimmel int call_fib6_entry_notifiers_replace(struct net *net, struct fib6_info *rt)
421d2f0c9b1SIdo Schimmel {
422d2f0c9b1SIdo Schimmel struct fib6_entry_notifier_info info = {
423d2f0c9b1SIdo Schimmel .rt = rt,
424d2f0c9b1SIdo Schimmel .nsiblings = rt->fib6_nsiblings,
425d2f0c9b1SIdo Schimmel };
426d2f0c9b1SIdo Schimmel
427d2f0c9b1SIdo Schimmel rt->fib6_table->fib_seq++;
428caafb250SIdo Schimmel return call_fib6_notifiers(net, FIB_EVENT_ENTRY_REPLACE, &info.info);
429d2f0c9b1SIdo Schimmel }
430d2f0c9b1SIdo Schimmel
/* Context handed to the walker callback while replaying routes to a notifier. */
struct fib6_dump_arg {
	struct net *net;		/* namespace whose tables are dumped */
	struct notifier_block *nb;	/* notifier block receiving the events */
	struct netlink_ext_ack *extack;	/* passed through to the notifier */
};
436e1ee0a5bSIdo Schimmel
fib6_rt_dump(struct fib6_info * rt,struct fib6_dump_arg * arg)43755c894f7SJiri Pirko static int fib6_rt_dump(struct fib6_info *rt, struct fib6_dump_arg *arg)
438e1ee0a5bSIdo Schimmel {
439caafb250SIdo Schimmel enum fib_event_type fib_event = FIB_EVENT_ENTRY_REPLACE;
4409c6ecd3cSIdo Schimmel int err;
4419c6ecd3cSIdo Schimmel
4429c6ecd3cSIdo Schimmel if (!rt || rt == arg->net->ipv6.fib6_null_entry)
4439c6ecd3cSIdo Schimmel return 0;
4449c6ecd3cSIdo Schimmel
4459c6ecd3cSIdo Schimmel if (rt->fib6_nsiblings)
4469c6ecd3cSIdo Schimmel err = call_fib6_multipath_entry_notifier(arg->nb, fib_event,
4479c6ecd3cSIdo Schimmel rt,
4489c6ecd3cSIdo Schimmel rt->fib6_nsiblings,
4499c6ecd3cSIdo Schimmel arg->extack);
4509c6ecd3cSIdo Schimmel else
4519c6ecd3cSIdo Schimmel err = call_fib6_entry_notifier(arg->nb, fib_event, rt,
4529c6ecd3cSIdo Schimmel arg->extack);
4539c6ecd3cSIdo Schimmel
4549c6ecd3cSIdo Schimmel return err;
4559c6ecd3cSIdo Schimmel }
4569c6ecd3cSIdo Schimmel
fib6_node_dump(struct fib6_walker * w)457e1ee0a5bSIdo Schimmel static int fib6_node_dump(struct fib6_walker *w)
458e1ee0a5bSIdo Schimmel {
459caafb250SIdo Schimmel int err;
460e1ee0a5bSIdo Schimmel
461caafb250SIdo Schimmel err = fib6_rt_dump(w->leaf, w->args);
462e1ee0a5bSIdo Schimmel w->leaf = NULL;
46355c894f7SJiri Pirko return err;
464e1ee0a5bSIdo Schimmel }
465e1ee0a5bSIdo Schimmel
fib6_table_dump(struct net * net,struct fib6_table * tb,struct fib6_walker * w)46655c894f7SJiri Pirko static int fib6_table_dump(struct net *net, struct fib6_table *tb,
467e1ee0a5bSIdo Schimmel struct fib6_walker *w)
468e1ee0a5bSIdo Schimmel {
46955c894f7SJiri Pirko int err;
47055c894f7SJiri Pirko
471e1ee0a5bSIdo Schimmel w->root = &tb->tb6_root;
47266f5d6ceSWei Wang spin_lock_bh(&tb->tb6_lock);
47355c894f7SJiri Pirko err = fib6_walk(net, w);
47466f5d6ceSWei Wang spin_unlock_bh(&tb->tb6_lock);
47555c894f7SJiri Pirko return err;
476e1ee0a5bSIdo Schimmel }
477e1ee0a5bSIdo Schimmel
478e1ee0a5bSIdo Schimmel /* Called with rcu_read_lock() */
fib6_tables_dump(struct net * net,struct notifier_block * nb,struct netlink_ext_ack * extack)479b7a59557SJiri Pirko int fib6_tables_dump(struct net *net, struct notifier_block *nb,
480b7a59557SJiri Pirko struct netlink_ext_ack *extack)
481e1ee0a5bSIdo Schimmel {
482e1ee0a5bSIdo Schimmel struct fib6_dump_arg arg;
483e1ee0a5bSIdo Schimmel struct fib6_walker *w;
484e1ee0a5bSIdo Schimmel unsigned int h;
48555c894f7SJiri Pirko int err = 0;
486e1ee0a5bSIdo Schimmel
487e1ee0a5bSIdo Schimmel w = kzalloc(sizeof(*w), GFP_ATOMIC);
488e1ee0a5bSIdo Schimmel if (!w)
489e1ee0a5bSIdo Schimmel return -ENOMEM;
490e1ee0a5bSIdo Schimmel
491e1ee0a5bSIdo Schimmel w->func = fib6_node_dump;
492e1ee0a5bSIdo Schimmel arg.net = net;
493e1ee0a5bSIdo Schimmel arg.nb = nb;
494b7a59557SJiri Pirko arg.extack = extack;
495e1ee0a5bSIdo Schimmel w->args = &arg;
496e1ee0a5bSIdo Schimmel
497e1ee0a5bSIdo Schimmel for (h = 0; h < FIB6_TABLE_HASHSZ; h++) {
498e1ee0a5bSIdo Schimmel struct hlist_head *head = &net->ipv6.fib_table_hash[h];
499e1ee0a5bSIdo Schimmel struct fib6_table *tb;
500e1ee0a5bSIdo Schimmel
50155c894f7SJiri Pirko hlist_for_each_entry_rcu(tb, head, tb6_hlist) {
50255c894f7SJiri Pirko err = fib6_table_dump(net, tb, w);
5036f199552SVlad Buslov if (err)
50455c894f7SJiri Pirko goto out;
50555c894f7SJiri Pirko }
506e1ee0a5bSIdo Schimmel }
507e1ee0a5bSIdo Schimmel
50855c894f7SJiri Pirko out:
509e1ee0a5bSIdo Schimmel kfree(w);
510e1ee0a5bSIdo Schimmel
5116f199552SVlad Buslov /* The tree traversal function should never return a positive value. */
5126f199552SVlad Buslov return err > 0 ? -EINVAL : err;
513e1ee0a5bSIdo Schimmel }
514e1ee0a5bSIdo Schimmel
fib6_dump_node(struct fib6_walker * w)51594b2cfe0SHannes Frederic Sowa static int fib6_dump_node(struct fib6_walker *w)
5161b43af54SPatrick McHardy {
5171b43af54SPatrick McHardy int res;
5188d1c802bSDavid Ahern struct fib6_info *rt;
5191b43af54SPatrick McHardy
52066f5d6ceSWei Wang for_each_fib6_walker_rt(w) {
5211e47b483SStefano Brivio res = rt6_dump_route(rt, w->args, w->skip_in_node);
522bf9a8a06SStefano Brivio if (res >= 0) {
5231b43af54SPatrick McHardy /* Frame is full, suspend walking */
5241b43af54SPatrick McHardy w->leaf = rt;
5251e47b483SStefano Brivio
5261e47b483SStefano Brivio /* We'll restart from this node, so if some routes were
5271e47b483SStefano Brivio * already dumped, skip them next time.
5281e47b483SStefano Brivio */
5291e47b483SStefano Brivio w->skip_in_node += res;
5301e47b483SStefano Brivio
5311b43af54SPatrick McHardy return 1;
5321b43af54SPatrick McHardy }
5331e47b483SStefano Brivio w->skip_in_node = 0;
534beb1afacSDavid Ahern
535beb1afacSDavid Ahern /* Multipath routes are dumped in one route with the
536beb1afacSDavid Ahern * RTA_MULTIPATH attribute. Jump 'rt' to point to the
537beb1afacSDavid Ahern * last sibling of this route (no need to dump the
538beb1afacSDavid Ahern * sibling routes again)
539beb1afacSDavid Ahern */
54093c2fb25SDavid Ahern if (rt->fib6_nsiblings)
54193c2fb25SDavid Ahern rt = list_last_entry(&rt->fib6_siblings,
5428d1c802bSDavid Ahern struct fib6_info,
54393c2fb25SDavid Ahern fib6_siblings);
5441b43af54SPatrick McHardy }
5451b43af54SPatrick McHardy w->leaf = NULL;
5461b43af54SPatrick McHardy return 0;
5471b43af54SPatrick McHardy }
5481b43af54SPatrick McHardy
fib6_dump_end(struct netlink_callback * cb)5491b43af54SPatrick McHardy static void fib6_dump_end(struct netlink_callback *cb)
5501b43af54SPatrick McHardy {
5519a03cd8fSMichal Kubeček struct net *net = sock_net(cb->skb->sk);
55294b2cfe0SHannes Frederic Sowa struct fib6_walker *w = (void *)cb->args[2];
5531b43af54SPatrick McHardy
5541b43af54SPatrick McHardy if (w) {
5557891cc81SHerbert Xu if (cb->args[4]) {
5567891cc81SHerbert Xu cb->args[4] = 0;
5579a03cd8fSMichal Kubeček fib6_walker_unlink(net, w);
5587891cc81SHerbert Xu }
5591b43af54SPatrick McHardy cb->args[2] = 0;
5601b43af54SPatrick McHardy kfree(w);
5611b43af54SPatrick McHardy }
5621b43af54SPatrick McHardy cb->done = (void *)cb->args[3];
5631b43af54SPatrick McHardy cb->args[1] = 3;
5641b43af54SPatrick McHardy }
5651b43af54SPatrick McHardy
fib6_dump_done(struct netlink_callback * cb)5661b43af54SPatrick McHardy static int fib6_dump_done(struct netlink_callback *cb)
5671b43af54SPatrick McHardy {
5681b43af54SPatrick McHardy fib6_dump_end(cb);
5691b43af54SPatrick McHardy return cb->done ? cb->done(cb) : 0;
5701b43af54SPatrick McHardy }
5711b43af54SPatrick McHardy
fib6_dump_table(struct fib6_table * table,struct sk_buff * skb,struct netlink_callback * cb)5721b43af54SPatrick McHardy static int fib6_dump_table(struct fib6_table *table, struct sk_buff *skb,
5731b43af54SPatrick McHardy struct netlink_callback *cb)
5741b43af54SPatrick McHardy {
5759a03cd8fSMichal Kubeček struct net *net = sock_net(skb->sk);
57694b2cfe0SHannes Frederic Sowa struct fib6_walker *w;
5771b43af54SPatrick McHardy int res;
5781b43af54SPatrick McHardy
5791b43af54SPatrick McHardy w = (void *)cb->args[2];
5801b43af54SPatrick McHardy w->root = &table->tb6_root;
5811b43af54SPatrick McHardy
5821b43af54SPatrick McHardy if (cb->args[4] == 0) {
5832bec5a36SPatrick McHardy w->count = 0;
5842bec5a36SPatrick McHardy w->skip = 0;
5851e47b483SStefano Brivio w->skip_in_node = 0;
5862bec5a36SPatrick McHardy
58766f5d6ceSWei Wang spin_lock_bh(&table->tb6_lock);
5889a03cd8fSMichal Kubeček res = fib6_walk(net, w);
58966f5d6ceSWei Wang spin_unlock_bh(&table->tb6_lock);
5902bec5a36SPatrick McHardy if (res > 0) {
5911b43af54SPatrick McHardy cb->args[4] = 1;
592aafc2e32SEric Dumazet cb->args[5] = READ_ONCE(w->root->fn_sernum);
5932bec5a36SPatrick McHardy }
5941b43af54SPatrick McHardy } else {
595aafc2e32SEric Dumazet int sernum = READ_ONCE(w->root->fn_sernum);
596aafc2e32SEric Dumazet if (cb->args[5] != sernum) {
5972bec5a36SPatrick McHardy /* Begin at the root if the tree changed */
598aafc2e32SEric Dumazet cb->args[5] = sernum;
5992bec5a36SPatrick McHardy w->state = FWS_INIT;
6002bec5a36SPatrick McHardy w->node = w->root;
6012bec5a36SPatrick McHardy w->skip = w->count;
6021e47b483SStefano Brivio w->skip_in_node = 0;
6032bec5a36SPatrick McHardy } else
6042bec5a36SPatrick McHardy w->skip = 0;
6052bec5a36SPatrick McHardy
60666f5d6ceSWei Wang spin_lock_bh(&table->tb6_lock);
6071b43af54SPatrick McHardy res = fib6_walk_continue(w);
60866f5d6ceSWei Wang spin_unlock_bh(&table->tb6_lock);
6097891cc81SHerbert Xu if (res <= 0) {
6109a03cd8fSMichal Kubeček fib6_walker_unlink(net, w);
6111b43af54SPatrick McHardy cb->args[4] = 0;
6121b43af54SPatrick McHardy }
6137891cc81SHerbert Xu }
6147891cc81SHerbert Xu
6151b43af54SPatrick McHardy return res;
6161b43af54SPatrick McHardy }
6171b43af54SPatrick McHardy
inet6_dump_fib(struct sk_buff * skb,struct netlink_callback * cb)618c127ea2cSThomas Graf static int inet6_dump_fib(struct sk_buff *skb, struct netlink_callback *cb)
6191b43af54SPatrick McHardy {
620564c91f7SStefano Brivio struct rt6_rtnl_dump_arg arg = { .filter.dump_exceptions = true,
621564c91f7SStefano Brivio .filter.dump_routes = true };
622e8ba330aSDavid Ahern const struct nlmsghdr *nlh = cb->nlh;
6233b1e0a65SYOSHIFUJI Hideaki struct net *net = sock_net(skb->sk);
6241b43af54SPatrick McHardy unsigned int h, s_h;
6251b43af54SPatrick McHardy unsigned int e = 0, s_e;
62694b2cfe0SHannes Frederic Sowa struct fib6_walker *w;
6271b43af54SPatrick McHardy struct fib6_table *tb;
62858f09b78SDaniel Lezcano struct hlist_head *head;
6291b43af54SPatrick McHardy int res = 0;
6301b43af54SPatrick McHardy
631e8ba330aSDavid Ahern if (cb->strict_check) {
6324724676dSDavid Ahern int err;
633e8ba330aSDavid Ahern
634effe6792SDavid Ahern err = ip_valid_fib_dump_req(net, nlh, &arg.filter, cb);
635e8ba330aSDavid Ahern if (err < 0)
636e8ba330aSDavid Ahern return err;
63713e38901SDavid Ahern } else if (nlmsg_len(nlh) >= sizeof(struct rtmsg)) {
63813e38901SDavid Ahern struct rtmsg *rtm = nlmsg_data(nlh);
639e8ba330aSDavid Ahern
640ef11209dSStefano Brivio if (rtm->rtm_flags & RTM_F_PREFIX)
641ef11209dSStefano Brivio arg.filter.flags = RTM_F_PREFIX;
64213e38901SDavid Ahern }
6431b43af54SPatrick McHardy
6441b43af54SPatrick McHardy w = (void *)cb->args[2];
645507c9b1eSDavid S. Miller if (!w) {
6461b43af54SPatrick McHardy /* New dump:
6471b43af54SPatrick McHardy *
648f2dd75e5SKuniyuki Iwashima * 1. allocate and initialize walker.
6491b43af54SPatrick McHardy */
6501b43af54SPatrick McHardy w = kzalloc(sizeof(*w), GFP_ATOMIC);
651507c9b1eSDavid S. Miller if (!w)
6521b43af54SPatrick McHardy return -ENOMEM;
6531b43af54SPatrick McHardy w->func = fib6_dump_node;
6541b43af54SPatrick McHardy cb->args[2] = (long)w;
655f2dd75e5SKuniyuki Iwashima
656f2dd75e5SKuniyuki Iwashima /* 2. hook callback destructor.
657f2dd75e5SKuniyuki Iwashima */
658f2dd75e5SKuniyuki Iwashima cb->args[3] = (long)cb->done;
659f2dd75e5SKuniyuki Iwashima cb->done = fib6_dump_done;
660f2dd75e5SKuniyuki Iwashima
6611b43af54SPatrick McHardy }
6621b43af54SPatrick McHardy
6631b43af54SPatrick McHardy arg.skb = skb;
6641b43af54SPatrick McHardy arg.cb = cb;
665191cd582SBrian Haley arg.net = net;
6661b43af54SPatrick McHardy w->args = &arg;
6671b43af54SPatrick McHardy
66813e38901SDavid Ahern if (arg.filter.table_id) {
66913e38901SDavid Ahern tb = fib6_get_table(net, arg.filter.table_id);
67013e38901SDavid Ahern if (!tb) {
67141b4bd98SSabrina Dubroca if (rtnl_msg_family(cb->nlh) != PF_INET6)
672e22d0bfaSAlexey Kodanev goto out;
673ae677bbbSDavid Ahern
67413e38901SDavid Ahern NL_SET_ERR_MSG_MOD(cb->extack, "FIB table does not exist");
67513e38901SDavid Ahern return -ENOENT;
67613e38901SDavid Ahern }
67713e38901SDavid Ahern
67873155879SDavid Ahern if (!cb->args[0]) {
67913e38901SDavid Ahern res = fib6_dump_table(tb, skb, cb);
68073155879SDavid Ahern if (!res)
68173155879SDavid Ahern cb->args[0] = 1;
68273155879SDavid Ahern }
68313e38901SDavid Ahern goto out;
68413e38901SDavid Ahern }
68513e38901SDavid Ahern
68613e38901SDavid Ahern s_h = cb->args[0];
68713e38901SDavid Ahern s_e = cb->args[1];
68813e38901SDavid Ahern
689e67f88ddSEric Dumazet rcu_read_lock();
690a33bc5c1SNeil Horman for (h = s_h; h < FIB6_TABLE_HASHSZ; h++, s_e = 0) {
6911b43af54SPatrick McHardy e = 0;
69258f09b78SDaniel Lezcano head = &net->ipv6.fib_table_hash[h];
693b67bfe0dSSasha Levin hlist_for_each_entry_rcu(tb, head, tb6_hlist) {
6941b43af54SPatrick McHardy if (e < s_e)
6951b43af54SPatrick McHardy goto next;
6961b43af54SPatrick McHardy res = fib6_dump_table(tb, skb, cb);
6971b43af54SPatrick McHardy if (res != 0)
69813e38901SDavid Ahern goto out_unlock;
6991b43af54SPatrick McHardy next:
7001b43af54SPatrick McHardy e++;
7011b43af54SPatrick McHardy }
7021b43af54SPatrick McHardy }
70313e38901SDavid Ahern out_unlock:
704e67f88ddSEric Dumazet rcu_read_unlock();
7051b43af54SPatrick McHardy cb->args[1] = e;
7061b43af54SPatrick McHardy cb->args[0] = h;
70713e38901SDavid Ahern out:
7081b43af54SPatrick McHardy res = res < 0 ? res : skb->len;
7091b43af54SPatrick McHardy if (res <= 0)
7101b43af54SPatrick McHardy fib6_dump_end(cb);
7111b43af54SPatrick McHardy return res;
7121b43af54SPatrick McHardy }
7131da177e4SLinus Torvalds
/*
 * Set metric number @metric (1-based, stored at index @metric - 1) of
 * @f6i to @val.
 *
 * A NULL @f6i is ignored. While the entry still points at the shared
 * dst_default_metrics, a zeroed private dst_metrics with a reference
 * count of one is allocated (GFP_ATOMIC) and installed first; when that
 * allocation fails the value is silently not stored.
 */
void fib6_metric_set(struct fib6_info *f6i, int metric, u32 val)
{
	struct dst_metrics *m;

	if (!f6i)
		return;

	m = f6i->fib6_metrics;
	if (m == &dst_default_metrics) {
		m = kzalloc(sizeof(*m), GFP_ATOMIC);
		if (!m)
			return;

		refcount_set(&m->refcnt, 1);
		f6i->fib6_metrics = m;
	}

	m->metrics[metric - 1] = val;
}
731d4ead6b3SDavid Ahern
7321da177e4SLinus Torvalds /*
7331da177e4SLinus Torvalds * Routing Table
7341da177e4SLinus Torvalds *
7351da177e4SLinus Torvalds * return the appropriate node for a routing tree "add" operation
7361da177e4SLinus Torvalds * by either creating and inserting or by returning an existing
7371da177e4SLinus Torvalds * node.
7381da177e4SLinus Torvalds */
7391da177e4SLinus Torvalds
/*
 * fib6_add_1 - find or create the tree node for the prefix addr/plen.
 *
 * The walk starts at root. For every node visited, the key is read from
 * the leaf of that node at byte offset "offset" and compared with addr
 * over the first fn_bit bits of the node.
 *
 *  - prefix mismatch, or plen shorter than fn_bit: a node is inserted
 *    above the current one (label insert_above);
 *  - plen equal to fn_bit: the existing node is returned;
 *  - otherwise the walk continues into the left or right child chosen by
 *    the bit of addr at position fn_bit; when that child is missing a new
 *    leaf node is attached there.
 *
 * allow_create / replace_required: when allow_create is 0 and a new node
 * would have to be created, the call fails with -ENOENT if
 * replace_required is set; otherwise only a warning is printed and the
 * node is created anyway.
 *
 * All tree pointers are read with rcu_dereference_protected() annotated
 * with lockdep_is_held(&table->tb6_lock).
 *
 * Returns the node, ERR_PTR(-ENOENT) or ERR_PTR(-ENOMEM).
 */
fib6_add_1(struct net * net,struct fib6_table * table,struct fib6_node * root,struct in6_addr * addr,int plen,int offset,int allow_create,int replace_required,struct netlink_ext_ack * extack)74081eb8447SWei Wang static struct fib6_node *fib6_add_1(struct net *net,
74181eb8447SWei Wang struct fib6_table *table,
74266f5d6ceSWei Wang struct fib6_node *root,
7439225b230Sfan.du struct in6_addr *addr, int plen,
7444a287ebaSMatti Vaittinen int offset, int allow_create,
745bbd63f06SWei Wang int replace_required,
746333c4301SDavid Ahern struct netlink_ext_ack *extack)
7471da177e4SLinus Torvalds {
7481da177e4SLinus Torvalds struct fib6_node *fn, *in, *ln;
7491da177e4SLinus Torvalds struct fib6_node *pn = NULL;
7501da177e4SLinus Torvalds struct rt6key *key;
7511da177e4SLinus Torvalds int bit;
752e69a4adcSAl Viro __be32 dir = 0;
7531da177e4SLinus Torvalds
7541da177e4SLinus Torvalds RT6_TRACE("fib6_add_1\n");
7551da177e4SLinus Torvalds
7561da177e4SLinus Torvalds /* insert node in tree */
7571da177e4SLinus Torvalds
7581da177e4SLinus Torvalds fn = root;
7591da177e4SLinus Torvalds
7601da177e4SLinus Torvalds do {
/* The key to compare against is located offset bytes into the leaf. */
7618d1c802bSDavid Ahern struct fib6_info *leaf = rcu_dereference_protected(fn->leaf,
76266f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
76366f5d6ceSWei Wang key = (struct rt6key *)((u8 *)leaf + offset);
7641da177e4SLinus Torvalds
7651da177e4SLinus Torvalds /*
7661da177e4SLinus Torvalds * Prefix match
7671da177e4SLinus Torvalds */
7681da177e4SLinus Torvalds if (plen < fn->fn_bit ||
7694a287ebaSMatti Vaittinen !ipv6_prefix_equal(&key->addr, addr, fn->fn_bit)) {
77014df015bSMatti Vaittinen if (!allow_create) {
77114df015bSMatti Vaittinen if (replace_required) {
772d5d531cbSDavid Ahern NL_SET_ERR_MSG(extack,
773d5d531cbSDavid Ahern "Can not replace route - no match found");
774f3213831SJoe Perches pr_warn("Can't replace route, no match found\n");
77514df015bSMatti Vaittinen return ERR_PTR(-ENOENT);
77614df015bSMatti Vaittinen }
777f3213831SJoe Perches pr_warn("NLM_F_CREATE should be set when creating new route\n");
77814df015bSMatti Vaittinen }
7791da177e4SLinus Torvalds goto insert_above;
7804a287ebaSMatti Vaittinen }
7811da177e4SLinus Torvalds
7821da177e4SLinus Torvalds /*
7831da177e4SLinus Torvalds * Exact match ?
7841da177e4SLinus Torvalds */
7851da177e4SLinus Torvalds
7861da177e4SLinus Torvalds if (plen == fn->fn_bit) {
7871da177e4SLinus Torvalds /* clean up an intermediate node */
788507c9b1eSDavid S. Miller if (!(fn->fn_flags & RTN_RTINFO)) {
78966f5d6ceSWei Wang RCU_INIT_POINTER(fn->leaf, NULL);
79093531c67SDavid Ahern fib6_info_release(leaf);
7914512c43eSWei Wang /* remove null_entry in the root node */
7924512c43eSWei Wang } else if (fn->fn_flags & RTN_TL_ROOT &&
7934512c43eSWei Wang rcu_access_pointer(fn->leaf) ==
794421842edSDavid Ahern net->ipv6.fib6_null_entry) {
7954512c43eSWei Wang RCU_INIT_POINTER(fn->leaf, NULL);
7961da177e4SLinus Torvalds }
7971da177e4SLinus Torvalds
7981da177e4SLinus Torvalds return fn;
7991da177e4SLinus Torvalds }
8001da177e4SLinus Torvalds
8011da177e4SLinus Torvalds /*
8021da177e4SLinus Torvalds * We have more bits to go
8031da177e4SLinus Torvalds */
8041da177e4SLinus Torvalds
8051da177e4SLinus Torvalds /* Try to walk down on tree. */
8061da177e4SLinus Torvalds dir = addr_bit_set(addr, fn->fn_bit);
8071da177e4SLinus Torvalds pn = fn;
80866f5d6ceSWei Wang fn = dir ?
80966f5d6ceSWei Wang rcu_dereference_protected(fn->right,
81066f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock)) :
81166f5d6ceSWei Wang rcu_dereference_protected(fn->left,
81266f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
8131da177e4SLinus Torvalds } while (fn);
8141da177e4SLinus Torvalds
/* The walk ran off the bottom of the tree: pn is the last node visited
 * and dir selects the child slot of pn that was found empty.
 */
81514df015bSMatti Vaittinen if (!allow_create) {
8164a287ebaSMatti Vaittinen /* We should not create new node because
8174a287ebaSMatti Vaittinen * NLM_F_REPLACE was specified without NLM_F_CREATE
8184a287ebaSMatti Vaittinen * I assume it is safe to require NLM_F_CREATE when
8194a287ebaSMatti Vaittinen * REPLACE flag is used! Later we may want to remove the
8204a287ebaSMatti Vaittinen * check for replace_required, because according
8214a287ebaSMatti Vaittinen * to netlink specification, NLM_F_CREATE
8224a287ebaSMatti Vaittinen * MUST be specified if new route is created.
8234a287ebaSMatti Vaittinen * That would keep IPv6 consistent with IPv4
8244a287ebaSMatti Vaittinen */
82514df015bSMatti Vaittinen if (replace_required) {
826d5d531cbSDavid Ahern NL_SET_ERR_MSG(extack,
827d5d531cbSDavid Ahern "Can not replace route - no match found");
828f3213831SJoe Perches pr_warn("Can't replace route, no match found\n");
8294a287ebaSMatti Vaittinen return ERR_PTR(-ENOENT);
8304a287ebaSMatti Vaittinen }
831f3213831SJoe Perches pr_warn("NLM_F_CREATE should be set when creating new route\n");
83214df015bSMatti Vaittinen }
8331da177e4SLinus Torvalds /*
8341da177e4SLinus Torvalds * We walked to the bottom of tree.
8351da177e4SLinus Torvalds * Create new leaf node without children.
8361da177e4SLinus Torvalds */
8371da177e4SLinus Torvalds
83881eb8447SWei Wang ln = node_alloc(net);
8391da177e4SLinus Torvalds
840507c9b1eSDavid S. Miller if (!ln)
841188c517aSLin Ming return ERR_PTR(-ENOMEM);
8421da177e4SLinus Torvalds ln->fn_bit = plen;
84366f5d6ceSWei Wang RCU_INIT_POINTER(ln->parent, pn);
8441da177e4SLinus Torvalds
8451da177e4SLinus Torvalds if (dir)
84666f5d6ceSWei Wang rcu_assign_pointer(pn->right, ln);
8471da177e4SLinus Torvalds else
84866f5d6ceSWei Wang rcu_assign_pointer(pn->left, ln);
8491da177e4SLinus Torvalds
8501da177e4SLinus Torvalds return ln;
8511da177e4SLinus Torvalds
8521da177e4SLinus Torvalds
8531da177e4SLinus Torvalds insert_above:
8541da177e4SLinus Torvalds /*
8551da177e4SLinus Torvalds * split since we don't have a common prefix anymore or
8561da177e4SLinus Torvalds * we have a less significant route.
8571da177e4SLinus Torvalds * we've to insert an intermediate node on the list
8581da177e4SLinus Torvalds * this new node will point to the one we need to create
8591da177e4SLinus Torvalds * and the current
8601da177e4SLinus Torvalds */
8611da177e4SLinus Torvalds
86266f5d6ceSWei Wang pn = rcu_dereference_protected(fn->parent,
86366f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
8641da177e4SLinus Torvalds
8651da177e4SLinus Torvalds /* find 1st bit in difference between the 2 addrs.
8661da177e4SLinus Torvalds
867971f359dSYOSHIFUJI Hideaki See comment in __ipv6_addr_diff: bit may be an invalid value,
8681da177e4SLinus Torvalds but if it is >= plen, the value is ignored in any case.
8691da177e4SLinus Torvalds */
8701da177e4SLinus Torvalds
8719225b230Sfan.du bit = __ipv6_addr_diff(addr, &key->addr, sizeof(*addr));
8721da177e4SLinus Torvalds
8731da177e4SLinus Torvalds /*
8741da177e4SLinus Torvalds * (intermediate)[in]
8751da177e4SLinus Torvalds * / \
8761da177e4SLinus Torvalds * (new leaf node)[ln] (old node)[fn]
8771da177e4SLinus Torvalds */
8781da177e4SLinus Torvalds if (plen > bit) {
87981eb8447SWei Wang in = node_alloc(net);
88081eb8447SWei Wang ln = node_alloc(net);
8811da177e4SLinus Torvalds
882507c9b1eSDavid S. Miller if (!in || !ln) {
/* Neither node has been linked into the tree at this point. */
8831da177e4SLinus Torvalds if (in)
88481eb8447SWei Wang node_free_immediate(net, in);
8851da177e4SLinus Torvalds if (ln)
88681eb8447SWei Wang node_free_immediate(net, ln);
887188c517aSLin Ming return ERR_PTR(-ENOMEM);
8881da177e4SLinus Torvalds }
8891da177e4SLinus Torvalds
8901da177e4SLinus Torvalds /*
8911da177e4SLinus Torvalds * new intermediate node.
8921da177e4SLinus Torvalds * RTN_RTINFO will
8931da177e4SLinus Torvalds * be off since that an address that chooses one of
8941da177e4SLinus Torvalds * the branches would not match less specific routes
8951da177e4SLinus Torvalds * in the other branch
8961da177e4SLinus Torvalds */
8971da177e4SLinus Torvalds
8981da177e4SLinus Torvalds in->fn_bit = bit;
8991da177e4SLinus Torvalds
90066f5d6ceSWei Wang RCU_INIT_POINTER(in->parent, pn);
9011da177e4SLinus Torvalds in->leaf = fn->leaf;
/* The intermediate node shares the leaf of fn and takes its own
 * reference on it.
 */
9025ea71528SEric Dumazet fib6_info_hold(rcu_dereference_protected(in->leaf,
9035ea71528SEric Dumazet lockdep_is_held(&table->tb6_lock)));
9041da177e4SLinus Torvalds
9051da177e4SLinus Torvalds /* update parent pointer */
9061da177e4SLinus Torvalds if (dir)
90766f5d6ceSWei Wang rcu_assign_pointer(pn->right, in);
9081da177e4SLinus Torvalds else
90966f5d6ceSWei Wang rcu_assign_pointer(pn->left, in);
9101da177e4SLinus Torvalds
9111da177e4SLinus Torvalds ln->fn_bit = plen;
9121da177e4SLinus Torvalds
91366f5d6ceSWei Wang RCU_INIT_POINTER(ln->parent, in);
91466f5d6ceSWei Wang rcu_assign_pointer(fn->parent, in);
9151da177e4SLinus Torvalds
9161da177e4SLinus Torvalds if (addr_bit_set(addr, bit)) {
91766f5d6ceSWei Wang rcu_assign_pointer(in->right, ln);
91866f5d6ceSWei Wang rcu_assign_pointer(in->left, fn);
9191da177e4SLinus Torvalds } else {
92066f5d6ceSWei Wang rcu_assign_pointer(in->left, ln);
92166f5d6ceSWei Wang rcu_assign_pointer(in->right, fn);
9221da177e4SLinus Torvalds }
9231da177e4SLinus Torvalds } else { /* plen <= bit */
9241da177e4SLinus Torvalds
9251da177e4SLinus Torvalds /*
9261da177e4SLinus Torvalds * (new leaf node)[ln]
9271da177e4SLinus Torvalds * / \
9281da177e4SLinus Torvalds * (old node)[fn] NULL
9291da177e4SLinus Torvalds */
9301da177e4SLinus Torvalds
93181eb8447SWei Wang ln = node_alloc(net);
9321da177e4SLinus Torvalds
933507c9b1eSDavid S. Miller if (!ln)
934188c517aSLin Ming return ERR_PTR(-ENOMEM);
9351da177e4SLinus Torvalds
9361da177e4SLinus Torvalds ln->fn_bit = plen;
9371da177e4SLinus Torvalds
93866f5d6ceSWei Wang RCU_INIT_POINTER(ln->parent, pn);
9391da177e4SLinus Torvalds
9401da177e4SLinus Torvalds if (addr_bit_set(&key->addr, plen))
94166f5d6ceSWei Wang RCU_INIT_POINTER(ln->right, fn);
9421da177e4SLinus Torvalds else
94366f5d6ceSWei Wang RCU_INIT_POINTER(ln->left, fn);
9441da177e4SLinus Torvalds
94566f5d6ceSWei Wang rcu_assign_pointer(fn->parent, ln);
94666f5d6ceSWei Wang
94766f5d6ceSWei Wang if (dir)
94866f5d6ceSWei Wang rcu_assign_pointer(pn->right, ln);
94966f5d6ceSWei Wang else
95066f5d6ceSWei Wang rcu_assign_pointer(pn->left, ln);
9511da177e4SLinus Torvalds }
9521da177e4SLinus Torvalds return ln;
9531da177e4SLinus Torvalds }
9541da177e4SLinus Torvalds
__fib6_drop_pcpu_from(struct fib6_nh * fib6_nh,const struct fib6_info * match,const struct fib6_table * table)9557d88d8b5SDavid Ahern static void __fib6_drop_pcpu_from(struct fib6_nh *fib6_nh,
9567d88d8b5SDavid Ahern const struct fib6_info *match,
9575bcaa41bSDavid Ahern const struct fib6_table *table)
958e5fd387aSMichal Kubeček {
9595bcaa41bSDavid Ahern int cpu;
960e5fd387aSMichal Kubeček
961f40b6ae2SDavid Ahern if (!fib6_nh->rt6i_pcpu)
962f40b6ae2SDavid Ahern return;
963f40b6ae2SDavid Ahern
9647e796c3fSEric Dumazet rcu_read_lock();
9655bcaa41bSDavid Ahern /* release the reference to this fib entry from
9665bcaa41bSDavid Ahern * all of its cached pcpu routes
9675bcaa41bSDavid Ahern */
9685bcaa41bSDavid Ahern for_each_possible_cpu(cpu) {
9695bcaa41bSDavid Ahern struct rt6_info **ppcpu_rt;
9705bcaa41bSDavid Ahern struct rt6_info *pcpu_rt;
9715bcaa41bSDavid Ahern
972f40b6ae2SDavid Ahern ppcpu_rt = per_cpu_ptr(fib6_nh->rt6i_pcpu, cpu);
9737e796c3fSEric Dumazet
9747e796c3fSEric Dumazet /* Paired with xchg() in rt6_get_pcpu_route() */
9757e796c3fSEric Dumazet pcpu_rt = READ_ONCE(*ppcpu_rt);
9767d88d8b5SDavid Ahern
9777d88d8b5SDavid Ahern /* only dropping the 'from' reference if the cached route
9787d88d8b5SDavid Ahern * is using 'match'. The cached pcpu_rt->from only changes
9797d88d8b5SDavid Ahern * from a fib6_info to NULL (ip6_dst_destroy); it can never
9807d88d8b5SDavid Ahern * change from one fib6_info reference to another
9817d88d8b5SDavid Ahern */
9827d88d8b5SDavid Ahern if (pcpu_rt && rcu_access_pointer(pcpu_rt->from) == match) {
983a68886a6SDavid Ahern struct fib6_info *from;
984a68886a6SDavid Ahern
98570530a2fSEric Dumazet from = unrcu_pointer(xchg(&pcpu_rt->from, NULL));
986a68886a6SDavid Ahern fib6_info_release(from);
9875bcaa41bSDavid Ahern }
988e715b6d3SFlorian Westphal }
9897e796c3fSEric Dumazet rcu_read_unlock();
990e715b6d3SFlorian Westphal }
991e715b6d3SFlorian Westphal
/* Argument bundle handed by fib6_drop_pcpu_from() to
 * fib6_nh_drop_pcpu_from() through nexthop_for_each_fib6_nh().
 */
9922ab75bfbSDavid Ahern struct fib6_nh_pcpu_arg {
/* fib6 entry whose per-cpu cached routes must drop their reference */
9932ab75bfbSDavid Ahern struct fib6_info *from;
/* table forwarded unchanged to __fib6_drop_pcpu_from() */
9942ab75bfbSDavid Ahern const struct fib6_table *table;
9952ab75bfbSDavid Ahern };
9962ab75bfbSDavid Ahern
fib6_nh_drop_pcpu_from(struct fib6_nh * nh,void * _arg)9972ab75bfbSDavid Ahern static int fib6_nh_drop_pcpu_from(struct fib6_nh *nh, void *_arg)
9982ab75bfbSDavid Ahern {
9992ab75bfbSDavid Ahern struct fib6_nh_pcpu_arg *arg = _arg;
10002ab75bfbSDavid Ahern
10012ab75bfbSDavid Ahern __fib6_drop_pcpu_from(nh, arg->from, arg->table);
10022ab75bfbSDavid Ahern return 0;
10032ab75bfbSDavid Ahern }
10042ab75bfbSDavid Ahern
fib6_drop_pcpu_from(struct fib6_info * f6i,const struct fib6_table * table)10057d88d8b5SDavid Ahern static void fib6_drop_pcpu_from(struct fib6_info *f6i,
10067d88d8b5SDavid Ahern const struct fib6_table *table)
10077d88d8b5SDavid Ahern {
10087d88d8b5SDavid Ahern /* Make sure rt6_make_pcpu_route() wont add other percpu routes
10097d88d8b5SDavid Ahern * while we are cleaning them here.
10107d88d8b5SDavid Ahern */
10117d88d8b5SDavid Ahern f6i->fib6_destroying = 1;
10127d88d8b5SDavid Ahern mb(); /* paired with the cmpxchg() in rt6_make_pcpu_route() */
10137d88d8b5SDavid Ahern
10142ab75bfbSDavid Ahern if (f6i->nh) {
10152ab75bfbSDavid Ahern struct fib6_nh_pcpu_arg arg = {
10162ab75bfbSDavid Ahern .from = f6i,
10172ab75bfbSDavid Ahern .table = table
10182ab75bfbSDavid Ahern };
10192ab75bfbSDavid Ahern
10202ab75bfbSDavid Ahern nexthop_for_each_fib6_nh(f6i->nh, fib6_nh_drop_pcpu_from,
10212ab75bfbSDavid Ahern &arg);
10222ab75bfbSDavid Ahern } else {
10232ab75bfbSDavid Ahern struct fib6_nh *fib6_nh;
10242ab75bfbSDavid Ahern
10251cf844c7SDavid Ahern fib6_nh = f6i->fib6_nh;
10267d88d8b5SDavid Ahern __fib6_drop_pcpu_from(fib6_nh, f6i, table);
10277d88d8b5SDavid Ahern }
10282ab75bfbSDavid Ahern }
10297d88d8b5SDavid Ahern
fib6_purge_rt(struct fib6_info * rt,struct fib6_node * fn,struct net * net)10308d1c802bSDavid Ahern static void fib6_purge_rt(struct fib6_info *rt, struct fib6_node *fn,
10316e9e16e6SHannes Frederic Sowa struct net *net)
10326e9e16e6SHannes Frederic Sowa {
103393c2fb25SDavid Ahern struct fib6_table *table = rt->fib6_table;
103466f5d6ceSWei Wang
1035d8f5c296SSean Tranchetti /* Flush all cached dst in exception table */
1036d8f5c296SSean Tranchetti rt6_flush_exceptions(rt);
103761fb0d01SEric Dumazet fib6_drop_pcpu_from(rt, table);
103861fb0d01SEric Dumazet
1039f88d8ea6SDavid Ahern if (rt->nh && !list_empty(&rt->nh_list))
1040f88d8ea6SDavid Ahern list_del_init(&rt->nh_list);
1041f88d8ea6SDavid Ahern
1042f05713e0SEric Dumazet if (refcount_read(&rt->fib6_ref) != 1) {
10436e9e16e6SHannes Frederic Sowa /* This route is used as dummy address holder in some split
10446e9e16e6SHannes Frederic Sowa * nodes. It is not leaked, but it still holds other resources,
10456e9e16e6SHannes Frederic Sowa * which must be released in time. So, scan ascendant nodes
10466e9e16e6SHannes Frederic Sowa * and replace dummy references to this route with references
10476e9e16e6SHannes Frederic Sowa * to still alive ones.
10486e9e16e6SHannes Frederic Sowa */
10496e9e16e6SHannes Frederic Sowa while (fn) {
10508d1c802bSDavid Ahern struct fib6_info *leaf = rcu_dereference_protected(fn->leaf,
105166f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
10528d1c802bSDavid Ahern struct fib6_info *new_leaf;
105366f5d6ceSWei Wang if (!(fn->fn_flags & RTN_RTINFO) && leaf == rt) {
105466f5d6ceSWei Wang new_leaf = fib6_find_prefix(net, table, fn);
10555ea71528SEric Dumazet fib6_info_hold(new_leaf);
105693531c67SDavid Ahern
105766f5d6ceSWei Wang rcu_assign_pointer(fn->leaf, new_leaf);
105893531c67SDavid Ahern fib6_info_release(rt);
10596e9e16e6SHannes Frederic Sowa }
106066f5d6ceSWei Wang fn = rcu_dereference_protected(fn->parent,
106166f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
10626e9e16e6SHannes Frederic Sowa }
10636e9e16e6SHannes Frederic Sowa }
10646e9e16e6SHannes Frederic Sowa }
10656e9e16e6SHannes Frederic Sowa
10661da177e4SLinus Torvalds /*
10671da177e4SLinus Torvalds * Insert routing information in a node.
10681da177e4SLinus Torvalds */
10691da177e4SLinus Torvalds
/*
 * fib6_add_rt2node - link rt into the list of routes hanging off fn->leaf.
 *
 * Behaviour depends on the netlink flags in info->nlh, when present:
 *   NLM_F_EXCL    - fail with -EEXIST if a route with the same metric is
 *                   already in the list
 *   NLM_F_REPLACE - replace an existing route that has the same metric
 *   NLM_F_CREATE  - allow adding a new route; treated as set when
 *                   info->nlh is NULL
 *   NLM_F_APPEND  - only carried into the flags given to inet6_rt_notify()
 *
 * The list is scanned from the head and the scan stops at the first entry
 * whose metric is greater than the metric of rt, which becomes the
 * insertion point.
 *
 * The list is walked with rcu_dereference_protected() annotated with
 * lockdep_is_held(&rt->fib6_table->tb6_lock).
 *
 * Returns 0 on success, -EEXIST for an exclusive-add conflict or a
 * duplicate nexthop, -ENOENT when a replace finds no route and creation
 * is not allowed, or the error from call_fib6_entry_notifiers().
 */
fib6_add_rt2node(struct fib6_node * fn,struct fib6_info * rt,struct nl_info * info,struct netlink_ext_ack * extack)10708d1c802bSDavid Ahern static int fib6_add_rt2node(struct fib6_node *fn, struct fib6_info *rt,
1071d4ead6b3SDavid Ahern struct nl_info *info,
10726c31e5a9SDavid Ahern struct netlink_ext_ack *extack)
10731da177e4SLinus Torvalds {
10748d1c802bSDavid Ahern struct fib6_info *leaf = rcu_dereference_protected(fn->leaf,
107593c2fb25SDavid Ahern lockdep_is_held(&rt->fib6_table->tb6_lock));
107633bd5ac5SDavid Ahern struct fib6_info *iter = NULL;
10778d1c802bSDavid Ahern struct fib6_info __rcu **ins;
107833bd5ac5SDavid Ahern struct fib6_info __rcu **fallback_ins = NULL;
1079507c9b1eSDavid S. Miller int replace = (info->nlh &&
10804a287ebaSMatti Vaittinen (info->nlh->nlmsg_flags & NLM_F_REPLACE));
1081507c9b1eSDavid S. Miller int add = (!info->nlh ||
10824a287ebaSMatti Vaittinen (info->nlh->nlmsg_flags & NLM_F_CREATE));
10834a287ebaSMatti Vaittinen int found = 0;
108433bd5ac5SDavid Ahern bool rt_can_ecmp = rt6_qualify_for_ecmp(rt);
1085c10c4279SIdo Schimmel bool notify_sibling_rt = false;
108673483c12SGuillaume Nault u16 nlflags = NLM_F_EXCL;
1087e5fd387aSMichal Kubeček int err;
10881da177e4SLinus Torvalds
108933bd5ac5SDavid Ahern if (info->nlh && (info->nlh->nlmsg_flags & NLM_F_APPEND))
10901f5e29ceSDavid Ahern nlflags |= NLM_F_APPEND;
10911f5e29ceSDavid Ahern
10921da177e4SLinus Torvalds ins = &fn->leaf;
10931da177e4SLinus Torvalds
109466f5d6ceSWei Wang for (iter = leaf; iter;
10958fb11a9aSDavid Ahern iter = rcu_dereference_protected(iter->fib6_next,
109693c2fb25SDavid Ahern lockdep_is_held(&rt->fib6_table->tb6_lock))) {
10971da177e4SLinus Torvalds /*
10981da177e4SLinus Torvalds * Search for duplicates
10991da177e4SLinus Torvalds */
11001da177e4SLinus Torvalds
110193c2fb25SDavid Ahern if (iter->fib6_metric == rt->fib6_metric) {
11021da177e4SLinus Torvalds /*
11031da177e4SLinus Torvalds * Same priority level
11041da177e4SLinus Torvalds */
1105507c9b1eSDavid S. Miller if (info->nlh &&
11064a287ebaSMatti Vaittinen (info->nlh->nlmsg_flags & NLM_F_EXCL))
11074a287ebaSMatti Vaittinen return -EEXIST;
110873483c12SGuillaume Nault
110973483c12SGuillaume Nault nlflags &= ~NLM_F_EXCL;
11104a287ebaSMatti Vaittinen if (replace) {
111133bd5ac5SDavid Ahern if (rt_can_ecmp == rt6_qualify_for_ecmp(iter)) {
11124a287ebaSMatti Vaittinen found++;
11134a287ebaSMatti Vaittinen break;
11144a287ebaSMatti Vaittinen }
/* Remember the first same-metric entry in case no entry with
 * matching ECMP eligibility turns up later in the list.
 */
111533bd5ac5SDavid Ahern fallback_ins = fallback_ins ?: ins;
111633bd5ac5SDavid Ahern goto next_iter;
111733bd5ac5SDavid Ahern }
11181da177e4SLinus Torvalds
/* Same nexthop: nothing is inserted. If the existing route can
 * expire, its expiry and MTU are refreshed from rt before -EEXIST
 * is returned.
 */
1119f06b7549SDavid Ahern if (rt6_duplicate_nexthop(iter, rt)) {
112093c2fb25SDavid Ahern if (rt->fib6_nsiblings)
112193c2fb25SDavid Ahern rt->fib6_nsiblings = 0;
112293c2fb25SDavid Ahern if (!(iter->fib6_flags & RTF_EXPIRES))
11231da177e4SLinus Torvalds return -EEXIST;
112493c2fb25SDavid Ahern if (!(rt->fib6_flags & RTF_EXPIRES))
1125b577b9aaSDavid Ahern fib6_clean_expires(iter);
11261716a961SGao feng else
1127b577b9aaSDavid Ahern fib6_set_expires(iter, rt->expires);
112815a81b41SDavid Ahern
112915a81b41SDavid Ahern if (rt->fib6_pmtu)
113015a81b41SDavid Ahern fib6_metric_set(iter, RTAX_MTU,
113115a81b41SDavid Ahern rt->fib6_pmtu);
11321da177e4SLinus Torvalds return -EEXIST;
11331da177e4SLinus Torvalds }
113433bd5ac5SDavid Ahern /* If we have the same destination and the same metric,
113533bd5ac5SDavid Ahern * but not the same gateway, then the route we try to
113633bd5ac5SDavid Ahern * add is sibling to this route, increment our counter
113733bd5ac5SDavid Ahern * of siblings, and later we will add our route to the
113833bd5ac5SDavid Ahern * list.
113933bd5ac5SDavid Ahern * Only static routes (which don't have flag
114033bd5ac5SDavid Ahern * RTF_EXPIRES) are used for ECMPv6.
114133bd5ac5SDavid Ahern *
114233bd5ac5SDavid Ahern * To avoid long list, we only had siblings if the
114333bd5ac5SDavid Ahern * route have a gateway.
114433bd5ac5SDavid Ahern */
114533bd5ac5SDavid Ahern if (rt_can_ecmp &&
114633bd5ac5SDavid Ahern rt6_qualify_for_ecmp(iter))
114733bd5ac5SDavid Ahern rt->fib6_nsiblings++;
11481da177e4SLinus Torvalds }
11491da177e4SLinus Torvalds
115093c2fb25SDavid Ahern if (iter->fib6_metric > rt->fib6_metric)
11511da177e4SLinus Torvalds break;
11521da177e4SLinus Torvalds
115333bd5ac5SDavid Ahern next_iter:
11548fb11a9aSDavid Ahern ins = &iter->fib6_next;
115527596472SMichal Kubeček }
115627596472SMichal Kubeček
115733bd5ac5SDavid Ahern if (fallback_ins && !found) {
1158e404b8c7SBenjamin Poirier /* No matching route with same ecmp-able-ness found, replace
1159e404b8c7SBenjamin Poirier * first matching route
1160e404b8c7SBenjamin Poirier */
116133bd5ac5SDavid Ahern ins = fallback_ins;
116233bd5ac5SDavid Ahern iter = rcu_dereference_protected(*ins,
116333bd5ac5SDavid Ahern lockdep_is_held(&rt->fib6_table->tb6_lock));
116433bd5ac5SDavid Ahern found++;
116533bd5ac5SDavid Ahern }
116633bd5ac5SDavid Ahern
1167f11e6659SDavid S. Miller /* Reset round-robin state, if necessary */
1168f11e6659SDavid S. Miller if (ins == &fn->leaf)
1169f11e6659SDavid S. Miller fn->rr_ptr = NULL;
1170f11e6659SDavid S. Miller
117151ebd318SNicolas Dichtel /* Link this route to others same route. */
117233bd5ac5SDavid Ahern if (rt->fib6_nsiblings) {
117333bd5ac5SDavid Ahern unsigned int fib6_nsiblings;
11748d1c802bSDavid Ahern struct fib6_info *sibling, *temp_sibling;
117551ebd318SNicolas Dichtel
117633bd5ac5SDavid Ahern /* Find the first route that have the same metric */
117733bd5ac5SDavid Ahern sibling = leaf;
1178c10c4279SIdo Schimmel notify_sibling_rt = true;
117933bd5ac5SDavid Ahern while (sibling) {
118033bd5ac5SDavid Ahern if (sibling->fib6_metric == rt->fib6_metric &&
118133bd5ac5SDavid Ahern rt6_qualify_for_ecmp(sibling)) {
1182*52da0252SOmid Ehtemam-Haghighi list_add_tail_rcu(&rt->fib6_siblings,
118333bd5ac5SDavid Ahern &sibling->fib6_siblings);
118433bd5ac5SDavid Ahern break;
118551ebd318SNicolas Dichtel }
118633bd5ac5SDavid Ahern sibling = rcu_dereference_protected(sibling->fib6_next,
118733bd5ac5SDavid Ahern lockdep_is_held(&rt->fib6_table->tb6_lock));
1188c10c4279SIdo Schimmel notify_sibling_rt = false;
118933bd5ac5SDavid Ahern }
119051ebd318SNicolas Dichtel /* For each sibling in the list, increment the counter of
119151ebd318SNicolas Dichtel * siblings. BUG() if counters does not match, list of siblings
119251ebd318SNicolas Dichtel * is broken!
119351ebd318SNicolas Dichtel */
119433bd5ac5SDavid Ahern fib6_nsiblings = 0;
119551ebd318SNicolas Dichtel list_for_each_entry_safe(sibling, temp_sibling,
119633bd5ac5SDavid Ahern &rt->fib6_siblings, fib6_siblings) {
119793c2fb25SDavid Ahern sibling->fib6_nsiblings++;
119833bd5ac5SDavid Ahern BUG_ON(sibling->fib6_nsiblings != rt->fib6_nsiblings);
119933bd5ac5SDavid Ahern fib6_nsiblings++;
120051ebd318SNicolas Dichtel }
120133bd5ac5SDavid Ahern BUG_ON(fib6_nsiblings != rt->fib6_nsiblings);
120233bd5ac5SDavid Ahern rt6_multipath_rebalance(temp_sibling);
120351ebd318SNicolas Dichtel }
120451ebd318SNicolas Dichtel
12051da177e4SLinus Torvalds /*
12061da177e4SLinus Torvalds * insert node
12071da177e4SLinus Torvalds */
12084a287ebaSMatti Vaittinen if (!replace) {
12094a287ebaSMatti Vaittinen if (!add)
1210f3213831SJoe Perches pr_warn("NLM_F_CREATE should be set when creating new route\n");
12111da177e4SLinus Torvalds
/* Also reached by goto from the replace branch below when no route
 * was found to replace and creation is allowed.
 */
12124a287ebaSMatti Vaittinen add:
121373483c12SGuillaume Nault nlflags |= NLM_F_CREATE;
1214e715b6d3SFlorian Westphal
1215caafb250SIdo Schimmel /* The route should only be notified if it is the first
1216caafb250SIdo Schimmel * route in the node or if it is added as a sibling
1217caafb250SIdo Schimmel * route to the first route in the node.
1218caafb250SIdo Schimmel */
1219caafb250SIdo Schimmel if (!info->skip_notify_kernel &&
1220caafb250SIdo Schimmel (notify_sibling_rt || ins == &fn->leaf)) {
1221c10c4279SIdo Schimmel enum fib_event_type fib_event;
1222c10c4279SIdo Schimmel
1223c10c4279SIdo Schimmel if (notify_sibling_rt)
1224c10c4279SIdo Schimmel fib_event = FIB_EVENT_ENTRY_APPEND;
1225c10c4279SIdo Schimmel else
1226caafb250SIdo Schimmel fib_event = FIB_EVENT_ENTRY_REPLACE;
1227c10c4279SIdo Schimmel err = call_fib6_entry_notifiers(info->nl_net,
1228c10c4279SIdo Schimmel fib_event, rt,
1229c10c4279SIdo Schimmel extack);
123054851aa9SIdo Schimmel if (err) {
123154851aa9SIdo Schimmel struct fib6_info *sibling, *next_sibling;
123254851aa9SIdo Schimmel
123354851aa9SIdo Schimmel /* If the route has siblings, then it first
123454851aa9SIdo Schimmel * needs to be unlinked from them.
123554851aa9SIdo Schimmel */
123654851aa9SIdo Schimmel if (!rt->fib6_nsiblings)
1237e5fd387aSMichal Kubeček return err;
123854851aa9SIdo Schimmel
123954851aa9SIdo Schimmel list_for_each_entry_safe(sibling, next_sibling,
124054851aa9SIdo Schimmel &rt->fib6_siblings,
124154851aa9SIdo Schimmel fib6_siblings)
124254851aa9SIdo Schimmel sibling->fib6_nsiblings--;
124354851aa9SIdo Schimmel rt->fib6_nsiblings = 0;
1244*52da0252SOmid Ehtemam-Haghighi list_del_rcu(&rt->fib6_siblings);
124554851aa9SIdo Schimmel rt6_multipath_rebalance(next_sibling);
124654851aa9SIdo Schimmel return err;
124754851aa9SIdo Schimmel }
1248d5382fefSIdo Schimmel }
1249e5fd387aSMichal Kubeček
12508fb11a9aSDavid Ahern rcu_assign_pointer(rt->fib6_next, iter);
12515ea71528SEric Dumazet fib6_info_hold(rt);
125293c2fb25SDavid Ahern rcu_assign_pointer(rt->fib6_node, fn);
125366f5d6ceSWei Wang rcu_assign_pointer(*ins, rt);
12543b1137feSDavid Ahern if (!info->skip_notify)
125573483c12SGuillaume Nault inet6_rt_notify(RTM_NEWROUTE, rt, info, nlflags);
1256c572872fSBenjamin Thery info->nl_net->ipv6.rt6_stats->fib_rt_entries++;
12571da177e4SLinus Torvalds
1258507c9b1eSDavid S. Miller if (!(fn->fn_flags & RTN_RTINFO)) {
1259c572872fSBenjamin Thery info->nl_net->ipv6.rt6_stats->fib_route_nodes++;
12601da177e4SLinus Torvalds fn->fn_flags |= RTN_RTINFO;
12611da177e4SLinus Torvalds }
12621da177e4SLinus Torvalds
12634a287ebaSMatti Vaittinen } else {
126433bd5ac5SDavid Ahern int nsiblings;
126527596472SMichal Kubeček
12664a287ebaSMatti Vaittinen if (!found) {
12674a287ebaSMatti Vaittinen if (add)
12684a287ebaSMatti Vaittinen goto add;
1269f3213831SJoe Perches pr_warn("NLM_F_REPLACE set, but no existing node found!\n");
12704a287ebaSMatti Vaittinen return -ENOENT;
12714a287ebaSMatti Vaittinen }
1272e715b6d3SFlorian Westphal
1273caafb250SIdo Schimmel if (!info->skip_notify_kernel && ins == &fn->leaf) {
12742233000cSDavid Ahern err = call_fib6_entry_notifiers(info->nl_net,
12752233000cSDavid Ahern FIB_EVENT_ENTRY_REPLACE,
12762233000cSDavid Ahern rt, extack);
12772233000cSDavid Ahern if (err)
12782233000cSDavid Ahern return err;
1279d5382fefSIdo Schimmel }
12802233000cSDavid Ahern
12815ea71528SEric Dumazet fib6_info_hold(rt);
128293c2fb25SDavid Ahern rcu_assign_pointer(rt->fib6_node, fn);
128333bd5ac5SDavid Ahern rt->fib6_next = iter->fib6_next;
128466f5d6ceSWei Wang rcu_assign_pointer(*ins, rt);
12853b1137feSDavid Ahern if (!info->skip_notify)
128637a1d361SRoopa Prabhu inet6_rt_notify(RTM_NEWROUTE, rt, info, NLM_F_REPLACE);
1287507c9b1eSDavid S. Miller if (!(fn->fn_flags & RTN_RTINFO)) {
12884a287ebaSMatti Vaittinen info->nl_net->ipv6.rt6_stats->fib_route_nodes++;
12894a287ebaSMatti Vaittinen fn->fn_flags |= RTN_RTINFO;
12904a287ebaSMatti Vaittinen }
/* iter was replaced by rt in the list above; remember its sibling
 * count before it is purged and released.
 */
129133bd5ac5SDavid Ahern nsiblings = iter->fib6_nsiblings;
129293c2fb25SDavid Ahern iter->fib6_node = NULL;
129327596472SMichal Kubeček fib6_purge_rt(iter, fn, info->nl_net);
129466f5d6ceSWei Wang if (rcu_access_pointer(fn->rr_ptr) == iter)
1295383143f3SWei Wang fn->rr_ptr = NULL;
129693531c67SDavid Ahern fib6_info_release(iter);
12976e9e16e6SHannes Frederic Sowa
129833bd5ac5SDavid Ahern if (nsiblings) {
129933bd5ac5SDavid Ahern /* Replacing an ECMP route, remove all siblings */
130033bd5ac5SDavid Ahern ins = &rt->fib6_next;
130133bd5ac5SDavid Ahern iter = rcu_dereference_protected(*ins,
130233bd5ac5SDavid Ahern lockdep_is_held(&rt->fib6_table->tb6_lock));
130333bd5ac5SDavid Ahern while (iter) {
130433bd5ac5SDavid Ahern if (iter->fib6_metric > rt->fib6_metric)
130533bd5ac5SDavid Ahern break;
130633bd5ac5SDavid Ahern if (rt6_qualify_for_ecmp(iter)) {
130733bd5ac5SDavid Ahern *ins = iter->fib6_next;
130833bd5ac5SDavid Ahern iter->fib6_node = NULL;
130933bd5ac5SDavid Ahern fib6_purge_rt(iter, fn, info->nl_net);
131033bd5ac5SDavid Ahern if (rcu_access_pointer(fn->rr_ptr) == iter)
1311f34436a4SDavid Ahern fn->rr_ptr = NULL;
131233bd5ac5SDavid Ahern fib6_info_release(iter);
131333bd5ac5SDavid Ahern nsiblings--;
131433bd5ac5SDavid Ahern info->nl_net->ipv6.rt6_stats->fib_rt_entries--;
131533bd5ac5SDavid Ahern } else {
131633bd5ac5SDavid Ahern ins = &iter->fib6_next;
131733bd5ac5SDavid Ahern }
131833bd5ac5SDavid Ahern iter = rcu_dereference_protected(*ins,
131933bd5ac5SDavid Ahern lockdep_is_held(&rt->fib6_table->tb6_lock));
132033bd5ac5SDavid Ahern }
132133bd5ac5SDavid Ahern WARN_ON(nsiblings != 0);
132233bd5ac5SDavid Ahern }
13234a287ebaSMatti Vaittinen }
13244a287ebaSMatti Vaittinen
13251da177e4SLinus Torvalds return 0;
13261da177e4SLinus Torvalds }
13271da177e4SLinus Torvalds
fib6_start_gc(struct net * net,struct fib6_info * rt)13288d1c802bSDavid Ahern static void fib6_start_gc(struct net *net, struct fib6_info *rt)
13291da177e4SLinus Torvalds {
1330417f28bbSStephen Hemminger if (!timer_pending(&net->ipv6.ip6_fib_timer) &&
133193c2fb25SDavid Ahern (rt->fib6_flags & RTF_EXPIRES))
1332417f28bbSStephen Hemminger mod_timer(&net->ipv6.ip6_fib_timer,
1333847499ceSStephen Hemminger jiffies + net->ipv6.sysctl.ip6_rt_gc_interval);
13341da177e4SLinus Torvalds }
13351da177e4SLinus Torvalds
fib6_force_start_gc(struct net * net)133663152fc0SDaniel Lezcano void fib6_force_start_gc(struct net *net)
13371da177e4SLinus Torvalds {
1338417f28bbSStephen Hemminger if (!timer_pending(&net->ipv6.ip6_fib_timer))
1339417f28bbSStephen Hemminger mod_timer(&net->ipv6.ip6_fib_timer,
1340847499ceSStephen Hemminger jiffies + net->ipv6.sysctl.ip6_rt_gc_interval);
13411da177e4SLinus Torvalds }
13421da177e4SLinus Torvalds
__fib6_update_sernum_upto_root(struct fib6_info * rt,int sernum)13438d1c802bSDavid Ahern static void __fib6_update_sernum_upto_root(struct fib6_info *rt,
1344bbd63f06SWei Wang int sernum)
1345bbd63f06SWei Wang {
134693c2fb25SDavid Ahern struct fib6_node *fn = rcu_dereference_protected(rt->fib6_node,
134793c2fb25SDavid Ahern lockdep_is_held(&rt->fib6_table->tb6_lock));
1348bbd63f06SWei Wang
1349446e7f21Szhang kai /* paired with smp_rmb() in fib6_get_cookie_safe() */
1350bbd63f06SWei Wang smp_wmb();
1351bbd63f06SWei Wang while (fn) {
1352aafc2e32SEric Dumazet WRITE_ONCE(fn->fn_sernum, sernum);
135366f5d6ceSWei Wang fn = rcu_dereference_protected(fn->parent,
135493c2fb25SDavid Ahern lockdep_is_held(&rt->fib6_table->tb6_lock));
1355bbd63f06SWei Wang }
1356bbd63f06SWei Wang }
1357bbd63f06SWei Wang
/*
 * Obtain a new serial number for @net via fib6_new_sernum() and stamp it on
 * @rt's node and all of its ancestors.
 */
void fib6_update_sernum_upto_root(struct net *net, struct fib6_info *rt)
{
	int sernum = fib6_new_sernum(net);

	__fib6_update_sernum_upto_root(rt, sernum);
}
13624a8e56eeSIdo Schimmel
1363cdaa16a4SDavid Ahern /* allow ipv4 to update sernum via ipv6_stub */
fib6_update_sernum_stub(struct net * net,struct fib6_info * f6i)1364cdaa16a4SDavid Ahern void fib6_update_sernum_stub(struct net *net, struct fib6_info *f6i)
1365cdaa16a4SDavid Ahern {
1366cdaa16a4SDavid Ahern spin_lock_bh(&f6i->fib6_table->tb6_lock);
1367cdaa16a4SDavid Ahern fib6_update_sernum_upto_root(net, f6i);
1368cdaa16a4SDavid Ahern spin_unlock_bh(&f6i->fib6_table->tb6_lock);
1369cdaa16a4SDavid Ahern }
1370cdaa16a4SDavid Ahern
13711da177e4SLinus Torvalds /*
13721da177e4SLinus Torvalds * Add routing information to the routing tree.
13731da177e4SLinus Torvalds * <destination addr>/<source addr>
13741da177e4SLinus Torvalds * with source addr info in sub-trees
137566f5d6ceSWei Wang * Need to own table->tb6_lock
13761da177e4SLinus Torvalds */
13771da177e4SLinus Torvalds
fib6_add(struct fib6_node * root,struct fib6_info * rt,struct nl_info * info,struct netlink_ext_ack * extack)13788d1c802bSDavid Ahern int fib6_add(struct fib6_node *root, struct fib6_info *rt,
1379d4ead6b3SDavid Ahern struct nl_info *info, struct netlink_ext_ack *extack)
13801da177e4SLinus Torvalds {
138193c2fb25SDavid Ahern struct fib6_table *table = rt->fib6_table;
13828a18d2f0SArnd Bergmann struct fib6_node *fn;
13838a18d2f0SArnd Bergmann #ifdef CONFIG_IPV6_SUBTREES
13848a18d2f0SArnd Bergmann struct fib6_node *pn = NULL;
13858a18d2f0SArnd Bergmann #endif
13861da177e4SLinus Torvalds int err = -ENOMEM;
13874a287ebaSMatti Vaittinen int allow_create = 1;
13884a287ebaSMatti Vaittinen int replace_required = 0;
1389507c9b1eSDavid S. Miller
1390507c9b1eSDavid S. Miller if (info->nlh) {
13914a287ebaSMatti Vaittinen if (!(info->nlh->nlmsg_flags & NLM_F_CREATE))
13924a287ebaSMatti Vaittinen allow_create = 0;
1393507c9b1eSDavid S. Miller if (info->nlh->nlmsg_flags & NLM_F_REPLACE)
13944a287ebaSMatti Vaittinen replace_required = 1;
13954a287ebaSMatti Vaittinen }
13964a287ebaSMatti Vaittinen if (!allow_create && !replace_required)
1397f3213831SJoe Perches pr_warn("RTM_NEWROUTE with no NLM_F_CREATE or NLM_F_REPLACE\n");
13981da177e4SLinus Torvalds
139981eb8447SWei Wang fn = fib6_add_1(info->nl_net, table, root,
140093c2fb25SDavid Ahern &rt->fib6_dst.addr, rt->fib6_dst.plen,
140193c2fb25SDavid Ahern offsetof(struct fib6_info, fib6_dst), allow_create,
1402bbd63f06SWei Wang replace_required, extack);
14034a287ebaSMatti Vaittinen if (IS_ERR(fn)) {
14044a287ebaSMatti Vaittinen err = PTR_ERR(fn);
1405ae7b4e1fSDaniel Borkmann fn = NULL;
14061da177e4SLinus Torvalds goto out;
1407188c517aSLin Ming }
14081da177e4SLinus Torvalds
14098a18d2f0SArnd Bergmann #ifdef CONFIG_IPV6_SUBTREES
141066729e18SYOSHIFUJI Hideaki pn = fn;
141166729e18SYOSHIFUJI Hideaki
141293c2fb25SDavid Ahern if (rt->fib6_src.plen) {
14131da177e4SLinus Torvalds struct fib6_node *sn;
14141da177e4SLinus Torvalds
141566f5d6ceSWei Wang if (!rcu_access_pointer(fn->subtree)) {
14161da177e4SLinus Torvalds struct fib6_node *sfn;
14171da177e4SLinus Torvalds
14181da177e4SLinus Torvalds /*
14191da177e4SLinus Torvalds * Create subtree.
14201da177e4SLinus Torvalds *
14211da177e4SLinus Torvalds * fn[main tree]
14221da177e4SLinus Torvalds * |
14231da177e4SLinus Torvalds * sfn[subtree root]
14241da177e4SLinus Torvalds * \
14251da177e4SLinus Torvalds * sn[new leaf node]
14261da177e4SLinus Torvalds */
14271da177e4SLinus Torvalds
14281da177e4SLinus Torvalds /* Create subtree root node */
142981eb8447SWei Wang sfn = node_alloc(info->nl_net);
1430507c9b1eSDavid S. Miller if (!sfn)
1431348a4002SWei Wang goto failure;
14321da177e4SLinus Torvalds
14335ea71528SEric Dumazet fib6_info_hold(info->nl_net->ipv6.fib6_null_entry);
143466f5d6ceSWei Wang rcu_assign_pointer(sfn->leaf,
1435421842edSDavid Ahern info->nl_net->ipv6.fib6_null_entry);
14361da177e4SLinus Torvalds sfn->fn_flags = RTN_ROOT;
14371da177e4SLinus Torvalds
14381da177e4SLinus Torvalds /* Now add the first leaf node to new subtree */
14391da177e4SLinus Torvalds
144081eb8447SWei Wang sn = fib6_add_1(info->nl_net, table, sfn,
144193c2fb25SDavid Ahern &rt->fib6_src.addr, rt->fib6_src.plen,
144293c2fb25SDavid Ahern offsetof(struct fib6_info, fib6_src),
1443bbd63f06SWei Wang allow_create, replace_required, extack);
14441da177e4SLinus Torvalds
1445f950c0ecSWei Yongjun if (IS_ERR(sn)) {
14461da177e4SLinus Torvalds /* If it is failed, discard just allocated
1447348a4002SWei Wang root, and then (in failure) stale node
14481da177e4SLinus Torvalds in main tree.
14491da177e4SLinus Torvalds */
145081eb8447SWei Wang node_free_immediate(info->nl_net, sfn);
1451188c517aSLin Ming err = PTR_ERR(sn);
1452348a4002SWei Wang goto failure;
14531da177e4SLinus Torvalds }
14541da177e4SLinus Torvalds
14551da177e4SLinus Torvalds /* Now link new subtree to main tree */
145666f5d6ceSWei Wang rcu_assign_pointer(sfn->parent, fn);
145766f5d6ceSWei Wang rcu_assign_pointer(fn->subtree, sfn);
14581da177e4SLinus Torvalds } else {
145981eb8447SWei Wang sn = fib6_add_1(info->nl_net, table, FIB6_SUBTREE(fn),
146093c2fb25SDavid Ahern &rt->fib6_src.addr, rt->fib6_src.plen,
146193c2fb25SDavid Ahern offsetof(struct fib6_info, fib6_src),
1462bbd63f06SWei Wang allow_create, replace_required, extack);
14631da177e4SLinus Torvalds
14644a287ebaSMatti Vaittinen if (IS_ERR(sn)) {
14654a287ebaSMatti Vaittinen err = PTR_ERR(sn);
1466348a4002SWei Wang goto failure;
14671da177e4SLinus Torvalds }
1468188c517aSLin Ming }
14691da177e4SLinus Torvalds
147066f5d6ceSWei Wang if (!rcu_access_pointer(fn->leaf)) {
1471591ff9eaSWei Wang if (fn->fn_flags & RTN_TL_ROOT) {
1472591ff9eaSWei Wang /* put back null_entry for root node */
1473591ff9eaSWei Wang rcu_assign_pointer(fn->leaf,
1474421842edSDavid Ahern info->nl_net->ipv6.fib6_null_entry);
1475591ff9eaSWei Wang } else {
14765ea71528SEric Dumazet fib6_info_hold(rt);
147766f5d6ceSWei Wang rcu_assign_pointer(fn->leaf, rt);
147866729e18SYOSHIFUJI Hideaki }
1479591ff9eaSWei Wang }
14801da177e4SLinus Torvalds fn = sn;
14811da177e4SLinus Torvalds }
14821da177e4SLinus Torvalds #endif
14831da177e4SLinus Torvalds
1484d4ead6b3SDavid Ahern err = fib6_add_rt2node(fn, rt, info, extack);
1485bbd63f06SWei Wang if (!err) {
1486f88d8ea6SDavid Ahern if (rt->nh)
1487f88d8ea6SDavid Ahern list_add(&rt->nh_list, &rt->nh->f6i_list);
1488e87b5052Szhang kai __fib6_update_sernum_upto_root(rt, fib6_new_sernum(info->nl_net));
148963152fc0SDaniel Lezcano fib6_start_gc(info->nl_net, rt);
1490bbd63f06SWei Wang }
14911da177e4SLinus Torvalds
14921da177e4SLinus Torvalds out:
149366729e18SYOSHIFUJI Hideaki if (err) {
149466729e18SYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_SUBTREES
149566729e18SYOSHIFUJI Hideaki /*
149666729e18SYOSHIFUJI Hideaki * If fib6_add_1 has cleared the old leaf pointer in the
149766729e18SYOSHIFUJI Hideaki * super-tree leaf node we have to find a new one for it.
149866729e18SYOSHIFUJI Hideaki */
14997bbfe00eSWei Wang if (pn != fn) {
15008d1c802bSDavid Ahern struct fib6_info *pn_leaf =
15017bbfe00eSWei Wang rcu_dereference_protected(pn->leaf,
150266f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
15037bbfe00eSWei Wang if (pn_leaf == rt) {
150466f5d6ceSWei Wang pn_leaf = NULL;
150566f5d6ceSWei Wang RCU_INIT_POINTER(pn->leaf, NULL);
150693531c67SDavid Ahern fib6_info_release(rt);
15073c051235SDavid S. Miller }
15087bbfe00eSWei Wang if (!pn_leaf && !(pn->fn_flags & RTN_RTINFO)) {
15097bbfe00eSWei Wang pn_leaf = fib6_find_prefix(info->nl_net, table,
15107bbfe00eSWei Wang pn);
1511a0876811SEric Dumazet if (!pn_leaf)
15127bbfe00eSWei Wang pn_leaf =
1513421842edSDavid Ahern info->nl_net->ipv6.fib6_null_entry;
151493531c67SDavid Ahern fib6_info_hold(pn_leaf);
151566f5d6ceSWei Wang rcu_assign_pointer(pn->leaf, pn_leaf);
151666729e18SYOSHIFUJI Hideaki }
15177bbfe00eSWei Wang }
151866729e18SYOSHIFUJI Hideaki #endif
1519348a4002SWei Wang goto failure;
1520b9b33e7cSPaolo Abeni } else if (fib6_requires_src(rt)) {
1521b9b33e7cSPaolo Abeni fib6_routes_require_src_inc(info->nl_net);
152266729e18SYOSHIFUJI Hideaki }
15231da177e4SLinus Torvalds return err;
15241da177e4SLinus Torvalds
1525348a4002SWei Wang failure:
15264512c43eSWei Wang /* fn->leaf could be NULL and fib6_repair_tree() needs to be called if:
15274512c43eSWei Wang * 1. fn is an intermediate node and we failed to add the new
15284512c43eSWei Wang * route to it in both subtree creation failure and fib6_add_rt2node()
15294512c43eSWei Wang * failure case.
15304512c43eSWei Wang * 2. fn is the root node in the table and we fail to add the first
15314512c43eSWei Wang * default route to it.
15321da177e4SLinus Torvalds */
15334512c43eSWei Wang if (fn &&
15344512c43eSWei Wang (!(fn->fn_flags & (RTN_RTINFO|RTN_ROOT)) ||
15354512c43eSWei Wang (fn->fn_flags & RTN_TL_ROOT &&
15364512c43eSWei Wang !rcu_access_pointer(fn->leaf))))
153766f5d6ceSWei Wang fib6_repair_tree(info->nl_net, table, fn);
15381da177e4SLinus Torvalds return err;
15391da177e4SLinus Torvalds }
15401da177e4SLinus Torvalds
/*
 *	Routing tree lookup
 *
 */

/*
 * One search key for fib6_node_lookup_1().  Callers pass an array of these;
 * an entry whose offset is 0 terminates the array.
 */
struct lookup_args {
	/* byte offset of the struct rt6key to compare inside fib6_info */
	int			offset;
	/* address being searched for */
	const struct in6_addr	*addr;
};
15501da177e4SLinus Torvalds
fib6_node_lookup_1(struct fib6_node * root,struct lookup_args * args)15516454743bSDavid Ahern static struct fib6_node *fib6_node_lookup_1(struct fib6_node *root,
15521da177e4SLinus Torvalds struct lookup_args *args)
15531da177e4SLinus Torvalds {
15541da177e4SLinus Torvalds struct fib6_node *fn;
1555e69a4adcSAl Viro __be32 dir;
15561da177e4SLinus Torvalds
1557825e288eSYOSHIFUJI Hideaki if (unlikely(args->offset == 0))
1558825e288eSYOSHIFUJI Hideaki return NULL;
1559825e288eSYOSHIFUJI Hideaki
15601da177e4SLinus Torvalds /*
15611da177e4SLinus Torvalds * Descend on a tree
15621da177e4SLinus Torvalds */
15631da177e4SLinus Torvalds
15641da177e4SLinus Torvalds fn = root;
15651da177e4SLinus Torvalds
15661da177e4SLinus Torvalds for (;;) {
15671da177e4SLinus Torvalds struct fib6_node *next;
15681da177e4SLinus Torvalds
15691da177e4SLinus Torvalds dir = addr_bit_set(args->addr, fn->fn_bit);
15701da177e4SLinus Torvalds
157166f5d6ceSWei Wang next = dir ? rcu_dereference(fn->right) :
157266f5d6ceSWei Wang rcu_dereference(fn->left);
15731da177e4SLinus Torvalds
15741da177e4SLinus Torvalds if (next) {
15751da177e4SLinus Torvalds fn = next;
15761da177e4SLinus Torvalds continue;
15771da177e4SLinus Torvalds }
15781da177e4SLinus Torvalds break;
15791da177e4SLinus Torvalds }
15801da177e4SLinus Torvalds
15813fc5e044SYOSHIFUJI Hideaki while (fn) {
158266f5d6ceSWei Wang struct fib6_node *subtree = FIB6_SUBTREE(fn);
158366f5d6ceSWei Wang
158466f5d6ceSWei Wang if (subtree || fn->fn_flags & RTN_RTINFO) {
15858d1c802bSDavid Ahern struct fib6_info *leaf = rcu_dereference(fn->leaf);
15861da177e4SLinus Torvalds struct rt6key *key;
15871da177e4SLinus Torvalds
15888d1040e8SWei Wang if (!leaf)
15898d1040e8SWei Wang goto backtrack;
15908d1040e8SWei Wang
15918d1040e8SWei Wang key = (struct rt6key *) ((u8 *)leaf + args->offset);
15921da177e4SLinus Torvalds
15933fc5e044SYOSHIFUJI Hideaki if (ipv6_prefix_equal(&key->addr, args->addr, key->plen)) {
15943fc5e044SYOSHIFUJI Hideaki #ifdef CONFIG_IPV6_SUBTREES
159566f5d6ceSWei Wang if (subtree) {
15963e3be275SHannes Frederic Sowa struct fib6_node *sfn;
15976454743bSDavid Ahern sfn = fib6_node_lookup_1(subtree,
15986454743bSDavid Ahern args + 1);
15993e3be275SHannes Frederic Sowa if (!sfn)
16003e3be275SHannes Frederic Sowa goto backtrack;
16013e3be275SHannes Frederic Sowa fn = sfn;
16023e3be275SHannes Frederic Sowa }
16033fc5e044SYOSHIFUJI Hideaki #endif
16043e3be275SHannes Frederic Sowa if (fn->fn_flags & RTN_RTINFO)
16051da177e4SLinus Torvalds return fn;
16061da177e4SLinus Torvalds }
16073fc5e044SYOSHIFUJI Hideaki }
16083e3be275SHannes Frederic Sowa backtrack:
16093fc5e044SYOSHIFUJI Hideaki if (fn->fn_flags & RTN_ROOT)
16103fc5e044SYOSHIFUJI Hideaki break;
16111da177e4SLinus Torvalds
161266f5d6ceSWei Wang fn = rcu_dereference(fn->parent);
16131da177e4SLinus Torvalds }
16141da177e4SLinus Torvalds
16151da177e4SLinus Torvalds return NULL;
16161da177e4SLinus Torvalds }
16171da177e4SLinus Torvalds
161866f5d6ceSWei Wang /* called with rcu_read_lock() held
161966f5d6ceSWei Wang */
fib6_node_lookup(struct fib6_node * root,const struct in6_addr * daddr,const struct in6_addr * saddr)16206454743bSDavid Ahern struct fib6_node *fib6_node_lookup(struct fib6_node *root,
16216454743bSDavid Ahern const struct in6_addr *daddr,
1622b71d1d42SEric Dumazet const struct in6_addr *saddr)
16231da177e4SLinus Torvalds {
16241da177e4SLinus Torvalds struct fib6_node *fn;
1625825e288eSYOSHIFUJI Hideaki struct lookup_args args[] = {
1626825e288eSYOSHIFUJI Hideaki {
162793c2fb25SDavid Ahern .offset = offsetof(struct fib6_info, fib6_dst),
1628825e288eSYOSHIFUJI Hideaki .addr = daddr,
1629825e288eSYOSHIFUJI Hideaki },
16301da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES
1631825e288eSYOSHIFUJI Hideaki {
163293c2fb25SDavid Ahern .offset = offsetof(struct fib6_info, fib6_src),
1633825e288eSYOSHIFUJI Hideaki .addr = saddr,
1634825e288eSYOSHIFUJI Hideaki },
16351da177e4SLinus Torvalds #endif
1636825e288eSYOSHIFUJI Hideaki {
1637825e288eSYOSHIFUJI Hideaki .offset = 0, /* sentinel */
1638825e288eSYOSHIFUJI Hideaki }
1639825e288eSYOSHIFUJI Hideaki };
16401da177e4SLinus Torvalds
16416454743bSDavid Ahern fn = fib6_node_lookup_1(root, daddr ? args : args + 1);
1642507c9b1eSDavid S. Miller if (!fn || fn->fn_flags & RTN_TL_ROOT)
16431da177e4SLinus Torvalds fn = root;
16441da177e4SLinus Torvalds
16451da177e4SLinus Torvalds return fn;
16461da177e4SLinus Torvalds }
16471da177e4SLinus Torvalds
16481da177e4SLinus Torvalds /*
16491da177e4SLinus Torvalds * Get node with specified destination prefix (and source prefix,
16501da177e4SLinus Torvalds * if subtrees are used)
165138fbeeeeSWei Wang * exact_match == true means we try to find fn with exact match of
165238fbeeeeSWei Wang * the passed in prefix addr
165338fbeeeeSWei Wang * exact_match == false means we try to find fn with longest prefix
165438fbeeeeSWei Wang * match of the passed in prefix addr. This is useful for finding fn
165538fbeeeeSWei Wang * for cached route as it will be stored in the exception table under
165638fbeeeeSWei Wang * the node with longest prefix length.
16571da177e4SLinus Torvalds */
16581da177e4SLinus Torvalds
16591da177e4SLinus Torvalds
fib6_locate_1(struct fib6_node * root,const struct in6_addr * addr,int plen,int offset,bool exact_match)16601da177e4SLinus Torvalds static struct fib6_node *fib6_locate_1(struct fib6_node *root,
1661b71d1d42SEric Dumazet const struct in6_addr *addr,
166238fbeeeeSWei Wang int plen, int offset,
166338fbeeeeSWei Wang bool exact_match)
16641da177e4SLinus Torvalds {
166538fbeeeeSWei Wang struct fib6_node *fn, *prev = NULL;
16661da177e4SLinus Torvalds
16671da177e4SLinus Torvalds for (fn = root; fn ; ) {
16688d1c802bSDavid Ahern struct fib6_info *leaf = rcu_dereference(fn->leaf);
16698d1040e8SWei Wang struct rt6key *key;
16708d1040e8SWei Wang
16718d1040e8SWei Wang /* This node is being deleted */
16728d1040e8SWei Wang if (!leaf) {
16738d1040e8SWei Wang if (plen <= fn->fn_bit)
16748d1040e8SWei Wang goto out;
16758d1040e8SWei Wang else
16768d1040e8SWei Wang goto next;
16778d1040e8SWei Wang }
16788d1040e8SWei Wang
16798d1040e8SWei Wang key = (struct rt6key *)((u8 *)leaf + offset);
16801da177e4SLinus Torvalds
16811da177e4SLinus Torvalds /*
16821da177e4SLinus Torvalds * Prefix match
16831da177e4SLinus Torvalds */
16841da177e4SLinus Torvalds if (plen < fn->fn_bit ||
16851da177e4SLinus Torvalds !ipv6_prefix_equal(&key->addr, addr, fn->fn_bit))
168638fbeeeeSWei Wang goto out;
16871da177e4SLinus Torvalds
16881da177e4SLinus Torvalds if (plen == fn->fn_bit)
16891da177e4SLinus Torvalds return fn;
16901da177e4SLinus Torvalds
169140cb35d5SStefano Brivio if (fn->fn_flags & RTN_RTINFO)
169238fbeeeeSWei Wang prev = fn;
169338fbeeeeSWei Wang
16948d1040e8SWei Wang next:
16951da177e4SLinus Torvalds /*
16961da177e4SLinus Torvalds * We have more bits to go
16971da177e4SLinus Torvalds */
16981da177e4SLinus Torvalds if (addr_bit_set(addr, fn->fn_bit))
169966f5d6ceSWei Wang fn = rcu_dereference(fn->right);
17001da177e4SLinus Torvalds else
170166f5d6ceSWei Wang fn = rcu_dereference(fn->left);
17021da177e4SLinus Torvalds }
170338fbeeeeSWei Wang out:
170438fbeeeeSWei Wang if (exact_match)
17051da177e4SLinus Torvalds return NULL;
170638fbeeeeSWei Wang else
170738fbeeeeSWei Wang return prev;
17081da177e4SLinus Torvalds }
17091da177e4SLinus Torvalds
/*
 * Locate the node for @daddr/@dst_len and, with CONFIG_IPV6_SUBTREES and a
 * non-zero @src_len, continue into that node's subtree (if it has one) for
 * @saddr/@src_len.  @exact_match is forwarded to fib6_locate_1().
 *
 * Returns the node only if it has RTN_RTINFO set, NULL otherwise.
 */
struct fib6_node *fib6_locate(struct fib6_node *root,
			      const struct in6_addr *daddr, int dst_len,
			      const struct in6_addr *saddr, int src_len,
			      bool exact_match)
{
	struct fib6_node *fn;

	fn = fib6_locate_1(root, daddr, dst_len,
			   offsetof(struct fib6_info, fib6_dst),
			   exact_match);

#ifdef CONFIG_IPV6_SUBTREES
	if (src_len) {
		struct fib6_node *subtree;

		WARN_ON(saddr == NULL);

		subtree = fn ? FIB6_SUBTREE(fn) : NULL;
		if (subtree)
			fn = fib6_locate_1(subtree, saddr, src_len,
					   offsetof(struct fib6_info, fib6_src),
					   exact_match);
	}
#endif

	if (!fn || !(fn->fn_flags & RTN_RTINFO))
		return NULL;

	return fn;
}
17411da177e4SLinus Torvalds
17421da177e4SLinus Torvalds
17431da177e4SLinus Torvalds /*
17441da177e4SLinus Torvalds * Deletion
17451da177e4SLinus Torvalds *
17461da177e4SLinus Torvalds */
17471da177e4SLinus Torvalds
fib6_find_prefix(struct net * net,struct fib6_table * table,struct fib6_node * fn)17488d1c802bSDavid Ahern static struct fib6_info *fib6_find_prefix(struct net *net,
174966f5d6ceSWei Wang struct fib6_table *table,
175066f5d6ceSWei Wang struct fib6_node *fn)
17511da177e4SLinus Torvalds {
175266f5d6ceSWei Wang struct fib6_node *child_left, *child_right;
175366f5d6ceSWei Wang
17541da177e4SLinus Torvalds if (fn->fn_flags & RTN_ROOT)
1755421842edSDavid Ahern return net->ipv6.fib6_null_entry;
17561da177e4SLinus Torvalds
17571da177e4SLinus Torvalds while (fn) {
175866f5d6ceSWei Wang child_left = rcu_dereference_protected(fn->left,
175966f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
176066f5d6ceSWei Wang child_right = rcu_dereference_protected(fn->right,
176166f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
176266f5d6ceSWei Wang if (child_left)
176366f5d6ceSWei Wang return rcu_dereference_protected(child_left->leaf,
176466f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
176566f5d6ceSWei Wang if (child_right)
176666f5d6ceSWei Wang return rcu_dereference_protected(child_right->leaf,
176766f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
17681da177e4SLinus Torvalds
17697fc33165SYOSHIFUJI Hideaki fn = FIB6_SUBTREE(fn);
17701da177e4SLinus Torvalds }
17711da177e4SLinus Torvalds return NULL;
17721da177e4SLinus Torvalds }
17731da177e4SLinus Torvalds
17741da177e4SLinus Torvalds /*
17751da177e4SLinus Torvalds * Called to trim the tree of intermediate nodes when possible. "fn"
17761da177e4SLinus Torvalds * is the node we want to try and remove.
177766f5d6ceSWei Wang * Need to own table->tb6_lock
17781da177e4SLinus Torvalds */
17791da177e4SLinus Torvalds
fib6_repair_tree(struct net * net,struct fib6_table * table,struct fib6_node * fn)17808ed67789SDaniel Lezcano static struct fib6_node *fib6_repair_tree(struct net *net,
178166f5d6ceSWei Wang struct fib6_table *table,
17828ed67789SDaniel Lezcano struct fib6_node *fn)
17831da177e4SLinus Torvalds {
17841da177e4SLinus Torvalds int children;
17851da177e4SLinus Torvalds int nstate;
178666f5d6ceSWei Wang struct fib6_node *child;
178794b2cfe0SHannes Frederic Sowa struct fib6_walker *w;
17881da177e4SLinus Torvalds int iter = 0;
17891da177e4SLinus Torvalds
17904512c43eSWei Wang /* Set fn->leaf to null_entry for root node. */
17914512c43eSWei Wang if (fn->fn_flags & RTN_TL_ROOT) {
1792421842edSDavid Ahern rcu_assign_pointer(fn->leaf, net->ipv6.fib6_null_entry);
17934512c43eSWei Wang return fn;
17944512c43eSWei Wang }
17954512c43eSWei Wang
17961da177e4SLinus Torvalds for (;;) {
179766f5d6ceSWei Wang struct fib6_node *fn_r = rcu_dereference_protected(fn->right,
179866f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
179966f5d6ceSWei Wang struct fib6_node *fn_l = rcu_dereference_protected(fn->left,
180066f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
180166f5d6ceSWei Wang struct fib6_node *pn = rcu_dereference_protected(fn->parent,
180266f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
180366f5d6ceSWei Wang struct fib6_node *pn_r = rcu_dereference_protected(pn->right,
180466f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
180566f5d6ceSWei Wang struct fib6_node *pn_l = rcu_dereference_protected(pn->left,
180666f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
18078d1c802bSDavid Ahern struct fib6_info *fn_leaf = rcu_dereference_protected(fn->leaf,
180866f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
18098d1c802bSDavid Ahern struct fib6_info *pn_leaf = rcu_dereference_protected(pn->leaf,
181066f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
18118d1c802bSDavid Ahern struct fib6_info *new_fn_leaf;
181266f5d6ceSWei Wang
18131da177e4SLinus Torvalds RT6_TRACE("fixing tree: plen=%d iter=%d\n", fn->fn_bit, iter);
18141da177e4SLinus Torvalds iter++;
18151da177e4SLinus Torvalds
1816547b792cSIlpo Järvinen WARN_ON(fn->fn_flags & RTN_RTINFO);
1817547b792cSIlpo Järvinen WARN_ON(fn->fn_flags & RTN_TL_ROOT);
181866f5d6ceSWei Wang WARN_ON(fn_leaf);
18191da177e4SLinus Torvalds
18201da177e4SLinus Torvalds children = 0;
18211da177e4SLinus Torvalds child = NULL;
1822dee84779SJoe Perches if (fn_r) {
1823dee84779SJoe Perches child = fn_r;
1824dee84779SJoe Perches children |= 1;
1825dee84779SJoe Perches }
1826dee84779SJoe Perches if (fn_l) {
1827dee84779SJoe Perches child = fn_l;
1828dee84779SJoe Perches children |= 2;
1829dee84779SJoe Perches }
18301da177e4SLinus Torvalds
18317fc33165SYOSHIFUJI Hideaki if (children == 3 || FIB6_SUBTREE(fn)
18321da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES
18331da177e4SLinus Torvalds /* Subtree root (i.e. fn) may have one child */
18341da177e4SLinus Torvalds || (children && fn->fn_flags & RTN_ROOT)
18351da177e4SLinus Torvalds #endif
18361da177e4SLinus Torvalds ) {
183766f5d6ceSWei Wang new_fn_leaf = fib6_find_prefix(net, table, fn);
18381da177e4SLinus Torvalds #if RT6_DEBUG >= 2
183966f5d6ceSWei Wang if (!new_fn_leaf) {
184066f5d6ceSWei Wang WARN_ON(!new_fn_leaf);
1841421842edSDavid Ahern new_fn_leaf = net->ipv6.fib6_null_entry;
18421da177e4SLinus Torvalds }
18431da177e4SLinus Torvalds #endif
184493531c67SDavid Ahern fib6_info_hold(new_fn_leaf);
184566f5d6ceSWei Wang rcu_assign_pointer(fn->leaf, new_fn_leaf);
184666f5d6ceSWei Wang return pn;
18471da177e4SLinus Torvalds }
18481da177e4SLinus Torvalds
18491da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES
18507fc33165SYOSHIFUJI Hideaki if (FIB6_SUBTREE(pn) == fn) {
1851547b792cSIlpo Järvinen WARN_ON(!(fn->fn_flags & RTN_ROOT));
185266f5d6ceSWei Wang RCU_INIT_POINTER(pn->subtree, NULL);
18531da177e4SLinus Torvalds nstate = FWS_L;
18541da177e4SLinus Torvalds } else {
1855547b792cSIlpo Järvinen WARN_ON(fn->fn_flags & RTN_ROOT);
18561da177e4SLinus Torvalds #endif
185766f5d6ceSWei Wang if (pn_r == fn)
185866f5d6ceSWei Wang rcu_assign_pointer(pn->right, child);
185966f5d6ceSWei Wang else if (pn_l == fn)
186066f5d6ceSWei Wang rcu_assign_pointer(pn->left, child);
18611da177e4SLinus Torvalds #if RT6_DEBUG >= 2
1862547b792cSIlpo Järvinen else
1863547b792cSIlpo Järvinen WARN_ON(1);
18641da177e4SLinus Torvalds #endif
18651da177e4SLinus Torvalds if (child)
186666f5d6ceSWei Wang rcu_assign_pointer(child->parent, pn);
18671da177e4SLinus Torvalds nstate = FWS_R;
18681da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES
18691da177e4SLinus Torvalds }
18701da177e4SLinus Torvalds #endif
18711da177e4SLinus Torvalds
18729a03cd8fSMichal Kubeček read_lock(&net->ipv6.fib6_walker_lock);
18739a03cd8fSMichal Kubeček FOR_WALKERS(net, w) {
1874507c9b1eSDavid S. Miller if (!child) {
18752b760fcfSWei Wang if (w->node == fn) {
18761da177e4SLinus Torvalds RT6_TRACE("W %p adjusted by delnode 1, s=%d/%d\n", w, w->state, nstate);
18771da177e4SLinus Torvalds w->node = pn;
18781da177e4SLinus Torvalds w->state = nstate;
18791da177e4SLinus Torvalds }
18801da177e4SLinus Torvalds } else {
18811da177e4SLinus Torvalds if (w->node == fn) {
18821da177e4SLinus Torvalds w->node = child;
18831da177e4SLinus Torvalds if (children&2) {
18841da177e4SLinus Torvalds RT6_TRACE("W %p adjusted by delnode 2, s=%d\n", w, w->state);
18851da177e4SLinus Torvalds w->state = w->state >= FWS_R ? FWS_U : FWS_INIT;
18861da177e4SLinus Torvalds } else {
18871da177e4SLinus Torvalds RT6_TRACE("W %p adjusted by delnode 2, s=%d\n", w, w->state);
18881da177e4SLinus Torvalds w->state = w->state >= FWS_C ? FWS_U : FWS_INIT;
18891da177e4SLinus Torvalds }
18901da177e4SLinus Torvalds }
18911da177e4SLinus Torvalds }
18921da177e4SLinus Torvalds }
18939a03cd8fSMichal Kubeček read_unlock(&net->ipv6.fib6_walker_lock);
18941da177e4SLinus Torvalds
189581eb8447SWei Wang node_free(net, fn);
18967fc33165SYOSHIFUJI Hideaki if (pn->fn_flags & RTN_RTINFO || FIB6_SUBTREE(pn))
18971da177e4SLinus Torvalds return pn;
18981da177e4SLinus Torvalds
189966f5d6ceSWei Wang RCU_INIT_POINTER(pn->leaf, NULL);
190093531c67SDavid Ahern fib6_info_release(pn_leaf);
19011da177e4SLinus Torvalds fn = pn;
19021da177e4SLinus Torvalds }
19031da177e4SLinus Torvalds }
19041da177e4SLinus Torvalds
/*
 * Unlink the route that *rtp points at from node @fn and release it.
 *
 * @table: table owning @fn; its tb6_lock is asserted via lockdep.
 * @fn:    node whose leaf chain contains the route.
 * @rtp:   address of the chain slot that currently holds the route.
 * @info:  netlink context (namespace and notification-suppression flags).
 *
 * Besides unlinking, this updates the per-namespace route statistics,
 * detaches the route from its multipath siblings, moves any registered
 * walker that was parked on the route, calls fib6_repair_tree() when the
 * node lost its last route, and emits the kernel and userspace
 * notifications unless @info asks to skip them.
 */
static void fib6_del_route(struct fib6_table *table, struct fib6_node *fn,
			   struct fib6_info __rcu **rtp, struct nl_info *info)
{
	struct fib6_info *rt = rcu_dereference_protected(*rtp,
				    lockdep_is_held(&table->tb6_lock));
	struct fib6_info *head_rt, *successor = NULL;
	struct net *net = info->nl_net;
	struct fib6_walker *walker;
	bool send_del = false;

	RT6_TRACE("fib6_del_route\n");

	/* When the first route of the node goes away and it is not part of
	 * a multipath route, listeners must learn about the route that takes
	 * its place, or about a plain delete when nothing follows it.
	 */
	head_rt = rcu_dereference_protected(fn->leaf,
				    lockdep_is_held(&table->tb6_lock));
	if (head_rt == rt && !rt->fib6_nsiblings) {
		successor = rcu_dereference_protected(rt->fib6_next,
				    lockdep_is_held(&table->tb6_lock));
		send_del = !successor;
	}

	/* Take the route out of the leaf chain */
	*rtp = rt->fib6_next;
	rt->fib6_node = NULL;
	net->ipv6.rt6_stats->fib_rt_entries--;
	net->ipv6.rt6_stats->fib_discarded_routes++;

	/* Drop the round-robin cursor if it referenced this route */
	if (rcu_access_pointer(fn->rr_ptr) == rt)
		fn->rr_ptr = NULL;

	/* Detach from the sibling list of a multipath route */
	if (rt->fib6_nsiblings) {
		struct fib6_info *sib, *sib_next;

		/* A nexthop of a multipath route is being removed. Only when
		 * that multipath route is the first route in the node does a
		 * delete notification have to be sent.
		 */
		if (rt->fib6_metric == head_rt->fib6_metric &&
		    rt6_qualify_for_ecmp(head_rt))
			send_del = true;

		list_for_each_entry_safe(sib, sib_next,
					 &rt->fib6_siblings, fib6_siblings)
			sib->fib6_nsiblings--;
		rt->fib6_nsiblings = 0;
		list_del_rcu(&rt->fib6_siblings);
		/* sib_next holds whatever the iterator left in it */
		rt6_multipath_rebalance(sib_next);
	}

	/* Move walkers that are currently positioned on this route */
	read_lock(&net->ipv6.fib6_walker_lock);
	FOR_WALKERS(net, walker) {
		if (walker->state != FWS_C || walker->leaf != rt)
			continue;

		RT6_TRACE("walker %p adjusted by delroute\n", walker);
		walker->leaf = rcu_dereference_protected(rt->fib6_next,
				    lockdep_is_held(&table->tb6_lock));
		if (!walker->leaf)
			walker->state = FWS_U;
	}
	read_unlock(&net->ipv6.fib6_walker_lock);

	/* If it was last route, call fib6_repair_tree() to:
	 * 1. For root node, put back null_entry as how the table was created.
	 * 2. For other nodes, expunge its radix tree node.
	 */
	if (!rcu_access_pointer(fn->leaf)) {
		if (!(fn->fn_flags & RTN_TL_ROOT)) {
			fn->fn_flags &= ~RTN_RTINFO;
			net->ipv6.rt6_stats->fib_route_nodes--;
		}
		fn = fib6_repair_tree(net, table, fn);
	}

	fib6_purge_rt(rt, fn, net);

	/* In-kernel listeners: a delete takes precedence over a replace */
	if (!info->skip_notify_kernel) {
		if (send_del)
			call_fib6_entry_notifiers(net, FIB_EVENT_ENTRY_DEL,
						  rt, NULL);
		else if (successor)
			call_fib6_entry_notifiers_replace(net, successor);
	}

	/* Userspace (rtnetlink) listeners */
	if (!info->skip_notify)
		inet6_rt_notify(RTM_DELROUTE, rt, info, 0);

	fib6_info_release(rt);
}
20001da177e4SLinus Torvalds
200166f5d6ceSWei Wang /* Need to own table->tb6_lock */
fib6_del(struct fib6_info * rt,struct nl_info * info)20028d1c802bSDavid Ahern int fib6_del(struct fib6_info *rt, struct nl_info *info)
20031da177e4SLinus Torvalds {
20048ed67789SDaniel Lezcano struct net *net = info->nl_net;
20058d1c802bSDavid Ahern struct fib6_info __rcu **rtp;
20068d1c802bSDavid Ahern struct fib6_info __rcu **rtp_next;
2007843d926bSEric Dumazet struct fib6_table *table;
2008843d926bSEric Dumazet struct fib6_node *fn;
20091da177e4SLinus Torvalds
2010843d926bSEric Dumazet if (rt == net->ipv6.fib6_null_entry)
2011843d926bSEric Dumazet return -ENOENT;
2012843d926bSEric Dumazet
2013843d926bSEric Dumazet table = rt->fib6_table;
2014843d926bSEric Dumazet fn = rcu_dereference_protected(rt->fib6_node,
2015843d926bSEric Dumazet lockdep_is_held(&table->tb6_lock));
2016843d926bSEric Dumazet if (!fn)
20171da177e4SLinus Torvalds return -ENOENT;
20181da177e4SLinus Torvalds
2019547b792cSIlpo Järvinen WARN_ON(!(fn->fn_flags & RTN_RTINFO));
20201da177e4SLinus Torvalds
20211da177e4SLinus Torvalds /*
20221da177e4SLinus Torvalds * Walk the leaf entries looking for ourself
20231da177e4SLinus Torvalds */
20241da177e4SLinus Torvalds
202566f5d6ceSWei Wang for (rtp = &fn->leaf; *rtp; rtp = rtp_next) {
20268d1c802bSDavid Ahern struct fib6_info *cur = rcu_dereference_protected(*rtp,
202766f5d6ceSWei Wang lockdep_is_held(&table->tb6_lock));
202866f5d6ceSWei Wang if (rt == cur) {
2029b9b33e7cSPaolo Abeni if (fib6_requires_src(cur))
2030b9b33e7cSPaolo Abeni fib6_routes_require_src_dec(info->nl_net);
203166f5d6ceSWei Wang fib6_del_route(table, fn, rtp, info);
20321da177e4SLinus Torvalds return 0;
20331da177e4SLinus Torvalds }
20348fb11a9aSDavid Ahern rtp_next = &cur->fib6_next;
20351da177e4SLinus Torvalds }
20361da177e4SLinus Torvalds return -ENOENT;
20371da177e4SLinus Torvalds }
20381da177e4SLinus Torvalds
20391da177e4SLinus Torvalds /*
20401da177e4SLinus Torvalds * Tree traversal function.
20411da177e4SLinus Torvalds *
20421da177e4SLinus Torvalds * Certainly, it is not interrupt safe.
20431da177e4SLinus Torvalds * However, it is internally reenterable wrt itself and fib6_add/fib6_del.
20441da177e4SLinus Torvalds * It means, that we can modify tree during walking
20451da177e4SLinus Torvalds * and use this function for garbage collection, clone pruning,
20461da177e4SLinus Torvalds * cleaning tree when a device goes down etc. etc.
20471da177e4SLinus Torvalds *
20481da177e4SLinus Torvalds * It guarantees that every node will be traversed,
20491da177e4SLinus Torvalds * and that it will be traversed only once.
20501da177e4SLinus Torvalds *
20511da177e4SLinus Torvalds * Callback function w->func may return:
20521da177e4SLinus Torvalds * 0 -> continue walking.
20531da177e4SLinus Torvalds * positive value -> walking is suspended (used by tree dumps,
20541da177e4SLinus Torvalds * and probably by gc, if it will be split to several slices)
20551da177e4SLinus Torvalds * negative value -> terminate walking.
20561da177e4SLinus Torvalds *
20571da177e4SLinus Torvalds * The function itself returns:
20581da177e4SLinus Torvalds * 0 -> walk is complete.
20591da177e4SLinus Torvalds * >0 -> walk is incomplete (i.e. suspended)
20601da177e4SLinus Torvalds * <0 -> walk is terminated by an error.
206166f5d6ceSWei Wang *
206266f5d6ceSWei Wang * This function is called with tb6_lock held.
20631da177e4SLinus Torvalds */
20641da177e4SLinus Torvalds
fib6_walk_continue(struct fib6_walker * w)206594b2cfe0SHannes Frederic Sowa static int fib6_walk_continue(struct fib6_walker *w)
20661da177e4SLinus Torvalds {
206766f5d6ceSWei Wang struct fib6_node *fn, *pn, *left, *right;
20681da177e4SLinus Torvalds
20692b760fcfSWei Wang /* w->root should always be table->tb6_root */
20702b760fcfSWei Wang WARN_ON_ONCE(!(w->root->fn_flags & RTN_TL_ROOT));
20712b760fcfSWei Wang
20721da177e4SLinus Torvalds for (;;) {
20731da177e4SLinus Torvalds fn = w->node;
2074507c9b1eSDavid S. Miller if (!fn)
20751da177e4SLinus Torvalds return 0;
20761da177e4SLinus Torvalds
20771da177e4SLinus Torvalds switch (w->state) {
20781da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES
20791da177e4SLinus Torvalds case FWS_S:
20807fc33165SYOSHIFUJI Hideaki if (FIB6_SUBTREE(fn)) {
20817fc33165SYOSHIFUJI Hideaki w->node = FIB6_SUBTREE(fn);
20821da177e4SLinus Torvalds continue;
20831da177e4SLinus Torvalds }
20841da177e4SLinus Torvalds w->state = FWS_L;
2085a8eceea8SJoe Perches fallthrough;
20861da177e4SLinus Torvalds #endif
20871da177e4SLinus Torvalds case FWS_L:
208866f5d6ceSWei Wang left = rcu_dereference_protected(fn->left, 1);
208966f5d6ceSWei Wang if (left) {
209066f5d6ceSWei Wang w->node = left;
20911da177e4SLinus Torvalds w->state = FWS_INIT;
20921da177e4SLinus Torvalds continue;
20931da177e4SLinus Torvalds }
20941da177e4SLinus Torvalds w->state = FWS_R;
2095a8eceea8SJoe Perches fallthrough;
20961da177e4SLinus Torvalds case FWS_R:
209766f5d6ceSWei Wang right = rcu_dereference_protected(fn->right, 1);
209866f5d6ceSWei Wang if (right) {
209966f5d6ceSWei Wang w->node = right;
21001da177e4SLinus Torvalds w->state = FWS_INIT;
21011da177e4SLinus Torvalds continue;
21021da177e4SLinus Torvalds }
21031da177e4SLinus Torvalds w->state = FWS_C;
210466f5d6ceSWei Wang w->leaf = rcu_dereference_protected(fn->leaf, 1);
2105a8eceea8SJoe Perches fallthrough;
21061da177e4SLinus Torvalds case FWS_C:
21071da177e4SLinus Torvalds if (w->leaf && fn->fn_flags & RTN_RTINFO) {
21082bec5a36SPatrick McHardy int err;
21092bec5a36SPatrick McHardy
2110fa809e2fSEric Dumazet if (w->skip) {
2111fa809e2fSEric Dumazet w->skip--;
21121c265854SKumar Sundararajan goto skip;
21132bec5a36SPatrick McHardy }
21142bec5a36SPatrick McHardy
21152bec5a36SPatrick McHardy err = w->func(w);
21161da177e4SLinus Torvalds if (err)
21171da177e4SLinus Torvalds return err;
21182bec5a36SPatrick McHardy
21192bec5a36SPatrick McHardy w->count++;
21201da177e4SLinus Torvalds continue;
21211da177e4SLinus Torvalds }
21221c265854SKumar Sundararajan skip:
21231da177e4SLinus Torvalds w->state = FWS_U;
2124a8eceea8SJoe Perches fallthrough;
21251da177e4SLinus Torvalds case FWS_U:
21261da177e4SLinus Torvalds if (fn == w->root)
21271da177e4SLinus Torvalds return 0;
212866f5d6ceSWei Wang pn = rcu_dereference_protected(fn->parent, 1);
212966f5d6ceSWei Wang left = rcu_dereference_protected(pn->left, 1);
213066f5d6ceSWei Wang right = rcu_dereference_protected(pn->right, 1);
21311da177e4SLinus Torvalds w->node = pn;
21321da177e4SLinus Torvalds #ifdef CONFIG_IPV6_SUBTREES
21337fc33165SYOSHIFUJI Hideaki if (FIB6_SUBTREE(pn) == fn) {
2134547b792cSIlpo Järvinen WARN_ON(!(fn->fn_flags & RTN_ROOT));
21351da177e4SLinus Torvalds w->state = FWS_L;
21361da177e4SLinus Torvalds continue;
21371da177e4SLinus Torvalds }
21381da177e4SLinus Torvalds #endif
213966f5d6ceSWei Wang if (left == fn) {
21401da177e4SLinus Torvalds w->state = FWS_R;
21411da177e4SLinus Torvalds continue;
21421da177e4SLinus Torvalds }
214366f5d6ceSWei Wang if (right == fn) {
21441da177e4SLinus Torvalds w->state = FWS_C;
214566f5d6ceSWei Wang w->leaf = rcu_dereference_protected(w->node->leaf, 1);
21461da177e4SLinus Torvalds continue;
21471da177e4SLinus Torvalds }
21481da177e4SLinus Torvalds #if RT6_DEBUG >= 2
2149547b792cSIlpo Järvinen WARN_ON(1);
21501da177e4SLinus Torvalds #endif
21511da177e4SLinus Torvalds }
21521da177e4SLinus Torvalds }
21531da177e4SLinus Torvalds }
21541da177e4SLinus Torvalds
fib6_walk(struct net * net,struct fib6_walker * w)21559a03cd8fSMichal Kubeček static int fib6_walk(struct net *net, struct fib6_walker *w)
21561da177e4SLinus Torvalds {
21571da177e4SLinus Torvalds int res;
21581da177e4SLinus Torvalds
21591da177e4SLinus Torvalds w->state = FWS_INIT;
21601da177e4SLinus Torvalds w->node = w->root;
21611da177e4SLinus Torvalds
21629a03cd8fSMichal Kubeček fib6_walker_link(net, w);
21631da177e4SLinus Torvalds res = fib6_walk_continue(w);
21641da177e4SLinus Torvalds if (res <= 0)
21659a03cd8fSMichal Kubeček fib6_walker_unlink(net, w);
21661da177e4SLinus Torvalds return res;
21671da177e4SLinus Torvalds }
21681da177e4SLinus Torvalds
fib6_clean_node(struct fib6_walker * w)216994b2cfe0SHannes Frederic Sowa static int fib6_clean_node(struct fib6_walker *w)
21701da177e4SLinus Torvalds {
21711da177e4SLinus Torvalds int res;
21728d1c802bSDavid Ahern struct fib6_info *rt;
217394b2cfe0SHannes Frederic Sowa struct fib6_cleaner *c = container_of(w, struct fib6_cleaner, w);
2174ec7d43c2SBenjamin Thery struct nl_info info = {
2175ec7d43c2SBenjamin Thery .nl_net = c->net,
21767c6bb7d2SDavid Ahern .skip_notify = c->skip_notify,
2177ec7d43c2SBenjamin Thery };
21781da177e4SLinus Torvalds
2179327571cbSHannes Frederic Sowa if (c->sernum != FIB6_NO_SERNUM_CHANGE &&
2180aafc2e32SEric Dumazet READ_ONCE(w->node->fn_sernum) != c->sernum)
2181aafc2e32SEric Dumazet WRITE_ONCE(w->node->fn_sernum, c->sernum);
2182327571cbSHannes Frederic Sowa
2183327571cbSHannes Frederic Sowa if (!c->func) {
2184327571cbSHannes Frederic Sowa WARN_ON_ONCE(c->sernum == FIB6_NO_SERNUM_CHANGE);
2185327571cbSHannes Frederic Sowa w->leaf = NULL;
2186327571cbSHannes Frederic Sowa return 0;
2187327571cbSHannes Frederic Sowa }
2188327571cbSHannes Frederic Sowa
218966f5d6ceSWei Wang for_each_fib6_walker_rt(w) {
21901da177e4SLinus Torvalds res = c->func(rt, c->arg);
2191b5cb5a75SIdo Schimmel if (res == -1) {
21921da177e4SLinus Torvalds w->leaf = rt;
2193528c4cebSDenis V. Lunev res = fib6_del(rt, &info);
21941da177e4SLinus Torvalds if (res) {
21951da177e4SLinus Torvalds #if RT6_DEBUG >= 2
219691df42beSJoe Perches pr_debug("%s: del failed: rt=%p@%p err=%d\n",
21974e587ea7SWei Wang __func__, rt,
219893c2fb25SDavid Ahern rcu_access_pointer(rt->fib6_node),
21994e587ea7SWei Wang res);
22001da177e4SLinus Torvalds #endif
22011da177e4SLinus Torvalds continue;
22021da177e4SLinus Torvalds }
22031da177e4SLinus Torvalds return 0;
2204b5cb5a75SIdo Schimmel } else if (res == -2) {
220593c2fb25SDavid Ahern if (WARN_ON(!rt->fib6_nsiblings))
2206b5cb5a75SIdo Schimmel continue;
220793c2fb25SDavid Ahern rt = list_last_entry(&rt->fib6_siblings,
220893c2fb25SDavid Ahern struct fib6_info, fib6_siblings);
2209b5cb5a75SIdo Schimmel continue;
22101da177e4SLinus Torvalds }
2211547b792cSIlpo Järvinen WARN_ON(res != 0);
22121da177e4SLinus Torvalds }
22131da177e4SLinus Torvalds w->leaf = rt;
22141da177e4SLinus Torvalds return 0;
22151da177e4SLinus Torvalds }
22161da177e4SLinus Torvalds
22171da177e4SLinus Torvalds /*
22181da177e4SLinus Torvalds * Convenient frontend to tree walker.
22191da177e4SLinus Torvalds *
22201da177e4SLinus Torvalds * func is called on each route.
2221b5cb5a75SIdo Schimmel * It may return -2 -> skip multipath route.
2222b5cb5a75SIdo Schimmel * -1 -> delete this route.
22231da177e4SLinus Torvalds * 0 -> continue walking
22241da177e4SLinus Torvalds */
22251da177e4SLinus Torvalds
fib6_clean_tree(struct net * net,struct fib6_node * root,int (* func)(struct fib6_info *,void * arg),int sernum,void * arg,bool skip_notify)2226ec7d43c2SBenjamin Thery static void fib6_clean_tree(struct net *net, struct fib6_node *root,
22278d1c802bSDavid Ahern int (*func)(struct fib6_info *, void *arg),
22287c6bb7d2SDavid Ahern int sernum, void *arg, bool skip_notify)
22291da177e4SLinus Torvalds {
223094b2cfe0SHannes Frederic Sowa struct fib6_cleaner c;
22311da177e4SLinus Torvalds
22321da177e4SLinus Torvalds c.w.root = root;
22331da177e4SLinus Torvalds c.w.func = fib6_clean_node;
22342bec5a36SPatrick McHardy c.w.count = 0;
22352bec5a36SPatrick McHardy c.w.skip = 0;
22361e47b483SStefano Brivio c.w.skip_in_node = 0;
22371da177e4SLinus Torvalds c.func = func;
2238327571cbSHannes Frederic Sowa c.sernum = sernum;
22391da177e4SLinus Torvalds c.arg = arg;
2240ec7d43c2SBenjamin Thery c.net = net;
22417c6bb7d2SDavid Ahern c.skip_notify = skip_notify;
22421da177e4SLinus Torvalds
22439a03cd8fSMichal Kubeček fib6_walk(net, &c.w);
22441da177e4SLinus Torvalds }
22451da177e4SLinus Torvalds
/*
 * Run fib6_clean_tree() over every table hashed in @net.
 *
 * The hash buckets are traversed under rcu_read_lock(); each table's
 * tb6_lock is held (BH disabled) for the duration of its own walk.
 */
static void __fib6_clean_all(struct net *net,
			     int (*func)(struct fib6_info *, void *),
			     int sernum, void *arg, bool skip_notify)
{
	unsigned int bucket;

	rcu_read_lock();
	for (bucket = 0; bucket < FIB6_TABLE_HASHSZ; bucket++) {
		struct hlist_head *head = &net->ipv6.fib_table_hash[bucket];
		struct fib6_table *tb;

		hlist_for_each_entry_rcu(tb, head, tb6_hlist) {
			spin_lock_bh(&tb->tb6_lock);
			fib6_clean_tree(net, &tb->tb6_root,
					func, sernum, arg, skip_notify);
			spin_unlock_bh(&tb->tb6_lock);
		}
	}
	rcu_read_unlock();
}
2266c71099acSThomas Graf
fib6_clean_all(struct net * net,int (* func)(struct fib6_info *,void *),void * arg)22678d1c802bSDavid Ahern void fib6_clean_all(struct net *net, int (*func)(struct fib6_info *, void *),
2268327571cbSHannes Frederic Sowa void *arg)
2269327571cbSHannes Frederic Sowa {
22707c6bb7d2SDavid Ahern __fib6_clean_all(net, func, FIB6_NO_SERNUM_CHANGE, arg, false);
22717c6bb7d2SDavid Ahern }
22727c6bb7d2SDavid Ahern
fib6_clean_all_skip_notify(struct net * net,int (* func)(struct fib6_info *,void *),void * arg)22737c6bb7d2SDavid Ahern void fib6_clean_all_skip_notify(struct net *net,
22747c6bb7d2SDavid Ahern int (*func)(struct fib6_info *, void *),
22757c6bb7d2SDavid Ahern void *arg)
22767c6bb7d2SDavid Ahern {
22777c6bb7d2SDavid Ahern __fib6_clean_all(net, func, FIB6_NO_SERNUM_CHANGE, arg, true);
2278327571cbSHannes Frederic Sowa }
2279327571cbSHannes Frederic Sowa
fib6_flush_trees(struct net * net)2280705f1c86SHannes Frederic Sowa static void fib6_flush_trees(struct net *net)
2281705f1c86SHannes Frederic Sowa {
2282812918c4SHannes Frederic Sowa int new_sernum = fib6_new_sernum(net);
2283705f1c86SHannes Frederic Sowa
22847c6bb7d2SDavid Ahern __fib6_clean_all(net, NULL, new_sernum, NULL, false);
2285705f1c86SHannes Frederic Sowa }
2286705f1c86SHannes Frederic Sowa
22871da177e4SLinus Torvalds /*
22881da177e4SLinus Torvalds * Garbage collection
22891da177e4SLinus Torvalds */
22901da177e4SLinus Torvalds
fib6_age(struct fib6_info * rt,void * arg)2291b577b9aaSDavid Ahern static int fib6_age(struct fib6_info *rt, void *arg)
22921da177e4SLinus Torvalds {
2293b577b9aaSDavid Ahern struct fib6_gc_args *gc_args = arg;
22941da177e4SLinus Torvalds unsigned long now = jiffies;
22951da177e4SLinus Torvalds
22961da177e4SLinus Torvalds /*
22971da177e4SLinus Torvalds * check addrconf expiration here.
22981da177e4SLinus Torvalds * Routes are expired even if they are in use.
22991da177e4SLinus Torvalds */
23001da177e4SLinus Torvalds
2301b577b9aaSDavid Ahern if (rt->fib6_flags & RTF_EXPIRES && rt->expires) {
230214895687SDavid Ahern if (time_after(now, rt->expires)) {
23031da177e4SLinus Torvalds RT6_TRACE("expiring %p\n", rt);
23041da177e4SLinus Torvalds return -1;
23051da177e4SLinus Torvalds }
23063570df91SMichal Kubeček gc_args->more++;
23071da177e4SLinus Torvalds }
23081da177e4SLinus Torvalds
2309c757faa8SWei Wang /* Also age clones in the exception table.
2310c757faa8SWei Wang * Note, that clones are aged out
2311c757faa8SWei Wang * only if they are not in use now.
2312c757faa8SWei Wang */
2313c757faa8SWei Wang rt6_age_exceptions(rt, gc_args, now);
2314c757faa8SWei Wang
23151da177e4SLinus Torvalds return 0;
23161da177e4SLinus Torvalds }
23171da177e4SLinus Torvalds
/*
 * Run one garbage-collection pass over all tables of @net.
 *
 * @expires: GC timeout to use; 0 selects the ip6_rt_gc_interval sysctl.
 * @net:     namespace to collect.
 * @force:   when true, wait for fib6_gc_lock; when false, only try the
 *           lock and, if it is contended, re-arm the timer for one second
 *           later and give up.
 *
 * After the pass the GC timer is re-armed if any route reported more work
 * pending, and deleted otherwise.
 */
void fib6_run_gc(unsigned long expires, struct net *net, bool force)
{
	struct fib6_gc_args gc_args;
	unsigned long now;

	if (!force) {
		if (!spin_trylock_bh(&net->ipv6.fib6_gc_lock)) {
			mod_timer(&net->ipv6.ip6_fib_timer, jiffies + HZ);
			return;
		}
	} else {
		spin_lock_bh(&net->ipv6.fib6_gc_lock);
	}

	if (expires)
		gc_args.timeout = (int)expires;
	else
		gc_args.timeout = net->ipv6.sysctl.ip6_rt_gc_interval;
	gc_args.more = 0;

	fib6_clean_all(net, fib6_age, &gc_args);
	now = jiffies;
	net->ipv6.ip6_rt_last_gc = now;

	if (!gc_args.more)
		del_timer(&net->ipv6.ip6_fib_timer);
	else
		mod_timer(&net->ipv6.ip6_fib_timer,
			  round_jiffies(now
					+ net->ipv6.sysctl.ip6_rt_gc_interval));
	spin_unlock_bh(&net->ipv6.fib6_gc_lock);
}
23451da177e4SLinus Torvalds
fib6_gc_timer_cb(struct timer_list * t)234686cb30ecSKees Cook static void fib6_gc_timer_cb(struct timer_list *t)
23475b7c931dSDaniel Lezcano {
234886cb30ecSKees Cook struct net *arg = from_timer(arg, t, ipv6.ip6_fib_timer);
234986cb30ecSKees Cook
235086cb30ecSKees Cook fib6_run_gc(0, arg, true);
23515b7c931dSDaniel Lezcano }
23525b7c931dSDaniel Lezcano
fib6_net_init(struct net * net)23532c8c1e72SAlexey Dobriyan static int __net_init fib6_net_init(struct net *net)
235458f09b78SDaniel Lezcano {
235510da66f7SEric Dumazet size_t size = sizeof(struct hlist_head) * FIB6_TABLE_HASHSZ;
235616ab6d7dSIdo Schimmel int err;
235716ab6d7dSIdo Schimmel
235816ab6d7dSIdo Schimmel err = fib6_notifier_init(net);
235916ab6d7dSIdo Schimmel if (err)
236016ab6d7dSIdo Schimmel return err;
236110da66f7SEric Dumazet
2362ed13923fSIdo Schimmel /* Default to 3-tuple */
2363ed13923fSIdo Schimmel net->ipv6.sysctl.multipath_hash_fields =
2364ed13923fSIdo Schimmel FIB_MULTIPATH_HASH_FIELD_DEFAULT_MASK;
2365ed13923fSIdo Schimmel
23663dc94f93SMichal Kubeček spin_lock_init(&net->ipv6.fib6_gc_lock);
23679a03cd8fSMichal Kubeček rwlock_init(&net->ipv6.fib6_walker_lock);
23689a03cd8fSMichal Kubeček INIT_LIST_HEAD(&net->ipv6.fib6_walkers);
236986cb30ecSKees Cook timer_setup(&net->ipv6.ip6_fib_timer, fib6_gc_timer_cb, 0);
237063152fc0SDaniel Lezcano
2371c572872fSBenjamin Thery net->ipv6.rt6_stats = kzalloc(sizeof(*net->ipv6.rt6_stats), GFP_KERNEL);
2372c572872fSBenjamin Thery if (!net->ipv6.rt6_stats)
237367db5ca7SIdo Schimmel goto out_notifier;
2374c572872fSBenjamin Thery
237510da66f7SEric Dumazet /* Avoid false sharing : Use at least a full cache line */
237610da66f7SEric Dumazet size = max_t(size_t, size, L1_CACHE_BYTES);
237710da66f7SEric Dumazet
237810da66f7SEric Dumazet net->ipv6.fib_table_hash = kzalloc(size, GFP_KERNEL);
237958f09b78SDaniel Lezcano if (!net->ipv6.fib_table_hash)
2380c572872fSBenjamin Thery goto out_rt6_stats;
238158f09b78SDaniel Lezcano
238258f09b78SDaniel Lezcano net->ipv6.fib6_main_tbl = kzalloc(sizeof(*net->ipv6.fib6_main_tbl),
238358f09b78SDaniel Lezcano GFP_KERNEL);
238458f09b78SDaniel Lezcano if (!net->ipv6.fib6_main_tbl)
238558f09b78SDaniel Lezcano goto out_fib_table_hash;
238658f09b78SDaniel Lezcano
238758f09b78SDaniel Lezcano net->ipv6.fib6_main_tbl->tb6_id = RT6_TABLE_MAIN;
238866f5d6ceSWei Wang rcu_assign_pointer(net->ipv6.fib6_main_tbl->tb6_root.leaf,
2389421842edSDavid Ahern net->ipv6.fib6_null_entry);
239058f09b78SDaniel Lezcano net->ipv6.fib6_main_tbl->tb6_root.fn_flags =
239158f09b78SDaniel Lezcano RTN_ROOT | RTN_TL_ROOT | RTN_RTINFO;
23928e773277SDavid S. Miller inet_peer_base_init(&net->ipv6.fib6_main_tbl->tb6_peers);
239358f09b78SDaniel Lezcano
239458f09b78SDaniel Lezcano #ifdef CONFIG_IPV6_MULTIPLE_TABLES
239558f09b78SDaniel Lezcano net->ipv6.fib6_local_tbl = kzalloc(sizeof(*net->ipv6.fib6_local_tbl),
239658f09b78SDaniel Lezcano GFP_KERNEL);
239758f09b78SDaniel Lezcano if (!net->ipv6.fib6_local_tbl)
239858f09b78SDaniel Lezcano goto out_fib6_main_tbl;
239958f09b78SDaniel Lezcano net->ipv6.fib6_local_tbl->tb6_id = RT6_TABLE_LOCAL;
240066f5d6ceSWei Wang rcu_assign_pointer(net->ipv6.fib6_local_tbl->tb6_root.leaf,
2401421842edSDavid Ahern net->ipv6.fib6_null_entry);
240258f09b78SDaniel Lezcano net->ipv6.fib6_local_tbl->tb6_root.fn_flags =
240358f09b78SDaniel Lezcano RTN_ROOT | RTN_TL_ROOT | RTN_RTINFO;
24048e773277SDavid S. Miller inet_peer_base_init(&net->ipv6.fib6_local_tbl->tb6_peers);
240558f09b78SDaniel Lezcano #endif
240658f09b78SDaniel Lezcano fib6_tables_init(net);
240758f09b78SDaniel Lezcano
2408417f28bbSStephen Hemminger return 0;
240958f09b78SDaniel Lezcano
241058f09b78SDaniel Lezcano #ifdef CONFIG_IPV6_MULTIPLE_TABLES
241158f09b78SDaniel Lezcano out_fib6_main_tbl:
241258f09b78SDaniel Lezcano kfree(net->ipv6.fib6_main_tbl);
241358f09b78SDaniel Lezcano #endif
241458f09b78SDaniel Lezcano out_fib_table_hash:
241558f09b78SDaniel Lezcano kfree(net->ipv6.fib_table_hash);
2416c572872fSBenjamin Thery out_rt6_stats:
2417c572872fSBenjamin Thery kfree(net->ipv6.rt6_stats);
241867db5ca7SIdo Schimmel out_notifier:
241916ab6d7dSIdo Schimmel fib6_notifier_exit(net);
2420417f28bbSStephen Hemminger return -ENOMEM;
242158f09b78SDaniel Lezcano }
242258f09b78SDaniel Lezcano
fib6_net_exit(struct net * net)242358f09b78SDaniel Lezcano static void fib6_net_exit(struct net *net)
242458f09b78SDaniel Lezcano {
2425ba1cc08dSSabrina Dubroca unsigned int i;
2426ba1cc08dSSabrina Dubroca
2427417f28bbSStephen Hemminger del_timer_sync(&net->ipv6.ip6_fib_timer);
2428417f28bbSStephen Hemminger
242932a805baSEric Dumazet for (i = 0; i < FIB6_TABLE_HASHSZ; i++) {
2430ba1cc08dSSabrina Dubroca struct hlist_head *head = &net->ipv6.fib_table_hash[i];
2431ba1cc08dSSabrina Dubroca struct hlist_node *tmp;
2432ba1cc08dSSabrina Dubroca struct fib6_table *tb;
2433ba1cc08dSSabrina Dubroca
2434ba1cc08dSSabrina Dubroca hlist_for_each_entry_safe(tb, tmp, head, tb6_hlist) {
2435ba1cc08dSSabrina Dubroca hlist_del(&tb->tb6_hlist);
2436ba1cc08dSSabrina Dubroca fib6_free_table(tb);
2437ba1cc08dSSabrina Dubroca }
2438ba1cc08dSSabrina Dubroca }
2439ba1cc08dSSabrina Dubroca
244058f09b78SDaniel Lezcano kfree(net->ipv6.fib_table_hash);
2441c572872fSBenjamin Thery kfree(net->ipv6.rt6_stats);
244216ab6d7dSIdo Schimmel fib6_notifier_exit(net);
244358f09b78SDaniel Lezcano }
244458f09b78SDaniel Lezcano
244558f09b78SDaniel Lezcano static struct pernet_operations fib6_net_ops = {
244658f09b78SDaniel Lezcano .init = fib6_net_init,
244758f09b78SDaniel Lezcano .exit = fib6_net_exit,
244858f09b78SDaniel Lezcano };
244958f09b78SDaniel Lezcano
fib6_init(void)2450d63bddbeSDaniel Lezcano int __init fib6_init(void)
24511da177e4SLinus Torvalds {
2452e0b85590SDaniel Lezcano int ret = -ENOMEM;
245363152fc0SDaniel Lezcano
24541da177e4SLinus Torvalds fib6_node_kmem = kmem_cache_create("fib6_nodes",
24556126891cSVasily Averin sizeof(struct fib6_node), 0,
24566126891cSVasily Averin SLAB_HWCACHE_ALIGN | SLAB_ACCOUNT,
245720c2df83SPaul Mundt NULL);
2458f845ab6bSDaniel Lezcano if (!fib6_node_kmem)
2459e0b85590SDaniel Lezcano goto out;
2460e0b85590SDaniel Lezcano
246158f09b78SDaniel Lezcano ret = register_pernet_subsys(&fib6_net_ops);
246258f09b78SDaniel Lezcano if (ret)
2463c572872fSBenjamin Thery goto out_kmem_cache_create;
2464e8803b6cSDavid S. Miller
246516feebcfSFlorian Westphal ret = rtnl_register_module(THIS_MODULE, PF_INET6, RTM_GETROUTE, NULL,
246616feebcfSFlorian Westphal inet6_dump_fib, 0);
2467e8803b6cSDavid S. Miller if (ret)
2468e8803b6cSDavid S. Miller goto out_unregister_subsys;
2469705f1c86SHannes Frederic Sowa
2470705f1c86SHannes Frederic Sowa __fib6_flush_trees = fib6_flush_trees;
2471d63bddbeSDaniel Lezcano out:
2472d63bddbeSDaniel Lezcano return ret;
2473d63bddbeSDaniel Lezcano
2474e8803b6cSDavid S. Miller out_unregister_subsys:
2475e8803b6cSDavid S. Miller unregister_pernet_subsys(&fib6_net_ops);
2476d63bddbeSDaniel Lezcano out_kmem_cache_create:
2477d63bddbeSDaniel Lezcano kmem_cache_destroy(fib6_node_kmem);
2478d63bddbeSDaniel Lezcano goto out;
24791da177e4SLinus Torvalds }
24801da177e4SLinus Torvalds
fib6_gc_cleanup(void)24811da177e4SLinus Torvalds void fib6_gc_cleanup(void)
24821da177e4SLinus Torvalds {
248358f09b78SDaniel Lezcano unregister_pernet_subsys(&fib6_net_ops);
24841da177e4SLinus Torvalds kmem_cache_destroy(fib6_node_kmem);
24851da177e4SLinus Torvalds }
24868d2ca1d7SHannes Frederic Sowa
24878d2ca1d7SHannes Frederic Sowa #ifdef CONFIG_PROC_FS
ipv6_route_native_seq_show(struct seq_file * seq,void * v)2488138d0be3SYonghong Song static int ipv6_route_native_seq_show(struct seq_file *seq, void *v)
24898d2ca1d7SHannes Frederic Sowa {
24908d1c802bSDavid Ahern struct fib6_info *rt = v;
24918d2ca1d7SHannes Frederic Sowa struct ipv6_route_iter *iter = seq->private;
2492f88d8ea6SDavid Ahern struct fib6_nh *fib6_nh = rt->fib6_nh;
24932b2450caSDavid Ahern unsigned int flags = rt->fib6_flags;
24945e670d84SDavid Ahern const struct net_device *dev;
24958d2ca1d7SHannes Frederic Sowa
2496f88d8ea6SDavid Ahern if (rt->nh)
2497ef1148d4SEric Dumazet fib6_nh = nexthop_fib6_nh(rt->nh);
2498f88d8ea6SDavid Ahern
249993c2fb25SDavid Ahern seq_printf(seq, "%pi6 %02x ", &rt->fib6_dst.addr, rt->fib6_dst.plen);
25008d2ca1d7SHannes Frederic Sowa
25018d2ca1d7SHannes Frederic Sowa #ifdef CONFIG_IPV6_SUBTREES
250293c2fb25SDavid Ahern seq_printf(seq, "%pi6 %02x ", &rt->fib6_src.addr, rt->fib6_src.plen);
25038d2ca1d7SHannes Frederic Sowa #else
25048d2ca1d7SHannes Frederic Sowa seq_puts(seq, "00000000000000000000000000000000 00 ");
25058d2ca1d7SHannes Frederic Sowa #endif
2506f88d8ea6SDavid Ahern if (fib6_nh->fib_nh_gw_family) {
25072b2450caSDavid Ahern flags |= RTF_GATEWAY;
2508f88d8ea6SDavid Ahern seq_printf(seq, "%pi6", &fib6_nh->fib_nh_gw6);
25092b2450caSDavid Ahern } else {
25108d2ca1d7SHannes Frederic Sowa seq_puts(seq, "00000000000000000000000000000000");
25112b2450caSDavid Ahern }
25128d2ca1d7SHannes Frederic Sowa
2513f88d8ea6SDavid Ahern dev = fib6_nh->fib_nh_dev;
25148d2ca1d7SHannes Frederic Sowa seq_printf(seq, " %08x %08x %08x %08x %8s\n",
2515f05713e0SEric Dumazet rt->fib6_metric, refcount_read(&rt->fib6_ref), 0,
25162b2450caSDavid Ahern flags, dev ? dev->name : "");
25178d2ca1d7SHannes Frederic Sowa iter->w.leaf = NULL;
25188d2ca1d7SHannes Frederic Sowa return 0;
25198d2ca1d7SHannes Frederic Sowa }
25208d2ca1d7SHannes Frederic Sowa
ipv6_route_yield(struct fib6_walker * w)252194b2cfe0SHannes Frederic Sowa static int ipv6_route_yield(struct fib6_walker *w)
25228d2ca1d7SHannes Frederic Sowa {
25238d2ca1d7SHannes Frederic Sowa struct ipv6_route_iter *iter = w->args;
25248d2ca1d7SHannes Frederic Sowa
25258d2ca1d7SHannes Frederic Sowa if (!iter->skip)
25268d2ca1d7SHannes Frederic Sowa return 1;
25278d2ca1d7SHannes Frederic Sowa
25288d2ca1d7SHannes Frederic Sowa do {
252966f5d6ceSWei Wang iter->w.leaf = rcu_dereference_protected(
25308fb11a9aSDavid Ahern iter->w.leaf->fib6_next,
253166f5d6ceSWei Wang lockdep_is_held(&iter->tbl->tb6_lock));
25328d2ca1d7SHannes Frederic Sowa iter->skip--;
25338d2ca1d7SHannes Frederic Sowa if (!iter->skip && iter->w.leaf)
25348d2ca1d7SHannes Frederic Sowa return 1;
25358d2ca1d7SHannes Frederic Sowa } while (iter->w.leaf);
25368d2ca1d7SHannes Frederic Sowa
25378d2ca1d7SHannes Frederic Sowa return 0;
25388d2ca1d7SHannes Frederic Sowa }
25398d2ca1d7SHannes Frederic Sowa
ipv6_route_seq_setup_walk(struct ipv6_route_iter * iter,struct net * net)25409a03cd8fSMichal Kubeček static void ipv6_route_seq_setup_walk(struct ipv6_route_iter *iter,
25419a03cd8fSMichal Kubeček struct net *net)
25428d2ca1d7SHannes Frederic Sowa {
25438d2ca1d7SHannes Frederic Sowa memset(&iter->w, 0, sizeof(iter->w));
25448d2ca1d7SHannes Frederic Sowa iter->w.func = ipv6_route_yield;
25458d2ca1d7SHannes Frederic Sowa iter->w.root = &iter->tbl->tb6_root;
25468d2ca1d7SHannes Frederic Sowa iter->w.state = FWS_INIT;
25478d2ca1d7SHannes Frederic Sowa iter->w.node = iter->w.root;
25488d2ca1d7SHannes Frederic Sowa iter->w.args = iter;
2549aafc2e32SEric Dumazet iter->sernum = READ_ONCE(iter->w.root->fn_sernum);
25508d2ca1d7SHannes Frederic Sowa INIT_LIST_HEAD(&iter->w.lh);
25519a03cd8fSMichal Kubeček fib6_walker_link(net, &iter->w);
25528d2ca1d7SHannes Frederic Sowa }
25538d2ca1d7SHannes Frederic Sowa
ipv6_route_seq_next_table(struct fib6_table * tbl,struct net * net)25548d2ca1d7SHannes Frederic Sowa static struct fib6_table *ipv6_route_seq_next_table(struct fib6_table *tbl,
25558d2ca1d7SHannes Frederic Sowa struct net *net)
25568d2ca1d7SHannes Frederic Sowa {
25578d2ca1d7SHannes Frederic Sowa unsigned int h;
25588d2ca1d7SHannes Frederic Sowa struct hlist_node *node;
25598d2ca1d7SHannes Frederic Sowa
25608d2ca1d7SHannes Frederic Sowa if (tbl) {
25618d2ca1d7SHannes Frederic Sowa h = (tbl->tb6_id & (FIB6_TABLE_HASHSZ - 1)) + 1;
2562ef1148d4SEric Dumazet node = rcu_dereference(hlist_next_rcu(&tbl->tb6_hlist));
25638d2ca1d7SHannes Frederic Sowa } else {
25648d2ca1d7SHannes Frederic Sowa h = 0;
25658d2ca1d7SHannes Frederic Sowa node = NULL;
25668d2ca1d7SHannes Frederic Sowa }
25678d2ca1d7SHannes Frederic Sowa
25688d2ca1d7SHannes Frederic Sowa while (!node && h < FIB6_TABLE_HASHSZ) {
2569ef1148d4SEric Dumazet node = rcu_dereference(
25708d2ca1d7SHannes Frederic Sowa hlist_first_rcu(&net->ipv6.fib_table_hash[h++]));
25718d2ca1d7SHannes Frederic Sowa }
25728d2ca1d7SHannes Frederic Sowa return hlist_entry_safe(node, struct fib6_table, tb6_hlist);
25738d2ca1d7SHannes Frederic Sowa }
25748d2ca1d7SHannes Frederic Sowa
ipv6_route_check_sernum(struct ipv6_route_iter * iter)25750a67d3efSHannes Frederic Sowa static void ipv6_route_check_sernum(struct ipv6_route_iter *iter)
25760a67d3efSHannes Frederic Sowa {
2577aafc2e32SEric Dumazet int sernum = READ_ONCE(iter->w.root->fn_sernum);
2578aafc2e32SEric Dumazet
2579aafc2e32SEric Dumazet if (iter->sernum != sernum) {
2580aafc2e32SEric Dumazet iter->sernum = sernum;
25810a67d3efSHannes Frederic Sowa iter->w.state = FWS_INIT;
25820a67d3efSHannes Frederic Sowa iter->w.node = iter->w.root;
25830a67d3efSHannes Frederic Sowa WARN_ON(iter->w.skip);
25840a67d3efSHannes Frederic Sowa iter->w.skip = iter->w.count;
25850a67d3efSHannes Frederic Sowa }
25860a67d3efSHannes Frederic Sowa }
25870a67d3efSHannes Frederic Sowa
/*
 * seq_file ->next callback: advance *pos and return the next route entry.
 *
 * @v is the entry returned previously, or NULL when called from
 * ipv6_route_seq_start().  If @v has a successor on its fib6_next chain
 * that successor is returned directly.  Otherwise the walker is resumed
 * under the table's tb6_lock; when the current table yields nothing more,
 * the walker is unlinked and the walk moves on to the next table.
 *
 * Returns NULL when the walker reports an error (negative result) or when
 * there are no more tables.
 */
static void *ipv6_route_seq_next(struct seq_file *seq, void *v, loff_t *pos)
{
	struct ipv6_route_iter *iter = seq->private;
	struct net *net = seq_file_net(seq);
	int ret;

	++(*pos);

	if (v) {
		struct fib6_info *sibling;

		sibling = rcu_dereference(((struct fib6_info *)v)->fib6_next);
		if (sibling)
			return sibling;
	}

	for (;;) {
		ipv6_route_check_sernum(iter);

		spin_lock_bh(&iter->tbl->tb6_lock);
		ret = fib6_walk_continue(&iter->w);
		spin_unlock_bh(&iter->tbl->tb6_lock);

		if (ret > 0)
			return iter->w.leaf;

		/* Error or end of this table: the walker is unlinked either way. */
		fib6_walker_unlink(net, &iter->w);
		if (ret < 0)
			return NULL;

		iter->tbl = ipv6_route_seq_next_table(iter->tbl, net);
		if (!iter->tbl)
			return NULL;

		ipv6_route_seq_setup_walk(iter, net);
	}
}
26238d2ca1d7SHannes Frederic Sowa
/*
 * seq_file ->start callback.
 *
 * Takes the RCU read lock (it is held on return, including when NULL is
 * returned), selects the first table, stores *pos as the number of entries
 * to skip, and fetches the first entry through ipv6_route_seq_next().  A
 * scratch position is handed to that call so the caller's *pos is left
 * untouched.
 */
static void *ipv6_route_seq_start(struct seq_file *seq, loff_t *pos)
	__acquires(RCU)
{
	struct ipv6_route_iter *iter = seq->private;
	struct net *net = seq_file_net(seq);
	loff_t scratch = 0;

	rcu_read_lock();

	iter->skip = *pos;
	iter->tbl = ipv6_route_seq_next_table(NULL, net);
	if (!iter->tbl)
		return NULL;

	ipv6_route_seq_setup_walk(iter, net);
	return ipv6_route_seq_next(seq, NULL, &scratch);
}
26438d2ca1d7SHannes Frederic Sowa
ipv6_route_iter_active(struct ipv6_route_iter * iter)26448d2ca1d7SHannes Frederic Sowa static bool ipv6_route_iter_active(struct ipv6_route_iter *iter)
26458d2ca1d7SHannes Frederic Sowa {
264694b2cfe0SHannes Frederic Sowa struct fib6_walker *w = &iter->w;
26478d2ca1d7SHannes Frederic Sowa return w->node && !(w->state == FWS_U && w->node == w->root);
26488d2ca1d7SHannes Frederic Sowa }
26498d2ca1d7SHannes Frederic Sowa
ipv6_route_native_seq_stop(struct seq_file * seq,void * v)2650138d0be3SYonghong Song static void ipv6_route_native_seq_stop(struct seq_file *seq, void *v)
2651ef1148d4SEric Dumazet __releases(RCU)
26528d2ca1d7SHannes Frederic Sowa {
26539a03cd8fSMichal Kubeček struct net *net = seq_file_net(seq);
26548d2ca1d7SHannes Frederic Sowa struct ipv6_route_iter *iter = seq->private;
26558d2ca1d7SHannes Frederic Sowa
26568d2ca1d7SHannes Frederic Sowa if (ipv6_route_iter_active(iter))
26579a03cd8fSMichal Kubeček fib6_walker_unlink(net, &iter->w);
26588d2ca1d7SHannes Frederic Sowa
2659ef1148d4SEric Dumazet rcu_read_unlock();
26608d2ca1d7SHannes Frederic Sowa }
26618d2ca1d7SHannes Frederic Sowa
2662138d0be3SYonghong Song #if IS_BUILTIN(CONFIG_IPV6) && defined(CONFIG_BPF_SYSCALL)
ipv6_route_prog_seq_show(struct bpf_prog * prog,struct bpf_iter_meta * meta,void * v)2663138d0be3SYonghong Song static int ipv6_route_prog_seq_show(struct bpf_prog *prog,
2664138d0be3SYonghong Song struct bpf_iter_meta *meta,
2665138d0be3SYonghong Song void *v)
2666138d0be3SYonghong Song {
2667138d0be3SYonghong Song struct bpf_iter__ipv6_route ctx;
2668138d0be3SYonghong Song
2669138d0be3SYonghong Song ctx.meta = meta;
2670138d0be3SYonghong Song ctx.rt = v;
2671138d0be3SYonghong Song return bpf_iter_run_prog(prog, &ctx);
2672138d0be3SYonghong Song }
2673138d0be3SYonghong Song
ipv6_route_seq_show(struct seq_file * seq,void * v)2674138d0be3SYonghong Song static int ipv6_route_seq_show(struct seq_file *seq, void *v)
2675138d0be3SYonghong Song {
2676138d0be3SYonghong Song struct ipv6_route_iter *iter = seq->private;
2677138d0be3SYonghong Song struct bpf_iter_meta meta;
2678138d0be3SYonghong Song struct bpf_prog *prog;
2679138d0be3SYonghong Song int ret;
2680138d0be3SYonghong Song
2681138d0be3SYonghong Song meta.seq = seq;
2682138d0be3SYonghong Song prog = bpf_iter_get_info(&meta, false);
2683138d0be3SYonghong Song if (!prog)
2684138d0be3SYonghong Song return ipv6_route_native_seq_show(seq, v);
2685138d0be3SYonghong Song
2686138d0be3SYonghong Song ret = ipv6_route_prog_seq_show(prog, &meta, v);
2687138d0be3SYonghong Song iter->w.leaf = NULL;
2688138d0be3SYonghong Song
2689138d0be3SYonghong Song return ret;
2690138d0be3SYonghong Song }
2691138d0be3SYonghong Song
ipv6_route_seq_stop(struct seq_file * seq,void * v)2692138d0be3SYonghong Song static void ipv6_route_seq_stop(struct seq_file *seq, void *v)
2693138d0be3SYonghong Song {
2694138d0be3SYonghong Song struct bpf_iter_meta meta;
2695138d0be3SYonghong Song struct bpf_prog *prog;
2696138d0be3SYonghong Song
2697138d0be3SYonghong Song if (!v) {
2698138d0be3SYonghong Song meta.seq = seq;
2699138d0be3SYonghong Song prog = bpf_iter_get_info(&meta, true);
2700138d0be3SYonghong Song if (prog)
2701138d0be3SYonghong Song (void)ipv6_route_prog_seq_show(prog, &meta, v);
2702138d0be3SYonghong Song }
2703138d0be3SYonghong Song
2704138d0be3SYonghong Song ipv6_route_native_seq_stop(seq, v);
2705138d0be3SYonghong Song }
2706138d0be3SYonghong Song #else
/*
 * seq_file ->show callback for builds without the BPF iterator hook:
 * forwards straight to ipv6_route_native_seq_show().
 */
static int ipv6_route_seq_show(struct seq_file *seq, void *v)
{
	return ipv6_route_native_seq_show(seq, v);
}
2711138d0be3SYonghong Song
/*
 * seq_file ->stop callback for builds without the BPF iterator hook:
 * forwards straight to ipv6_route_native_seq_stop().
 */
static void ipv6_route_seq_stop(struct seq_file *seq, void *v)
{
	ipv6_route_native_seq_stop(seq, v);
}
2716138d0be3SYonghong Song #endif
2717138d0be3SYonghong Song
2718c3506372SChristoph Hellwig const struct seq_operations ipv6_route_seq_ops = {
27198d2ca1d7SHannes Frederic Sowa .start = ipv6_route_seq_start,
27208d2ca1d7SHannes Frederic Sowa .next = ipv6_route_seq_next,
27218d2ca1d7SHannes Frederic Sowa .stop = ipv6_route_seq_stop,
27228d2ca1d7SHannes Frederic Sowa .show = ipv6_route_seq_show
27238d2ca1d7SHannes Frederic Sowa };
27248d2ca1d7SHannes Frederic Sowa #endif /* CONFIG_PROC_FS */
2725