xref: /openbmc/linux/drivers/net/netdevsim/fib.c (revision 8fc4e4aa)
1 /*
2  * Copyright (c) 2018 Cumulus Networks. All rights reserved.
3  * Copyright (c) 2018 David Ahern <dsa@cumulusnetworks.com>
4  *
5  * This software is licensed under the GNU General License Version 2,
6  * June 1991 as shown in the file COPYING in the top-level directory of this
7  * source tree.
8  *
9  * THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS"
10  * WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING,
11  * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
12  * FOR A PARTICULAR PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE
13  * OF THE PROGRAM IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME
14  * THE COST OF ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
15  */
16 
17 #include <linux/bitmap.h>
18 #include <linux/in6.h>
19 #include <linux/kernel.h>
20 #include <linux/list.h>
21 #include <linux/rhashtable.h>
22 #include <linux/spinlock_types.h>
23 #include <linux/types.h>
24 #include <net/fib_notifier.h>
25 #include <net/ip_fib.h>
26 #include <net/ip6_fib.h>
27 #include <net/fib_rules.h>
28 #include <net/net_namespace.h>
29 #include <net/nexthop.h>
30 #include <linux/debugfs.h>
31 
32 #include "netdevsim.h"
33 
34 struct nsim_fib_entry {
35 	u64 max;
36 	atomic64_t num;
37 };
38 
39 struct nsim_per_fib_data {
40 	struct nsim_fib_entry fib;
41 	struct nsim_fib_entry rules;
42 };
43 
44 struct nsim_fib_data {
45 	struct notifier_block fib_nb;
46 	struct nsim_per_fib_data ipv4;
47 	struct nsim_per_fib_data ipv6;
48 	struct nsim_fib_entry nexthops;
49 	struct rhashtable fib_rt_ht;
50 	struct list_head fib_rt_list;
51 	struct mutex fib_lock; /* Protects FIB HT and list */
52 	struct notifier_block nexthop_nb;
53 	struct rhashtable nexthop_ht;
54 	struct devlink *devlink;
55 	struct work_struct fib_event_work;
56 	struct list_head fib_event_queue;
57 	spinlock_t fib_event_queue_lock; /* Protects fib event queue list */
58 	struct mutex nh_lock; /* Protects NH HT */
59 	struct dentry *ddir;
60 	bool fail_route_offload;
61 	bool fail_res_nexthop_group_replace;
62 	bool fail_nexthop_bucket_replace;
63 };
64 
65 struct nsim_fib_rt_key {
66 	unsigned char addr[sizeof(struct in6_addr)];
67 	unsigned char prefix_len;
68 	int family;
69 	u32 tb_id;
70 };
71 
72 struct nsim_fib_rt {
73 	struct nsim_fib_rt_key key;
74 	struct rhash_head ht_node;
75 	struct list_head list;	/* Member of fib_rt_list */
76 };
77 
78 struct nsim_fib4_rt {
79 	struct nsim_fib_rt common;
80 	struct fib_info *fi;
81 	u8 tos;
82 	u8 type;
83 };
84 
85 struct nsim_fib6_rt {
86 	struct nsim_fib_rt common;
87 	struct list_head nh_list;
88 	unsigned int nhs;
89 };
90 
91 struct nsim_fib6_rt_nh {
92 	struct list_head list;	/* Member of nh_list */
93 	struct fib6_info *rt;
94 };
95 
96 struct nsim_fib6_event {
97 	struct fib6_info **rt_arr;
98 	unsigned int nrt6;
99 };
100 
101 struct nsim_fib_event {
102 	struct list_head list; /* node in fib queue */
103 	union {
104 		struct fib_entry_notifier_info fen_info;
105 		struct nsim_fib6_event fib6_event;
106 	};
107 	struct nsim_fib_data *data;
108 	unsigned long event;
109 	int family;
110 };
111 
112 static const struct rhashtable_params nsim_fib_rt_ht_params = {
113 	.key_offset = offsetof(struct nsim_fib_rt, key),
114 	.head_offset = offsetof(struct nsim_fib_rt, ht_node),
115 	.key_len = sizeof(struct nsim_fib_rt_key),
116 	.automatic_shrinking = true,
117 };
118 
119 struct nsim_nexthop {
120 	struct rhash_head ht_node;
121 	u64 occ;
122 	u32 id;
123 	bool is_resilient;
124 };
125 
126 static const struct rhashtable_params nsim_nexthop_ht_params = {
127 	.key_offset = offsetof(struct nsim_nexthop, id),
128 	.head_offset = offsetof(struct nsim_nexthop, ht_node),
129 	.key_len = sizeof(u32),
130 	.automatic_shrinking = true,
131 };
132 
133 u64 nsim_fib_get_val(struct nsim_fib_data *fib_data,
134 		     enum nsim_resource_id res_id, bool max)
135 {
136 	struct nsim_fib_entry *entry;
137 
138 	switch (res_id) {
139 	case NSIM_RESOURCE_IPV4_FIB:
140 		entry = &fib_data->ipv4.fib;
141 		break;
142 	case NSIM_RESOURCE_IPV4_FIB_RULES:
143 		entry = &fib_data->ipv4.rules;
144 		break;
145 	case NSIM_RESOURCE_IPV6_FIB:
146 		entry = &fib_data->ipv6.fib;
147 		break;
148 	case NSIM_RESOURCE_IPV6_FIB_RULES:
149 		entry = &fib_data->ipv6.rules;
150 		break;
151 	case NSIM_RESOURCE_NEXTHOPS:
152 		entry = &fib_data->nexthops;
153 		break;
154 	default:
155 		return 0;
156 	}
157 
158 	return max ? entry->max : atomic64_read(&entry->num);
159 }
160 
161 static void nsim_fib_set_max(struct nsim_fib_data *fib_data,
162 			     enum nsim_resource_id res_id, u64 val)
163 {
164 	struct nsim_fib_entry *entry;
165 
166 	switch (res_id) {
167 	case NSIM_RESOURCE_IPV4_FIB:
168 		entry = &fib_data->ipv4.fib;
169 		break;
170 	case NSIM_RESOURCE_IPV4_FIB_RULES:
171 		entry = &fib_data->ipv4.rules;
172 		break;
173 	case NSIM_RESOURCE_IPV6_FIB:
174 		entry = &fib_data->ipv6.fib;
175 		break;
176 	case NSIM_RESOURCE_IPV6_FIB_RULES:
177 		entry = &fib_data->ipv6.rules;
178 		break;
179 	case NSIM_RESOURCE_NEXTHOPS:
180 		entry = &fib_data->nexthops;
181 		break;
182 	default:
183 		WARN_ON(1);
184 		return;
185 	}
186 	entry->max = val;
187 }
188 
189 static int nsim_fib_rule_account(struct nsim_fib_entry *entry, bool add,
190 				 struct netlink_ext_ack *extack)
191 {
192 	int err = 0;
193 
194 	if (add) {
195 		if (!atomic64_add_unless(&entry->num, 1, entry->max)) {
196 			err = -ENOSPC;
197 			NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported fib rule entries");
198 		}
199 	} else {
200 		atomic64_dec_if_positive(&entry->num);
201 	}
202 
203 	return err;
204 }
205 
206 static int nsim_fib_rule_event(struct nsim_fib_data *data,
207 			       struct fib_notifier_info *info, bool add)
208 {
209 	struct netlink_ext_ack *extack = info->extack;
210 	int err = 0;
211 
212 	switch (info->family) {
213 	case AF_INET:
214 		err = nsim_fib_rule_account(&data->ipv4.rules, add, extack);
215 		break;
216 	case AF_INET6:
217 		err = nsim_fib_rule_account(&data->ipv6.rules, add, extack);
218 		break;
219 	}
220 
221 	return err;
222 }
223 
224 static int nsim_fib_account(struct nsim_fib_entry *entry, bool add)
225 {
226 	int err = 0;
227 
228 	if (add) {
229 		if (!atomic64_add_unless(&entry->num, 1, entry->max))
230 			err = -ENOSPC;
231 	} else {
232 		atomic64_dec_if_positive(&entry->num);
233 	}
234 
235 	return err;
236 }
237 
238 static void nsim_fib_rt_init(struct nsim_fib_data *data,
239 			     struct nsim_fib_rt *fib_rt, const void *addr,
240 			     size_t addr_len, unsigned int prefix_len,
241 			     int family, u32 tb_id)
242 {
243 	memcpy(fib_rt->key.addr, addr, addr_len);
244 	fib_rt->key.prefix_len = prefix_len;
245 	fib_rt->key.family = family;
246 	fib_rt->key.tb_id = tb_id;
247 	list_add(&fib_rt->list, &data->fib_rt_list);
248 }
249 
250 static void nsim_fib_rt_fini(struct nsim_fib_rt *fib_rt)
251 {
252 	list_del(&fib_rt->list);
253 }
254 
255 static struct nsim_fib_rt *nsim_fib_rt_lookup(struct rhashtable *fib_rt_ht,
256 					      const void *addr, size_t addr_len,
257 					      unsigned int prefix_len,
258 					      int family, u32 tb_id)
259 {
260 	struct nsim_fib_rt_key key;
261 
262 	memset(&key, 0, sizeof(key));
263 	memcpy(key.addr, addr, addr_len);
264 	key.prefix_len = prefix_len;
265 	key.family = family;
266 	key.tb_id = tb_id;
267 
268 	return rhashtable_lookup_fast(fib_rt_ht, &key, nsim_fib_rt_ht_params);
269 }
270 
271 static struct nsim_fib4_rt *
272 nsim_fib4_rt_create(struct nsim_fib_data *data,
273 		    struct fib_entry_notifier_info *fen_info)
274 {
275 	struct nsim_fib4_rt *fib4_rt;
276 
277 	fib4_rt = kzalloc(sizeof(*fib4_rt), GFP_KERNEL);
278 	if (!fib4_rt)
279 		return NULL;
280 
281 	nsim_fib_rt_init(data, &fib4_rt->common, &fen_info->dst, sizeof(u32),
282 			 fen_info->dst_len, AF_INET, fen_info->tb_id);
283 
284 	fib4_rt->fi = fen_info->fi;
285 	fib_info_hold(fib4_rt->fi);
286 	fib4_rt->tos = fen_info->tos;
287 	fib4_rt->type = fen_info->type;
288 
289 	return fib4_rt;
290 }
291 
292 static void nsim_fib4_rt_destroy(struct nsim_fib4_rt *fib4_rt)
293 {
294 	fib_info_put(fib4_rt->fi);
295 	nsim_fib_rt_fini(&fib4_rt->common);
296 	kfree(fib4_rt);
297 }
298 
299 static struct nsim_fib4_rt *
300 nsim_fib4_rt_lookup(struct rhashtable *fib_rt_ht,
301 		    const struct fib_entry_notifier_info *fen_info)
302 {
303 	struct nsim_fib_rt *fib_rt;
304 
305 	fib_rt = nsim_fib_rt_lookup(fib_rt_ht, &fen_info->dst, sizeof(u32),
306 				    fen_info->dst_len, AF_INET,
307 				    fen_info->tb_id);
308 	if (!fib_rt)
309 		return NULL;
310 
311 	return container_of(fib_rt, struct nsim_fib4_rt, common);
312 }
313 
314 static void
315 nsim_fib4_rt_offload_failed_flag_set(struct net *net,
316 				     struct fib_entry_notifier_info *fen_info)
317 {
318 	u32 *p_dst = (u32 *)&fen_info->dst;
319 	struct fib_rt_info fri;
320 
321 	fri.fi = fen_info->fi;
322 	fri.tb_id = fen_info->tb_id;
323 	fri.dst = cpu_to_be32(*p_dst);
324 	fri.dst_len = fen_info->dst_len;
325 	fri.tos = fen_info->tos;
326 	fri.type = fen_info->type;
327 	fri.offload = false;
328 	fri.trap = false;
329 	fri.offload_failed = true;
330 	fib_alias_hw_flags_set(net, &fri);
331 }
332 
333 static void nsim_fib4_rt_hw_flags_set(struct net *net,
334 				      const struct nsim_fib4_rt *fib4_rt,
335 				      bool trap)
336 {
337 	u32 *p_dst = (u32 *) fib4_rt->common.key.addr;
338 	int dst_len = fib4_rt->common.key.prefix_len;
339 	struct fib_rt_info fri;
340 
341 	fri.fi = fib4_rt->fi;
342 	fri.tb_id = fib4_rt->common.key.tb_id;
343 	fri.dst = cpu_to_be32(*p_dst);
344 	fri.dst_len = dst_len;
345 	fri.tos = fib4_rt->tos;
346 	fri.type = fib4_rt->type;
347 	fri.offload = false;
348 	fri.trap = trap;
349 	fri.offload_failed = false;
350 	fib_alias_hw_flags_set(net, &fri);
351 }
352 
353 static int nsim_fib4_rt_add(struct nsim_fib_data *data,
354 			    struct nsim_fib4_rt *fib4_rt)
355 {
356 	struct net *net = devlink_net(data->devlink);
357 	int err;
358 
359 	err = rhashtable_insert_fast(&data->fib_rt_ht,
360 				     &fib4_rt->common.ht_node,
361 				     nsim_fib_rt_ht_params);
362 	if (err)
363 		goto err_fib_dismiss;
364 
365 	/* Simulate hardware programming latency. */
366 	msleep(1);
367 	nsim_fib4_rt_hw_flags_set(net, fib4_rt, true);
368 
369 	return 0;
370 
371 err_fib_dismiss:
372 	/* Drop the accounting that was increased from the notification
373 	 * context when FIB_EVENT_ENTRY_REPLACE was triggered.
374 	 */
375 	nsim_fib_account(&data->ipv4.fib, false);
376 	return err;
377 }
378 
379 static int nsim_fib4_rt_replace(struct nsim_fib_data *data,
380 				struct nsim_fib4_rt *fib4_rt,
381 				struct nsim_fib4_rt *fib4_rt_old)
382 {
383 	struct net *net = devlink_net(data->devlink);
384 	int err;
385 
386 	/* We are replacing a route, so need to remove the accounting which
387 	 * was increased when FIB_EVENT_ENTRY_REPLACE was triggered.
388 	 */
389 	err = nsim_fib_account(&data->ipv4.fib, false);
390 	if (err)
391 		return err;
392 	err = rhashtable_replace_fast(&data->fib_rt_ht,
393 				      &fib4_rt_old->common.ht_node,
394 				      &fib4_rt->common.ht_node,
395 				      nsim_fib_rt_ht_params);
396 	if (err)
397 		return err;
398 
399 	msleep(1);
400 	nsim_fib4_rt_hw_flags_set(net, fib4_rt, true);
401 
402 	nsim_fib4_rt_hw_flags_set(net, fib4_rt_old, false);
403 	nsim_fib4_rt_destroy(fib4_rt_old);
404 
405 	return 0;
406 }
407 
408 static int nsim_fib4_rt_insert(struct nsim_fib_data *data,
409 			       struct fib_entry_notifier_info *fen_info)
410 {
411 	struct nsim_fib4_rt *fib4_rt, *fib4_rt_old;
412 	int err;
413 
414 	if (data->fail_route_offload) {
415 		/* For testing purposes, user set debugfs fail_route_offload
416 		 * value to true. Simulate hardware programming latency and then
417 		 * fail.
418 		 */
419 		msleep(1);
420 		return -EINVAL;
421 	}
422 
423 	fib4_rt = nsim_fib4_rt_create(data, fen_info);
424 	if (!fib4_rt)
425 		return -ENOMEM;
426 
427 	fib4_rt_old = nsim_fib4_rt_lookup(&data->fib_rt_ht, fen_info);
428 	if (!fib4_rt_old)
429 		err = nsim_fib4_rt_add(data, fib4_rt);
430 	else
431 		err = nsim_fib4_rt_replace(data, fib4_rt, fib4_rt_old);
432 
433 	if (err)
434 		nsim_fib4_rt_destroy(fib4_rt);
435 
436 	return err;
437 }
438 
439 static void nsim_fib4_rt_remove(struct nsim_fib_data *data,
440 				const struct fib_entry_notifier_info *fen_info)
441 {
442 	struct nsim_fib4_rt *fib4_rt;
443 
444 	fib4_rt = nsim_fib4_rt_lookup(&data->fib_rt_ht, fen_info);
445 	if (!fib4_rt)
446 		return;
447 
448 	rhashtable_remove_fast(&data->fib_rt_ht, &fib4_rt->common.ht_node,
449 			       nsim_fib_rt_ht_params);
450 	nsim_fib4_rt_destroy(fib4_rt);
451 }
452 
453 static int nsim_fib4_event(struct nsim_fib_data *data,
454 			   struct fib_entry_notifier_info *fen_info,
455 			   unsigned long event)
456 {
457 	int err = 0;
458 
459 	switch (event) {
460 	case FIB_EVENT_ENTRY_REPLACE:
461 		err = nsim_fib4_rt_insert(data, fen_info);
462 		if (err) {
463 			struct net *net = devlink_net(data->devlink);
464 
465 			nsim_fib4_rt_offload_failed_flag_set(net, fen_info);
466 		}
467 		break;
468 	case FIB_EVENT_ENTRY_DEL:
469 		nsim_fib4_rt_remove(data, fen_info);
470 		break;
471 	default:
472 		break;
473 	}
474 
475 	return err;
476 }
477 
478 static struct nsim_fib6_rt_nh *
479 nsim_fib6_rt_nh_find(const struct nsim_fib6_rt *fib6_rt,
480 		     const struct fib6_info *rt)
481 {
482 	struct nsim_fib6_rt_nh *fib6_rt_nh;
483 
484 	list_for_each_entry(fib6_rt_nh, &fib6_rt->nh_list, list) {
485 		if (fib6_rt_nh->rt == rt)
486 			return fib6_rt_nh;
487 	}
488 
489 	return NULL;
490 }
491 
492 static int nsim_fib6_rt_nh_add(struct nsim_fib6_rt *fib6_rt,
493 			       struct fib6_info *rt)
494 {
495 	struct nsim_fib6_rt_nh *fib6_rt_nh;
496 
497 	fib6_rt_nh = kzalloc(sizeof(*fib6_rt_nh), GFP_KERNEL);
498 	if (!fib6_rt_nh)
499 		return -ENOMEM;
500 
501 	fib6_info_hold(rt);
502 	fib6_rt_nh->rt = rt;
503 	list_add_tail(&fib6_rt_nh->list, &fib6_rt->nh_list);
504 	fib6_rt->nhs++;
505 
506 	return 0;
507 }
508 
509 #if IS_ENABLED(CONFIG_IPV6)
510 static void nsim_rt6_release(struct fib6_info *rt)
511 {
512 	fib6_info_release(rt);
513 }
514 #else
515 static void nsim_rt6_release(struct fib6_info *rt)
516 {
517 }
518 #endif
519 
520 static void nsim_fib6_rt_nh_del(struct nsim_fib6_rt *fib6_rt,
521 				const struct fib6_info *rt)
522 {
523 	struct nsim_fib6_rt_nh *fib6_rt_nh;
524 
525 	fib6_rt_nh = nsim_fib6_rt_nh_find(fib6_rt, rt);
526 	if (!fib6_rt_nh)
527 		return;
528 
529 	fib6_rt->nhs--;
530 	list_del(&fib6_rt_nh->list);
531 	nsim_rt6_release(fib6_rt_nh->rt);
532 	kfree(fib6_rt_nh);
533 }
534 
535 static struct nsim_fib6_rt *
536 nsim_fib6_rt_create(struct nsim_fib_data *data,
537 		    struct fib6_info **rt_arr, unsigned int nrt6)
538 {
539 	struct fib6_info *rt = rt_arr[0];
540 	struct nsim_fib6_rt *fib6_rt;
541 	int i = 0;
542 	int err;
543 
544 	fib6_rt = kzalloc(sizeof(*fib6_rt), GFP_KERNEL);
545 	if (!fib6_rt)
546 		return ERR_PTR(-ENOMEM);
547 
548 	nsim_fib_rt_init(data, &fib6_rt->common, &rt->fib6_dst.addr,
549 			 sizeof(rt->fib6_dst.addr), rt->fib6_dst.plen, AF_INET6,
550 			 rt->fib6_table->tb6_id);
551 
552 	/* We consider a multipath IPv6 route as one entry, but it can be made
553 	 * up from several fib6_info structs (one for each nexthop), so we
554 	 * add them all to the same list under the entry.
555 	 */
556 	INIT_LIST_HEAD(&fib6_rt->nh_list);
557 
558 	for (i = 0; i < nrt6; i++) {
559 		err = nsim_fib6_rt_nh_add(fib6_rt, rt_arr[i]);
560 		if (err)
561 			goto err_fib6_rt_nh_del;
562 	}
563 
564 	return fib6_rt;
565 
566 err_fib6_rt_nh_del:
567 	for (i--; i >= 0; i--) {
568 		nsim_fib6_rt_nh_del(fib6_rt, rt_arr[i]);
569 	}
570 	nsim_fib_rt_fini(&fib6_rt->common);
571 	kfree(fib6_rt);
572 	return ERR_PTR(err);
573 }
574 
575 static void nsim_fib6_rt_destroy(struct nsim_fib6_rt *fib6_rt)
576 {
577 	struct nsim_fib6_rt_nh *iter, *tmp;
578 
579 	list_for_each_entry_safe(iter, tmp, &fib6_rt->nh_list, list)
580 		nsim_fib6_rt_nh_del(fib6_rt, iter->rt);
581 	WARN_ON_ONCE(!list_empty(&fib6_rt->nh_list));
582 	nsim_fib_rt_fini(&fib6_rt->common);
583 	kfree(fib6_rt);
584 }
585 
586 static struct nsim_fib6_rt *
587 nsim_fib6_rt_lookup(struct rhashtable *fib_rt_ht, const struct fib6_info *rt)
588 {
589 	struct nsim_fib_rt *fib_rt;
590 
591 	fib_rt = nsim_fib_rt_lookup(fib_rt_ht, &rt->fib6_dst.addr,
592 				    sizeof(rt->fib6_dst.addr),
593 				    rt->fib6_dst.plen, AF_INET6,
594 				    rt->fib6_table->tb6_id);
595 	if (!fib_rt)
596 		return NULL;
597 
598 	return container_of(fib_rt, struct nsim_fib6_rt, common);
599 }
600 
601 static int nsim_fib6_rt_append(struct nsim_fib_data *data,
602 			       struct nsim_fib6_event *fib6_event)
603 {
604 	struct fib6_info *rt = fib6_event->rt_arr[0];
605 	struct nsim_fib6_rt *fib6_rt;
606 	int i, err;
607 
608 	if (data->fail_route_offload) {
609 		/* For testing purposes, user set debugfs fail_route_offload
610 		 * value to true. Simulate hardware programming latency and then
611 		 * fail.
612 		 */
613 		msleep(1);
614 		return -EINVAL;
615 	}
616 
617 	fib6_rt = nsim_fib6_rt_lookup(&data->fib_rt_ht, rt);
618 	if (!fib6_rt)
619 		return -EINVAL;
620 
621 	for (i = 0; i < fib6_event->nrt6; i++) {
622 		err = nsim_fib6_rt_nh_add(fib6_rt, fib6_event->rt_arr[i]);
623 		if (err)
624 			goto err_fib6_rt_nh_del;
625 
626 		fib6_event->rt_arr[i]->trap = true;
627 	}
628 
629 	return 0;
630 
631 err_fib6_rt_nh_del:
632 	for (i--; i >= 0; i--) {
633 		fib6_event->rt_arr[i]->trap = false;
634 		nsim_fib6_rt_nh_del(fib6_rt, fib6_event->rt_arr[i]);
635 	}
636 	return err;
637 }
638 
639 #if IS_ENABLED(CONFIG_IPV6)
640 static void nsim_fib6_rt_offload_failed_flag_set(struct nsim_fib_data *data,
641 						 struct fib6_info **rt_arr,
642 						 unsigned int nrt6)
643 
644 {
645 	struct net *net = devlink_net(data->devlink);
646 	int i;
647 
648 	for (i = 0; i < nrt6; i++)
649 		fib6_info_hw_flags_set(net, rt_arr[i], false, false, true);
650 }
651 #else
652 static void nsim_fib6_rt_offload_failed_flag_set(struct nsim_fib_data *data,
653 						 struct fib6_info **rt_arr,
654 						 unsigned int nrt6)
655 {
656 }
657 #endif
658 
659 #if IS_ENABLED(CONFIG_IPV6)
660 static void nsim_fib6_rt_hw_flags_set(struct nsim_fib_data *data,
661 				      const struct nsim_fib6_rt *fib6_rt,
662 				      bool trap)
663 {
664 	struct net *net = devlink_net(data->devlink);
665 	struct nsim_fib6_rt_nh *fib6_rt_nh;
666 
667 	list_for_each_entry(fib6_rt_nh, &fib6_rt->nh_list, list)
668 		fib6_info_hw_flags_set(net, fib6_rt_nh->rt, false, trap, false);
669 }
670 #else
671 static void nsim_fib6_rt_hw_flags_set(struct nsim_fib_data *data,
672 				      const struct nsim_fib6_rt *fib6_rt,
673 				      bool trap)
674 {
675 }
676 #endif
677 
678 static int nsim_fib6_rt_add(struct nsim_fib_data *data,
679 			    struct nsim_fib6_rt *fib6_rt)
680 {
681 	int err;
682 
683 	err = rhashtable_insert_fast(&data->fib_rt_ht,
684 				     &fib6_rt->common.ht_node,
685 				     nsim_fib_rt_ht_params);
686 
687 	if (err)
688 		goto err_fib_dismiss;
689 
690 	msleep(1);
691 	nsim_fib6_rt_hw_flags_set(data, fib6_rt, true);
692 
693 	return 0;
694 
695 err_fib_dismiss:
696 	/* Drop the accounting that was increased from the notification
697 	 * context when FIB_EVENT_ENTRY_REPLACE was triggered.
698 	 */
699 	nsim_fib_account(&data->ipv6.fib, false);
700 	return err;
701 }
702 
703 static int nsim_fib6_rt_replace(struct nsim_fib_data *data,
704 				struct nsim_fib6_rt *fib6_rt,
705 				struct nsim_fib6_rt *fib6_rt_old)
706 {
707 	int err;
708 
709 	/* We are replacing a route, so need to remove the accounting which
710 	 * was increased when FIB_EVENT_ENTRY_REPLACE was triggered.
711 	 */
712 	err = nsim_fib_account(&data->ipv6.fib, false);
713 	if (err)
714 		return err;
715 
716 	err = rhashtable_replace_fast(&data->fib_rt_ht,
717 				      &fib6_rt_old->common.ht_node,
718 				      &fib6_rt->common.ht_node,
719 				      nsim_fib_rt_ht_params);
720 
721 	if (err)
722 		return err;
723 
724 	msleep(1);
725 	nsim_fib6_rt_hw_flags_set(data, fib6_rt, true);
726 
727 	nsim_fib6_rt_hw_flags_set(data, fib6_rt_old, false);
728 	nsim_fib6_rt_destroy(fib6_rt_old);
729 
730 	return 0;
731 }
732 
733 static int nsim_fib6_rt_insert(struct nsim_fib_data *data,
734 			       struct nsim_fib6_event *fib6_event)
735 {
736 	struct fib6_info *rt = fib6_event->rt_arr[0];
737 	struct nsim_fib6_rt *fib6_rt, *fib6_rt_old;
738 	int err;
739 
740 	if (data->fail_route_offload) {
741 		/* For testing purposes, user set debugfs fail_route_offload
742 		 * value to true. Simulate hardware programming latency and then
743 		 * fail.
744 		 */
745 		msleep(1);
746 		return -EINVAL;
747 	}
748 
749 	fib6_rt = nsim_fib6_rt_create(data, fib6_event->rt_arr,
750 				      fib6_event->nrt6);
751 	if (IS_ERR(fib6_rt))
752 		return PTR_ERR(fib6_rt);
753 
754 	fib6_rt_old = nsim_fib6_rt_lookup(&data->fib_rt_ht, rt);
755 	if (!fib6_rt_old)
756 		err = nsim_fib6_rt_add(data, fib6_rt);
757 	else
758 		err = nsim_fib6_rt_replace(data, fib6_rt, fib6_rt_old);
759 
760 	if (err)
761 		nsim_fib6_rt_destroy(fib6_rt);
762 
763 	return err;
764 }
765 
766 static void nsim_fib6_rt_remove(struct nsim_fib_data *data,
767 				struct nsim_fib6_event *fib6_event)
768 {
769 	struct fib6_info *rt = fib6_event->rt_arr[0];
770 	struct nsim_fib6_rt *fib6_rt;
771 	int i;
772 
773 	/* Multipath routes are first added to the FIB trie and only then
774 	 * notified. If we vetoed the addition, we will get a delete
775 	 * notification for a route we do not have. Therefore, do not warn if
776 	 * route was not found.
777 	 */
778 	fib6_rt = nsim_fib6_rt_lookup(&data->fib_rt_ht, rt);
779 	if (!fib6_rt)
780 		return;
781 
782 	/* If not all the nexthops are deleted, then only reduce the nexthop
783 	 * group.
784 	 */
785 	if (fib6_event->nrt6 != fib6_rt->nhs) {
786 		for (i = 0; i < fib6_event->nrt6; i++)
787 			nsim_fib6_rt_nh_del(fib6_rt, fib6_event->rt_arr[i]);
788 		return;
789 	}
790 
791 	rhashtable_remove_fast(&data->fib_rt_ht, &fib6_rt->common.ht_node,
792 			       nsim_fib_rt_ht_params);
793 	nsim_fib6_rt_destroy(fib6_rt);
794 }
795 
796 static int nsim_fib6_event_init(struct nsim_fib6_event *fib6_event,
797 				struct fib6_entry_notifier_info *fen6_info)
798 {
799 	struct fib6_info *rt = fen6_info->rt;
800 	struct fib6_info **rt_arr;
801 	struct fib6_info *iter;
802 	unsigned int nrt6;
803 	int i = 0;
804 
805 	nrt6 = fen6_info->nsiblings + 1;
806 
807 	rt_arr = kcalloc(nrt6, sizeof(struct fib6_info *), GFP_ATOMIC);
808 	if (!rt_arr)
809 		return -ENOMEM;
810 
811 	fib6_event->rt_arr = rt_arr;
812 	fib6_event->nrt6 = nrt6;
813 
814 	rt_arr[0] = rt;
815 	fib6_info_hold(rt);
816 
817 	if (!fen6_info->nsiblings)
818 		return 0;
819 
820 	list_for_each_entry(iter, &rt->fib6_siblings, fib6_siblings) {
821 		if (i == fen6_info->nsiblings)
822 			break;
823 
824 		rt_arr[i + 1] = iter;
825 		fib6_info_hold(iter);
826 		i++;
827 	}
828 	WARN_ON_ONCE(i != fen6_info->nsiblings);
829 
830 	return 0;
831 }
832 
833 static void nsim_fib6_event_fini(struct nsim_fib6_event *fib6_event)
834 {
835 	int i;
836 
837 	for (i = 0; i < fib6_event->nrt6; i++)
838 		nsim_rt6_release(fib6_event->rt_arr[i]);
839 	kfree(fib6_event->rt_arr);
840 }
841 
842 static int nsim_fib6_event(struct nsim_fib_data *data,
843 			   struct nsim_fib6_event *fib6_event,
844 			   unsigned long event)
845 {
846 	int err;
847 
848 	if (fib6_event->rt_arr[0]->fib6_src.plen)
849 		return 0;
850 
851 	switch (event) {
852 	case FIB_EVENT_ENTRY_REPLACE:
853 		err = nsim_fib6_rt_insert(data, fib6_event);
854 		if (err)
855 			goto err_rt_offload_failed_flag_set;
856 		break;
857 	case FIB_EVENT_ENTRY_APPEND:
858 		err = nsim_fib6_rt_append(data, fib6_event);
859 		if (err)
860 			goto err_rt_offload_failed_flag_set;
861 		break;
862 	case FIB_EVENT_ENTRY_DEL:
863 		nsim_fib6_rt_remove(data, fib6_event);
864 		break;
865 	default:
866 		break;
867 	}
868 
869 	return 0;
870 
871 err_rt_offload_failed_flag_set:
872 	nsim_fib6_rt_offload_failed_flag_set(data, fib6_event->rt_arr,
873 					     fib6_event->nrt6);
874 	return err;
875 }
876 
877 static void nsim_fib_event(struct nsim_fib_event *fib_event)
878 {
879 	switch (fib_event->family) {
880 	case AF_INET:
881 		nsim_fib4_event(fib_event->data, &fib_event->fen_info,
882 				fib_event->event);
883 		fib_info_put(fib_event->fen_info.fi);
884 		break;
885 	case AF_INET6:
886 		nsim_fib6_event(fib_event->data, &fib_event->fib6_event,
887 				fib_event->event);
888 		nsim_fib6_event_fini(&fib_event->fib6_event);
889 		break;
890 	}
891 }
892 
893 static int nsim_fib4_prepare_event(struct fib_notifier_info *info,
894 				   struct nsim_fib_event *fib_event,
895 				   unsigned long event)
896 {
897 	struct nsim_fib_data *data = fib_event->data;
898 	struct fib_entry_notifier_info *fen_info;
899 	struct netlink_ext_ack *extack;
900 	int err = 0;
901 
902 	fen_info = container_of(info, struct fib_entry_notifier_info,
903 				info);
904 	fib_event->fen_info = *fen_info;
905 	extack = info->extack;
906 
907 	switch (event) {
908 	case FIB_EVENT_ENTRY_REPLACE:
909 		err = nsim_fib_account(&data->ipv4.fib, true);
910 		if (err) {
911 			NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported fib entries");
912 			return err;
913 		}
914 		break;
915 	case FIB_EVENT_ENTRY_DEL:
916 		nsim_fib_account(&data->ipv4.fib, false);
917 		break;
918 	}
919 
920 	/* Take reference on fib_info to prevent it from being
921 	 * freed while event is queued. Release it afterwards.
922 	 */
923 	fib_info_hold(fib_event->fen_info.fi);
924 
925 	return 0;
926 }
927 
928 static int nsim_fib6_prepare_event(struct fib_notifier_info *info,
929 				   struct nsim_fib_event *fib_event,
930 				   unsigned long event)
931 {
932 	struct nsim_fib_data *data = fib_event->data;
933 	struct fib6_entry_notifier_info *fen6_info;
934 	struct netlink_ext_ack *extack;
935 	int err = 0;
936 
937 	fen6_info = container_of(info, struct fib6_entry_notifier_info,
938 				 info);
939 
940 	err = nsim_fib6_event_init(&fib_event->fib6_event, fen6_info);
941 	if (err)
942 		return err;
943 
944 	extack = info->extack;
945 	switch (event) {
946 	case FIB_EVENT_ENTRY_REPLACE:
947 		err = nsim_fib_account(&data->ipv6.fib, true);
948 		if (err) {
949 			NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported fib entries");
950 			goto err_fib6_event_fini;
951 		}
952 		break;
953 	case FIB_EVENT_ENTRY_DEL:
954 		nsim_fib_account(&data->ipv6.fib, false);
955 		break;
956 	}
957 
958 	return 0;
959 
960 err_fib6_event_fini:
961 	nsim_fib6_event_fini(&fib_event->fib6_event);
962 	return err;
963 }
964 
965 static int nsim_fib_event_schedule_work(struct nsim_fib_data *data,
966 					struct fib_notifier_info *info,
967 					unsigned long event)
968 {
969 	struct nsim_fib_event *fib_event;
970 	int err;
971 
972 	if (info->family != AF_INET && info->family != AF_INET6)
973 		/* netdevsim does not support 'RTNL_FAMILY_IP6MR' and
974 		 * 'RTNL_FAMILY_IPMR' and should ignore them.
975 		 */
976 		return NOTIFY_DONE;
977 
978 	fib_event = kzalloc(sizeof(*fib_event), GFP_ATOMIC);
979 	if (!fib_event)
980 		return NOTIFY_BAD;
981 
982 	fib_event->data = data;
983 	fib_event->event = event;
984 	fib_event->family = info->family;
985 
986 	switch (info->family) {
987 	case AF_INET:
988 		err = nsim_fib4_prepare_event(info, fib_event, event);
989 		break;
990 	case AF_INET6:
991 		err = nsim_fib6_prepare_event(info, fib_event, event);
992 		break;
993 	}
994 
995 	if (err)
996 		goto err_fib_prepare_event;
997 
998 	/* Enqueue the event and trigger the work */
999 	spin_lock_bh(&data->fib_event_queue_lock);
1000 	list_add_tail(&fib_event->list, &data->fib_event_queue);
1001 	spin_unlock_bh(&data->fib_event_queue_lock);
1002 	schedule_work(&data->fib_event_work);
1003 
1004 	return NOTIFY_DONE;
1005 
1006 err_fib_prepare_event:
1007 	kfree(fib_event);
1008 	return NOTIFY_BAD;
1009 }
1010 
1011 static int nsim_fib_event_nb(struct notifier_block *nb, unsigned long event,
1012 			     void *ptr)
1013 {
1014 	struct nsim_fib_data *data = container_of(nb, struct nsim_fib_data,
1015 						  fib_nb);
1016 	struct fib_notifier_info *info = ptr;
1017 	int err;
1018 
1019 	switch (event) {
1020 	case FIB_EVENT_RULE_ADD:
1021 	case FIB_EVENT_RULE_DEL:
1022 		err = nsim_fib_rule_event(data, info,
1023 					  event == FIB_EVENT_RULE_ADD);
1024 		return notifier_from_errno(err);
1025 	case FIB_EVENT_ENTRY_REPLACE:
1026 	case FIB_EVENT_ENTRY_APPEND:
1027 	case FIB_EVENT_ENTRY_DEL:
1028 		return nsim_fib_event_schedule_work(data, info, event);
1029 	}
1030 
1031 	return NOTIFY_DONE;
1032 }
1033 
1034 static void nsim_fib4_rt_free(struct nsim_fib_rt *fib_rt,
1035 			      struct nsim_fib_data *data)
1036 {
1037 	struct devlink *devlink = data->devlink;
1038 	struct nsim_fib4_rt *fib4_rt;
1039 
1040 	fib4_rt = container_of(fib_rt, struct nsim_fib4_rt, common);
1041 	nsim_fib4_rt_hw_flags_set(devlink_net(devlink), fib4_rt, false);
1042 	nsim_fib_account(&data->ipv4.fib, false);
1043 	nsim_fib4_rt_destroy(fib4_rt);
1044 }
1045 
1046 static void nsim_fib6_rt_free(struct nsim_fib_rt *fib_rt,
1047 			      struct nsim_fib_data *data)
1048 {
1049 	struct nsim_fib6_rt *fib6_rt;
1050 
1051 	fib6_rt = container_of(fib_rt, struct nsim_fib6_rt, common);
1052 	nsim_fib6_rt_hw_flags_set(data, fib6_rt, false);
1053 	nsim_fib_account(&data->ipv6.fib, false);
1054 	nsim_fib6_rt_destroy(fib6_rt);
1055 }
1056 
1057 static void nsim_fib_rt_free(void *ptr, void *arg)
1058 {
1059 	struct nsim_fib_rt *fib_rt = ptr;
1060 	struct nsim_fib_data *data = arg;
1061 
1062 	switch (fib_rt->key.family) {
1063 	case AF_INET:
1064 		nsim_fib4_rt_free(fib_rt, data);
1065 		break;
1066 	case AF_INET6:
1067 		nsim_fib6_rt_free(fib_rt, data);
1068 		break;
1069 	default:
1070 		WARN_ON_ONCE(1);
1071 	}
1072 }
1073 
1074 /* inconsistent dump, trying again */
1075 static void nsim_fib_dump_inconsistent(struct notifier_block *nb)
1076 {
1077 	struct nsim_fib_data *data = container_of(nb, struct nsim_fib_data,
1078 						  fib_nb);
1079 	struct nsim_fib_rt *fib_rt, *fib_rt_tmp;
1080 
1081 	/* Flush the work to make sure there is no race with notifications. */
1082 	flush_work(&data->fib_event_work);
1083 
1084 	/* The notifier block is still not registered, so we do not need to
1085 	 * take any locks here.
1086 	 */
1087 	list_for_each_entry_safe(fib_rt, fib_rt_tmp, &data->fib_rt_list, list) {
1088 		rhashtable_remove_fast(&data->fib_rt_ht, &fib_rt->ht_node,
1089 				       nsim_fib_rt_ht_params);
1090 		nsim_fib_rt_free(fib_rt, data);
1091 	}
1092 
1093 	atomic64_set(&data->ipv4.rules.num, 0ULL);
1094 	atomic64_set(&data->ipv6.rules.num, 0ULL);
1095 }
1096 
1097 static struct nsim_nexthop *nsim_nexthop_create(struct nsim_fib_data *data,
1098 						struct nh_notifier_info *info)
1099 {
1100 	struct nsim_nexthop *nexthop;
1101 	u64 occ = 0;
1102 	int i;
1103 
1104 	nexthop = kzalloc(sizeof(*nexthop), GFP_KERNEL);
1105 	if (!nexthop)
1106 		return ERR_PTR(-ENOMEM);
1107 
1108 	nexthop->id = info->id;
1109 
1110 	/* Determine the number of nexthop entries the new nexthop will
1111 	 * occupy.
1112 	 */
1113 
1114 	switch (info->type) {
1115 	case NH_NOTIFIER_INFO_TYPE_SINGLE:
1116 		occ = 1;
1117 		break;
1118 	case NH_NOTIFIER_INFO_TYPE_GRP:
1119 		for (i = 0; i < info->nh_grp->num_nh; i++)
1120 			occ += info->nh_grp->nh_entries[i].weight;
1121 		break;
1122 	case NH_NOTIFIER_INFO_TYPE_RES_TABLE:
1123 		occ = info->nh_res_table->num_nh_buckets;
1124 		nexthop->is_resilient = true;
1125 		break;
1126 	default:
1127 		NL_SET_ERR_MSG_MOD(info->extack, "Unsupported nexthop type");
1128 		kfree(nexthop);
1129 		return ERR_PTR(-EOPNOTSUPP);
1130 	}
1131 
1132 	nexthop->occ = occ;
1133 	return nexthop;
1134 }
1135 
1136 static void nsim_nexthop_destroy(struct nsim_nexthop *nexthop)
1137 {
1138 	kfree(nexthop);
1139 }
1140 
1141 static int nsim_nexthop_account(struct nsim_fib_data *data, u64 occ,
1142 				bool add, struct netlink_ext_ack *extack)
1143 {
1144 	int i, err = 0;
1145 
1146 	if (add) {
1147 		for (i = 0; i < occ; i++)
1148 			if (!atomic64_add_unless(&data->nexthops.num, 1,
1149 						 data->nexthops.max)) {
1150 				err = -ENOSPC;
1151 				NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported nexthops");
1152 				goto err_num_decrease;
1153 			}
1154 	} else {
1155 		if (WARN_ON(occ > atomic64_read(&data->nexthops.num)))
1156 			return -EINVAL;
1157 		atomic64_sub(occ, &data->nexthops.num);
1158 	}
1159 
1160 	return err;
1161 
1162 err_num_decrease:
1163 	atomic64_sub(i, &data->nexthops.num);
1164 	return err;
1165 
1166 }
1167 
1168 static void nsim_nexthop_hw_flags_set(struct net *net,
1169 				      const struct nsim_nexthop *nexthop,
1170 				      bool trap)
1171 {
1172 	int i;
1173 
1174 	nexthop_set_hw_flags(net, nexthop->id, false, trap);
1175 
1176 	if (!nexthop->is_resilient)
1177 		return;
1178 
1179 	for (i = 0; i < nexthop->occ; i++)
1180 		nexthop_bucket_set_hw_flags(net, nexthop->id, i, false, trap);
1181 }
1182 
1183 static int nsim_nexthop_add(struct nsim_fib_data *data,
1184 			    struct nsim_nexthop *nexthop,
1185 			    struct netlink_ext_ack *extack)
1186 {
1187 	struct net *net = devlink_net(data->devlink);
1188 	int err;
1189 
1190 	err = nsim_nexthop_account(data, nexthop->occ, true, extack);
1191 	if (err)
1192 		return err;
1193 
1194 	err = rhashtable_insert_fast(&data->nexthop_ht, &nexthop->ht_node,
1195 				     nsim_nexthop_ht_params);
1196 	if (err) {
1197 		NL_SET_ERR_MSG_MOD(extack, "Failed to insert nexthop");
1198 		goto err_nexthop_dismiss;
1199 	}
1200 
1201 	nsim_nexthop_hw_flags_set(net, nexthop, true);
1202 
1203 	return 0;
1204 
1205 err_nexthop_dismiss:
1206 	nsim_nexthop_account(data, nexthop->occ, false, extack);
1207 	return err;
1208 }
1209 
1210 static int nsim_nexthop_replace(struct nsim_fib_data *data,
1211 				struct nsim_nexthop *nexthop,
1212 				struct nsim_nexthop *nexthop_old,
1213 				struct netlink_ext_ack *extack)
1214 {
1215 	struct net *net = devlink_net(data->devlink);
1216 	int err;
1217 
1218 	err = nsim_nexthop_account(data, nexthop->occ, true, extack);
1219 	if (err)
1220 		return err;
1221 
1222 	err = rhashtable_replace_fast(&data->nexthop_ht,
1223 				      &nexthop_old->ht_node, &nexthop->ht_node,
1224 				      nsim_nexthop_ht_params);
1225 	if (err) {
1226 		NL_SET_ERR_MSG_MOD(extack, "Failed to replace nexthop");
1227 		goto err_nexthop_dismiss;
1228 	}
1229 
1230 	nsim_nexthop_hw_flags_set(net, nexthop, true);
1231 	nsim_nexthop_account(data, nexthop_old->occ, false, extack);
1232 	nsim_nexthop_destroy(nexthop_old);
1233 
1234 	return 0;
1235 
1236 err_nexthop_dismiss:
1237 	nsim_nexthop_account(data, nexthop->occ, false, extack);
1238 	return err;
1239 }
1240 
1241 static int nsim_nexthop_insert(struct nsim_fib_data *data,
1242 			       struct nh_notifier_info *info)
1243 {
1244 	struct nsim_nexthop *nexthop, *nexthop_old;
1245 	int err;
1246 
1247 	nexthop = nsim_nexthop_create(data, info);
1248 	if (IS_ERR(nexthop))
1249 		return PTR_ERR(nexthop);
1250 
1251 	nexthop_old = rhashtable_lookup_fast(&data->nexthop_ht, &info->id,
1252 					     nsim_nexthop_ht_params);
1253 	if (!nexthop_old)
1254 		err = nsim_nexthop_add(data, nexthop, info->extack);
1255 	else
1256 		err = nsim_nexthop_replace(data, nexthop, nexthop_old,
1257 					   info->extack);
1258 
1259 	if (err)
1260 		nsim_nexthop_destroy(nexthop);
1261 
1262 	return err;
1263 }
1264 
1265 static void nsim_nexthop_remove(struct nsim_fib_data *data,
1266 				struct nh_notifier_info *info)
1267 {
1268 	struct nsim_nexthop *nexthop;
1269 
1270 	nexthop = rhashtable_lookup_fast(&data->nexthop_ht, &info->id,
1271 					 nsim_nexthop_ht_params);
1272 	if (!nexthop)
1273 		return;
1274 
1275 	rhashtable_remove_fast(&data->nexthop_ht, &nexthop->ht_node,
1276 			       nsim_nexthop_ht_params);
1277 	nsim_nexthop_account(data, nexthop->occ, false, info->extack);
1278 	nsim_nexthop_destroy(nexthop);
1279 }
1280 
1281 static int nsim_nexthop_res_table_pre_replace(struct nsim_fib_data *data,
1282 					      struct nh_notifier_info *info)
1283 {
1284 	if (data->fail_res_nexthop_group_replace) {
1285 		NL_SET_ERR_MSG_MOD(info->extack, "Failed to replace a resilient nexthop group");
1286 		return -EINVAL;
1287 	}
1288 
1289 	return 0;
1290 }
1291 
1292 static int nsim_nexthop_bucket_replace(struct nsim_fib_data *data,
1293 				       struct nh_notifier_info *info)
1294 {
1295 	if (data->fail_nexthop_bucket_replace) {
1296 		NL_SET_ERR_MSG_MOD(info->extack, "Failed to replace nexthop bucket");
1297 		return -EINVAL;
1298 	}
1299 
1300 	nexthop_bucket_set_hw_flags(info->net, info->id,
1301 				    info->nh_res_bucket->bucket_index,
1302 				    false, true);
1303 
1304 	return 0;
1305 }
1306 
1307 static int nsim_nexthop_event_nb(struct notifier_block *nb, unsigned long event,
1308 				 void *ptr)
1309 {
1310 	struct nsim_fib_data *data = container_of(nb, struct nsim_fib_data,
1311 						  nexthop_nb);
1312 	struct nh_notifier_info *info = ptr;
1313 	int err = 0;
1314 
1315 	mutex_lock(&data->nh_lock);
1316 	switch (event) {
1317 	case NEXTHOP_EVENT_REPLACE:
1318 		err = nsim_nexthop_insert(data, info);
1319 		break;
1320 	case NEXTHOP_EVENT_DEL:
1321 		nsim_nexthop_remove(data, info);
1322 		break;
1323 	case NEXTHOP_EVENT_RES_TABLE_PRE_REPLACE:
1324 		err = nsim_nexthop_res_table_pre_replace(data, info);
1325 		break;
1326 	case NEXTHOP_EVENT_BUCKET_REPLACE:
1327 		err = nsim_nexthop_bucket_replace(data, info);
1328 		break;
1329 	default:
1330 		break;
1331 	}
1332 
1333 	mutex_unlock(&data->nh_lock);
1334 	return notifier_from_errno(err);
1335 }
1336 
1337 static void nsim_nexthop_free(void *ptr, void *arg)
1338 {
1339 	struct nsim_nexthop *nexthop = ptr;
1340 	struct nsim_fib_data *data = arg;
1341 	struct net *net;
1342 
1343 	net = devlink_net(data->devlink);
1344 	nsim_nexthop_hw_flags_set(net, nexthop, false);
1345 	nsim_nexthop_account(data, nexthop->occ, false, NULL);
1346 	nsim_nexthop_destroy(nexthop);
1347 }
1348 
1349 static ssize_t nsim_nexthop_bucket_activity_write(struct file *file,
1350 						  const char __user *user_buf,
1351 						  size_t size, loff_t *ppos)
1352 {
1353 	struct nsim_fib_data *data = file->private_data;
1354 	struct net *net = devlink_net(data->devlink);
1355 	struct nsim_nexthop *nexthop;
1356 	unsigned long *activity;
1357 	loff_t pos = *ppos;
1358 	u16 bucket_index;
1359 	char buf[128];
1360 	int err = 0;
1361 	u32 nhid;
1362 
1363 	if (pos != 0)
1364 		return -EINVAL;
1365 	if (size > sizeof(buf))
1366 		return -EINVAL;
1367 	if (copy_from_user(buf, user_buf, size))
1368 		return -EFAULT;
1369 	if (sscanf(buf, "%u %hu", &nhid, &bucket_index) != 2)
1370 		return -EINVAL;
1371 
1372 	rtnl_lock();
1373 
1374 	nexthop = rhashtable_lookup_fast(&data->nexthop_ht, &nhid,
1375 					 nsim_nexthop_ht_params);
1376 	if (!nexthop || !nexthop->is_resilient ||
1377 	    bucket_index >= nexthop->occ) {
1378 		err = -EINVAL;
1379 		goto out;
1380 	}
1381 
1382 	activity = bitmap_zalloc(nexthop->occ, GFP_KERNEL);
1383 	if (!activity) {
1384 		err = -ENOMEM;
1385 		goto out;
1386 	}
1387 
1388 	bitmap_set(activity, bucket_index, 1);
1389 	nexthop_res_grp_activity_update(net, nhid, nexthop->occ, activity);
1390 	bitmap_free(activity);
1391 
1392 out:
1393 	rtnl_unlock();
1394 
1395 	*ppos = size;
1396 	return err ?: size;
1397 }
1398 
1399 static const struct file_operations nsim_nexthop_bucket_activity_fops = {
1400 	.open = simple_open,
1401 	.write = nsim_nexthop_bucket_activity_write,
1402 	.llseek = no_llseek,
1403 	.owner = THIS_MODULE,
1404 };
1405 
1406 static u64 nsim_fib_ipv4_resource_occ_get(void *priv)
1407 {
1408 	struct nsim_fib_data *data = priv;
1409 
1410 	return nsim_fib_get_val(data, NSIM_RESOURCE_IPV4_FIB, false);
1411 }
1412 
1413 static u64 nsim_fib_ipv4_rules_res_occ_get(void *priv)
1414 {
1415 	struct nsim_fib_data *data = priv;
1416 
1417 	return nsim_fib_get_val(data, NSIM_RESOURCE_IPV4_FIB_RULES, false);
1418 }
1419 
1420 static u64 nsim_fib_ipv6_resource_occ_get(void *priv)
1421 {
1422 	struct nsim_fib_data *data = priv;
1423 
1424 	return nsim_fib_get_val(data, NSIM_RESOURCE_IPV6_FIB, false);
1425 }
1426 
1427 static u64 nsim_fib_ipv6_rules_res_occ_get(void *priv)
1428 {
1429 	struct nsim_fib_data *data = priv;
1430 
1431 	return nsim_fib_get_val(data, NSIM_RESOURCE_IPV6_FIB_RULES, false);
1432 }
1433 
1434 static u64 nsim_fib_nexthops_res_occ_get(void *priv)
1435 {
1436 	struct nsim_fib_data *data = priv;
1437 
1438 	return nsim_fib_get_val(data, NSIM_RESOURCE_NEXTHOPS, false);
1439 }
1440 
1441 static void nsim_fib_set_max_all(struct nsim_fib_data *data,
1442 				 struct devlink *devlink)
1443 {
1444 	enum nsim_resource_id res_ids[] = {
1445 		NSIM_RESOURCE_IPV4_FIB, NSIM_RESOURCE_IPV4_FIB_RULES,
1446 		NSIM_RESOURCE_IPV6_FIB, NSIM_RESOURCE_IPV6_FIB_RULES,
1447 		NSIM_RESOURCE_NEXTHOPS,
1448 	};
1449 	int i;
1450 
1451 	for (i = 0; i < ARRAY_SIZE(res_ids); i++) {
1452 		int err;
1453 		u64 val;
1454 
1455 		err = devlink_resource_size_get(devlink, res_ids[i], &val);
1456 		if (err)
1457 			val = (u64) -1;
1458 		nsim_fib_set_max(data, res_ids[i], val);
1459 	}
1460 }
1461 
1462 static void nsim_fib_event_work(struct work_struct *work)
1463 {
1464 	struct nsim_fib_data *data = container_of(work, struct nsim_fib_data,
1465 						  fib_event_work);
1466 	struct nsim_fib_event *fib_event, *next_fib_event;
1467 
1468 	LIST_HEAD(fib_event_queue);
1469 
1470 	spin_lock_bh(&data->fib_event_queue_lock);
1471 	list_splice_init(&data->fib_event_queue, &fib_event_queue);
1472 	spin_unlock_bh(&data->fib_event_queue_lock);
1473 
1474 	mutex_lock(&data->fib_lock);
1475 	list_for_each_entry_safe(fib_event, next_fib_event, &fib_event_queue,
1476 				 list) {
1477 		nsim_fib_event(fib_event);
1478 		list_del(&fib_event->list);
1479 		kfree(fib_event);
1480 		cond_resched();
1481 	}
1482 	mutex_unlock(&data->fib_lock);
1483 }
1484 
1485 static int
1486 nsim_fib_debugfs_init(struct nsim_fib_data *data, struct nsim_dev *nsim_dev)
1487 {
1488 	data->ddir = debugfs_create_dir("fib", nsim_dev->ddir);
1489 	if (IS_ERR(data->ddir))
1490 		return PTR_ERR(data->ddir);
1491 
1492 	data->fail_route_offload = false;
1493 	debugfs_create_bool("fail_route_offload", 0600, data->ddir,
1494 			    &data->fail_route_offload);
1495 
1496 	data->fail_res_nexthop_group_replace = false;
1497 	debugfs_create_bool("fail_res_nexthop_group_replace", 0600, data->ddir,
1498 			    &data->fail_res_nexthop_group_replace);
1499 
1500 	data->fail_nexthop_bucket_replace = false;
1501 	debugfs_create_bool("fail_nexthop_bucket_replace", 0600, data->ddir,
1502 			    &data->fail_nexthop_bucket_replace);
1503 
1504 	debugfs_create_file("nexthop_bucket_activity", 0200, data->ddir,
1505 			    data, &nsim_nexthop_bucket_activity_fops);
1506 	return 0;
1507 }
1508 
1509 static void nsim_fib_debugfs_exit(struct nsim_fib_data *data)
1510 {
1511 	debugfs_remove_recursive(data->ddir);
1512 }
1513 
1514 struct nsim_fib_data *nsim_fib_create(struct devlink *devlink,
1515 				      struct netlink_ext_ack *extack)
1516 {
1517 	struct nsim_fib_data *data;
1518 	struct nsim_dev *nsim_dev;
1519 	int err;
1520 
1521 	data = kzalloc(sizeof(*data), GFP_KERNEL);
1522 	if (!data)
1523 		return ERR_PTR(-ENOMEM);
1524 	data->devlink = devlink;
1525 
1526 	nsim_dev = devlink_priv(devlink);
1527 	err = nsim_fib_debugfs_init(data, nsim_dev);
1528 	if (err)
1529 		goto err_data_free;
1530 
1531 	mutex_init(&data->nh_lock);
1532 	err = rhashtable_init(&data->nexthop_ht, &nsim_nexthop_ht_params);
1533 	if (err)
1534 		goto err_debugfs_exit;
1535 
1536 	mutex_init(&data->fib_lock);
1537 	INIT_LIST_HEAD(&data->fib_rt_list);
1538 	err = rhashtable_init(&data->fib_rt_ht, &nsim_fib_rt_ht_params);
1539 	if (err)
1540 		goto err_rhashtable_nexthop_destroy;
1541 
1542 	INIT_WORK(&data->fib_event_work, nsim_fib_event_work);
1543 	INIT_LIST_HEAD(&data->fib_event_queue);
1544 	spin_lock_init(&data->fib_event_queue_lock);
1545 
1546 	nsim_fib_set_max_all(data, devlink);
1547 
1548 	data->nexthop_nb.notifier_call = nsim_nexthop_event_nb;
1549 	err = register_nexthop_notifier(devlink_net(devlink), &data->nexthop_nb,
1550 					extack);
1551 	if (err) {
1552 		pr_err("Failed to register nexthop notifier\n");
1553 		goto err_rhashtable_fib_destroy;
1554 	}
1555 
1556 	data->fib_nb.notifier_call = nsim_fib_event_nb;
1557 	err = register_fib_notifier(devlink_net(devlink), &data->fib_nb,
1558 				    nsim_fib_dump_inconsistent, extack);
1559 	if (err) {
1560 		pr_err("Failed to register fib notifier\n");
1561 		goto err_nexthop_nb_unregister;
1562 	}
1563 
1564 	devlink_resource_occ_get_register(devlink,
1565 					  NSIM_RESOURCE_IPV4_FIB,
1566 					  nsim_fib_ipv4_resource_occ_get,
1567 					  data);
1568 	devlink_resource_occ_get_register(devlink,
1569 					  NSIM_RESOURCE_IPV4_FIB_RULES,
1570 					  nsim_fib_ipv4_rules_res_occ_get,
1571 					  data);
1572 	devlink_resource_occ_get_register(devlink,
1573 					  NSIM_RESOURCE_IPV6_FIB,
1574 					  nsim_fib_ipv6_resource_occ_get,
1575 					  data);
1576 	devlink_resource_occ_get_register(devlink,
1577 					  NSIM_RESOURCE_IPV6_FIB_RULES,
1578 					  nsim_fib_ipv6_rules_res_occ_get,
1579 					  data);
1580 	devlink_resource_occ_get_register(devlink,
1581 					  NSIM_RESOURCE_NEXTHOPS,
1582 					  nsim_fib_nexthops_res_occ_get,
1583 					  data);
1584 	return data;
1585 
1586 err_nexthop_nb_unregister:
1587 	unregister_nexthop_notifier(devlink_net(devlink), &data->nexthop_nb);
1588 err_rhashtable_fib_destroy:
1589 	flush_work(&data->fib_event_work);
1590 	rhashtable_free_and_destroy(&data->fib_rt_ht, nsim_fib_rt_free,
1591 				    data);
1592 err_rhashtable_nexthop_destroy:
1593 	rhashtable_free_and_destroy(&data->nexthop_ht, nsim_nexthop_free,
1594 				    data);
1595 	mutex_destroy(&data->fib_lock);
1596 err_debugfs_exit:
1597 	mutex_destroy(&data->nh_lock);
1598 	nsim_fib_debugfs_exit(data);
1599 err_data_free:
1600 	kfree(data);
1601 	return ERR_PTR(err);
1602 }
1603 
1604 void nsim_fib_destroy(struct devlink *devlink, struct nsim_fib_data *data)
1605 {
1606 	devlink_resource_occ_get_unregister(devlink,
1607 					    NSIM_RESOURCE_NEXTHOPS);
1608 	devlink_resource_occ_get_unregister(devlink,
1609 					    NSIM_RESOURCE_IPV6_FIB_RULES);
1610 	devlink_resource_occ_get_unregister(devlink,
1611 					    NSIM_RESOURCE_IPV6_FIB);
1612 	devlink_resource_occ_get_unregister(devlink,
1613 					    NSIM_RESOURCE_IPV4_FIB_RULES);
1614 	devlink_resource_occ_get_unregister(devlink,
1615 					    NSIM_RESOURCE_IPV4_FIB);
1616 	unregister_fib_notifier(devlink_net(devlink), &data->fib_nb);
1617 	unregister_nexthop_notifier(devlink_net(devlink), &data->nexthop_nb);
1618 	flush_work(&data->fib_event_work);
1619 	rhashtable_free_and_destroy(&data->fib_rt_ht, nsim_fib_rt_free,
1620 				    data);
1621 	rhashtable_free_and_destroy(&data->nexthop_ht, nsim_nexthop_free,
1622 				    data);
1623 	WARN_ON_ONCE(!list_empty(&data->fib_event_queue));
1624 	WARN_ON_ONCE(!list_empty(&data->fib_rt_list));
1625 	mutex_destroy(&data->fib_lock);
1626 	mutex_destroy(&data->nh_lock);
1627 	nsim_fib_debugfs_exit(data);
1628 	kfree(data);
1629 }
1630