// SPDX-License-Identifier: BSD-3-Clause OR GPL-2.0
/* Copyright (c) 2016-2018 Mellanox Technologies. All rights reserved */

#include <linux/kernel.h>
#include <linux/types.h>
#include <linux/rhashtable.h>
#include <linux/bitops.h>
#include <linux/in6.h>
#include <linux/notifier.h>
#include <linux/inetdevice.h>
#include <linux/netdevice.h>
#include <linux/if_bridge.h>
#include <linux/socket.h>
#include <linux/route.h>
#include <linux/gcd.h>
#include <linux/if_macvlan.h>
#include <linux/refcount.h>
#include <linux/jhash.h>
#include <linux/net_namespace.h>
#include <linux/mutex.h>
#include <net/netevent.h>
#include <net/neighbour.h>
#include <net/arp.h>
#include <net/inet_dscp.h>
#include <net/ip_fib.h>
#include <net/ip6_fib.h>
#include <net/nexthop.h>
#include <net/fib_rules.h>
#include <net/ip_tunnels.h>
#include <net/l3mdev.h>
#include <net/addrconf.h>
#include <net/ndisc.h>
#include <net/ipv6.h>
#include <net/fib_notifier.h>
#include <net/switchdev.h>

#include "spectrum.h"
#include "core.h"
#include "reg.h"
#include "spectrum_cnt.h"
#include "spectrum_dpipe.h"
#include "spectrum_ipip.h"
#include "spectrum_mr.h"
#include "spectrum_mr_tcam.h"
#include "spectrum_router.h"
#include "spectrum_span.h"

struct mlxsw_sp_fib;
struct mlxsw_sp_vr;
struct mlxsw_sp_lpm_tree;
struct mlxsw_sp_rif_ops;

struct mlxsw_sp_rif {
	struct list_head nexthop_list;
	struct list_head neigh_list;
	struct net_device *dev; /* NULL for underlay RIF */
	struct mlxsw_sp_fid *fid;
	unsigned char addr[ETH_ALEN];
	int mtu;
	u16 rif_index;
	u8 mac_profile_id;
	u16 vr_id;
	const struct mlxsw_sp_rif_ops *ops;
	struct mlxsw_sp *mlxsw_sp;

	unsigned int counter_ingress;
	bool counter_ingress_valid;
	unsigned int counter_egress;
	bool counter_egress_valid;
};

struct mlxsw_sp_rif_params {
	struct net_device *dev;
	union {
		u16 system_port;
		u16 lag_id;
	};
	u16 vid;
	bool lag;
};

struct mlxsw_sp_rif_subport {
	struct mlxsw_sp_rif common;
	refcount_t ref_count;
	union {
		u16 system_port;
		u16 lag_id;
	};
	u16 vid;
	bool lag;
};

struct mlxsw_sp_rif_ipip_lb {
	struct mlxsw_sp_rif common;
	struct mlxsw_sp_rif_ipip_lb_config lb_config;
	u16 ul_vr_id;	/* Reserved for Spectrum-2. */
	u16 ul_rif_id;	/* Reserved for Spectrum. */
};
struct mlxsw_sp_rif_params_ipip_lb {
	struct mlxsw_sp_rif_params common;
	struct mlxsw_sp_rif_ipip_lb_config lb_config;
};

struct mlxsw_sp_rif_ops {
	enum mlxsw_sp_rif_type type;
	size_t rif_size;

	void (*setup)(struct mlxsw_sp_rif *rif,
		      const struct mlxsw_sp_rif_params *params);
	int (*configure)(struct mlxsw_sp_rif *rif,
			 struct netlink_ext_ack *extack);
	void (*deconfigure)(struct mlxsw_sp_rif *rif);
	struct mlxsw_sp_fid * (*fid_get)(struct mlxsw_sp_rif *rif,
					 struct netlink_ext_ack *extack);
	void (*fdb_del)(struct mlxsw_sp_rif *rif, const char *mac);
};

struct mlxsw_sp_rif_mac_profile {
	unsigned char mac_prefix[ETH_ALEN];
	refcount_t ref_count;
	u8 id;
};

struct mlxsw_sp_router_ops {
	int (*init)(struct mlxsw_sp *mlxsw_sp);
	int (*ipips_init)(struct mlxsw_sp *mlxsw_sp);
};

static struct mlxsw_sp_rif *
mlxsw_sp_rif_find_by_dev(const struct mlxsw_sp *mlxsw_sp,
			 const struct net_device *dev);
static void mlxsw_sp_rif_destroy(struct mlxsw_sp_rif *rif);
static void mlxsw_sp_lpm_tree_hold(struct mlxsw_sp_lpm_tree *lpm_tree);
static void mlxsw_sp_lpm_tree_put(struct mlxsw_sp *mlxsw_sp,
				  struct mlxsw_sp_lpm_tree *lpm_tree);
static int mlxsw_sp_vr_lpm_tree_bind(struct mlxsw_sp *mlxsw_sp,
				     const struct mlxsw_sp_fib *fib,
				     u8 tree_id);
static int mlxsw_sp_vr_lpm_tree_unbind(struct mlxsw_sp *mlxsw_sp,
				       const struct mlxsw_sp_fib *fib);

static unsigned int *
mlxsw_sp_rif_p_counter_get(struct mlxsw_sp_rif *rif,
			   enum mlxsw_sp_rif_counter_dir dir)
{
	switch (dir) {
	case MLXSW_SP_RIF_COUNTER_EGRESS:
		return &rif->counter_egress;
	case MLXSW_SP_RIF_COUNTER_INGRESS:
		return &rif->counter_ingress;
	}
	return NULL;
}

static bool
mlxsw_sp_rif_counter_valid_get(struct mlxsw_sp_rif *rif,
			       enum mlxsw_sp_rif_counter_dir dir)
{
	switch (dir) {
	case MLXSW_SP_RIF_COUNTER_EGRESS:
		return rif->counter_egress_valid;
	case MLXSW_SP_RIF_COUNTER_INGRESS:
		return rif->counter_ingress_valid;
	}
	return false;
}

static void
mlxsw_sp_rif_counter_valid_set(struct mlxsw_sp_rif *rif,
			       enum mlxsw_sp_rif_counter_dir dir,
			       bool valid)
{
	switch (dir) {
	case MLXSW_SP_RIF_COUNTER_EGRESS:
		rif->counter_egress_valid = valid;
		break;
	case MLXSW_SP_RIF_COUNTER_INGRESS:
		rif->counter_ingress_valid = valid;
		break;
	}
}

static int mlxsw_sp_rif_counter_edit(struct mlxsw_sp *mlxsw_sp, u16 rif_index,
				     unsigned int counter_index, bool enable,
				     enum mlxsw_sp_rif_counter_dir dir)
{
	char ritr_pl[MLXSW_REG_RITR_LEN];
	bool is_egress = false;
	int err;

	if (dir == MLXSW_SP_RIF_COUNTER_EGRESS)
		is_egress = true;
	mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index);
	err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
	if (err)
		return err;

	mlxsw_reg_ritr_counter_pack(ritr_pl, counter_index, enable,
				    is_egress);
	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
}
int mlxsw_sp_rif_counter_value_get(struct mlxsw_sp *mlxsw_sp,
				   struct mlxsw_sp_rif *rif,
				   enum mlxsw_sp_rif_counter_dir dir, u64 *cnt)
{
	char ricnt_pl[MLXSW_REG_RICNT_LEN];
	unsigned int *p_counter_index;
	bool valid;
	int err;

	valid = mlxsw_sp_rif_counter_valid_get(rif, dir);
	if (!valid)
		return -EINVAL;

	p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
	if (!p_counter_index)
		return -EINVAL;
	mlxsw_reg_ricnt_pack(ricnt_pl, *p_counter_index,
			     MLXSW_REG_RICNT_OPCODE_NOP);
	err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
	if (err)
		return err;
	*cnt = mlxsw_reg_ricnt_good_unicast_packets_get(ricnt_pl);
	return 0;
}

struct mlxsw_sp_rif_counter_set_basic {
	u64 good_unicast_packets;
	u64 good_multicast_packets;
	u64 good_broadcast_packets;
	u64 good_unicast_bytes;
	u64 good_multicast_bytes;
	u64 good_broadcast_bytes;
	u64 error_packets;
	u64 discard_packets;
	u64 error_bytes;
	u64 discard_bytes;
};

static int
mlxsw_sp_rif_counter_fetch_clear(struct mlxsw_sp_rif *rif,
				 enum mlxsw_sp_rif_counter_dir dir,
				 struct mlxsw_sp_rif_counter_set_basic *set)
{
	struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
	char ricnt_pl[MLXSW_REG_RICNT_LEN];
	unsigned int *p_counter_index;
	int err;

	if (!mlxsw_sp_rif_counter_valid_get(rif, dir))
		return -EINVAL;

	p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
	if (!p_counter_index)
		return -EINVAL;

	mlxsw_reg_ricnt_pack(ricnt_pl, *p_counter_index,
			     MLXSW_REG_RICNT_OPCODE_CLEAR);
	err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
	if (err)
		return err;

	if (!set)
		return 0;

#define MLXSW_SP_RIF_COUNTER_EXTRACT(NAME)				\
		(set->NAME = mlxsw_reg_ricnt_ ## NAME ## _get(ricnt_pl))

	MLXSW_SP_RIF_COUNTER_EXTRACT(good_unicast_packets);
	MLXSW_SP_RIF_COUNTER_EXTRACT(good_multicast_packets);
	MLXSW_SP_RIF_COUNTER_EXTRACT(good_broadcast_packets);
	MLXSW_SP_RIF_COUNTER_EXTRACT(good_unicast_bytes);
	MLXSW_SP_RIF_COUNTER_EXTRACT(good_multicast_bytes);
	MLXSW_SP_RIF_COUNTER_EXTRACT(good_broadcast_bytes);
	MLXSW_SP_RIF_COUNTER_EXTRACT(error_packets);
	MLXSW_SP_RIF_COUNTER_EXTRACT(discard_packets);
	MLXSW_SP_RIF_COUNTER_EXTRACT(error_bytes);
	MLXSW_SP_RIF_COUNTER_EXTRACT(discard_bytes);

#undef MLXSW_SP_RIF_COUNTER_EXTRACT

	return 0;
}

static int mlxsw_sp_rif_counter_clear(struct mlxsw_sp *mlxsw_sp,
				      unsigned int counter_index)
{
	char ricnt_pl[MLXSW_REG_RICNT_LEN];

	mlxsw_reg_ricnt_pack(ricnt_pl, counter_index,
			     MLXSW_REG_RICNT_OPCODE_CLEAR);
	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ricnt), ricnt_pl);
}

int mlxsw_sp_rif_counter_alloc(struct mlxsw_sp_rif *rif,
			       enum mlxsw_sp_rif_counter_dir dir)
{
	struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
	unsigned int *p_counter_index;
	int err;

	if (mlxsw_sp_rif_counter_valid_get(rif, dir))
		return 0;

	p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
	if (!p_counter_index)
		return -EINVAL;

	err = mlxsw_sp_counter_alloc(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
				     p_counter_index);
	if (err)
		return err;

	err = mlxsw_sp_rif_counter_clear(mlxsw_sp, *p_counter_index);
	if (err)
		goto err_counter_clear;

	err = mlxsw_sp_rif_counter_edit(mlxsw_sp, rif->rif_index,
					*p_counter_index, true, dir);
	if (err)
		goto err_counter_edit;
	mlxsw_sp_rif_counter_valid_set(rif, dir, true);
	return 0;

err_counter_edit:
err_counter_clear:
	mlxsw_sp_counter_free(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
			      *p_counter_index);
	return err;
}
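/* Illustrative sketch, not part of the driver: the typical lifecycle of a
 * RIF counter built from the helpers above, assuming a valid 'rif' whose
 * device supports RIF counters:
 *
 *	u64 packets;
 *	int err;
 *
 *	err = mlxsw_sp_rif_counter_alloc(rif, MLXSW_SP_RIF_COUNTER_EGRESS);
 *	if (!err) {
 *		err = mlxsw_sp_rif_counter_value_get(rif->mlxsw_sp, rif,
 *						     MLXSW_SP_RIF_COUNTER_EGRESS,
 *						     &packets);
 *		mlxsw_sp_rif_counter_free(rif, MLXSW_SP_RIF_COUNTER_EGRESS);
 *	}
 */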
void mlxsw_sp_rif_counter_free(struct mlxsw_sp_rif *rif,
			       enum mlxsw_sp_rif_counter_dir dir)
{
	struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
	unsigned int *p_counter_index;

	if (!mlxsw_sp_rif_counter_valid_get(rif, dir))
		return;

	p_counter_index = mlxsw_sp_rif_p_counter_get(rif, dir);
	if (WARN_ON(!p_counter_index))
		return;
	mlxsw_sp_rif_counter_edit(mlxsw_sp, rif->rif_index,
				  *p_counter_index, false, dir);
	mlxsw_sp_counter_free(mlxsw_sp, MLXSW_SP_COUNTER_SUB_POOL_RIF,
			      *p_counter_index);
	mlxsw_sp_rif_counter_valid_set(rif, dir, false);
}

static void mlxsw_sp_rif_counters_alloc(struct mlxsw_sp_rif *rif)
{
	struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
	struct devlink *devlink;

	devlink = priv_to_devlink(mlxsw_sp->core);
	if (!devlink_dpipe_table_counter_enabled(devlink,
						 MLXSW_SP_DPIPE_TABLE_NAME_ERIF))
		return;
	mlxsw_sp_rif_counter_alloc(rif, MLXSW_SP_RIF_COUNTER_EGRESS);
}

static void mlxsw_sp_rif_counters_free(struct mlxsw_sp_rif *rif)
{
	mlxsw_sp_rif_counter_free(rif, MLXSW_SP_RIF_COUNTER_EGRESS);
}

#define MLXSW_SP_PREFIX_COUNT (sizeof(struct in6_addr) * BITS_PER_BYTE + 1)

struct mlxsw_sp_prefix_usage {
	DECLARE_BITMAP(b, MLXSW_SP_PREFIX_COUNT);
};

#define mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage) \
	for_each_set_bit(prefix, (prefix_usage)->b, MLXSW_SP_PREFIX_COUNT)

static bool
mlxsw_sp_prefix_usage_eq(struct mlxsw_sp_prefix_usage *prefix_usage1,
			 struct mlxsw_sp_prefix_usage *prefix_usage2)
{
	return !memcmp(prefix_usage1, prefix_usage2, sizeof(*prefix_usage1));
}

static void
mlxsw_sp_prefix_usage_cpy(struct mlxsw_sp_prefix_usage *prefix_usage1,
			  struct mlxsw_sp_prefix_usage *prefix_usage2)
{
	memcpy(prefix_usage1, prefix_usage2, sizeof(*prefix_usage1));
}

static void
mlxsw_sp_prefix_usage_set(struct mlxsw_sp_prefix_usage *prefix_usage,
			  unsigned char prefix_len)
{
	set_bit(prefix_len, prefix_usage->b);
}

static void
mlxsw_sp_prefix_usage_clear(struct mlxsw_sp_prefix_usage *prefix_usage,
			    unsigned char prefix_len)
{
	clear_bit(prefix_len, prefix_usage->b);
}
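/* Illustrative sketch, not part of the driver: a prefix usage set is a
 * bitmap of prefix lengths (0..128) that occur in a FIB. E.g. marking /24
 * and /32 as used and walking the set bits in ascending order:
 *
 *	struct mlxsw_sp_prefix_usage usage = {};
 *	unsigned char prefix;
 *
 *	mlxsw_sp_prefix_usage_set(&usage, 24);
 *	mlxsw_sp_prefix_usage_set(&usage, 32);
 *	mlxsw_sp_prefix_usage_for_each(prefix, &usage)
 *		pr_debug("prefix length %u in use\n", prefix);
 */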
struct mlxsw_sp_fib_key {
	unsigned char addr[sizeof(struct in6_addr)];
	unsigned char prefix_len;
};

enum mlxsw_sp_fib_entry_type {
	MLXSW_SP_FIB_ENTRY_TYPE_REMOTE,
	MLXSW_SP_FIB_ENTRY_TYPE_LOCAL,
	MLXSW_SP_FIB_ENTRY_TYPE_TRAP,
	MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE,
	MLXSW_SP_FIB_ENTRY_TYPE_UNREACHABLE,

	/* This is a special case of local delivery, where a packet should be
	 * decapsulated on reception. Note that there is no corresponding ENCAP,
	 * because that's a type of next hop, not of FIB entry. (There can be
	 * several next hops in a REMOTE entry, and some of them may be
	 * encapsulating entries.)
	 */
	MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP,
	MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP,
};

struct mlxsw_sp_nexthop_group_info;
struct mlxsw_sp_nexthop_group;
struct mlxsw_sp_fib_entry;

struct mlxsw_sp_fib_node {
	struct mlxsw_sp_fib_entry *fib_entry;
	struct list_head list;
	struct rhash_head ht_node;
	struct mlxsw_sp_fib *fib;
	struct mlxsw_sp_fib_key key;
};

struct mlxsw_sp_fib_entry_decap {
	struct mlxsw_sp_ipip_entry *ipip_entry;
	u32 tunnel_index;
};

struct mlxsw_sp_fib_entry {
	struct mlxsw_sp_fib_node *fib_node;
	enum mlxsw_sp_fib_entry_type type;
	struct list_head nexthop_group_node;
	struct mlxsw_sp_nexthop_group *nh_group;
	struct mlxsw_sp_fib_entry_decap decap; /* Valid for decap entries. */
};

struct mlxsw_sp_fib4_entry {
	struct mlxsw_sp_fib_entry common;
	struct fib_info *fi;
	u32 tb_id;
	dscp_t dscp;
	u8 type;
};

struct mlxsw_sp_fib6_entry {
	struct mlxsw_sp_fib_entry common;
	struct list_head rt6_list;
	unsigned int nrt6;
};

struct mlxsw_sp_rt6 {
	struct list_head list;
	struct fib6_info *rt;
};

struct mlxsw_sp_lpm_tree {
	u8 id; /* tree ID */
	unsigned int ref_count;
	enum mlxsw_sp_l3proto proto;
	unsigned long prefix_ref_count[MLXSW_SP_PREFIX_COUNT];
	struct mlxsw_sp_prefix_usage prefix_usage;
};

struct mlxsw_sp_fib {
	struct rhashtable ht;
	struct list_head node_list;
	struct mlxsw_sp_vr *vr;
	struct mlxsw_sp_lpm_tree *lpm_tree;
	enum mlxsw_sp_l3proto proto;
};

struct mlxsw_sp_vr {
	u16 id; /* virtual router ID */
	u32 tb_id; /* kernel fib table id */
	unsigned int rif_count;
	struct mlxsw_sp_fib *fib4;
	struct mlxsw_sp_fib *fib6;
	struct mlxsw_sp_mr_table *mr_table[MLXSW_SP_L3_PROTO_MAX];
	struct mlxsw_sp_rif *ul_rif;
	refcount_t ul_rif_refcnt;
};

static const struct rhashtable_params mlxsw_sp_fib_ht_params;

static struct mlxsw_sp_fib *mlxsw_sp_fib_create(struct mlxsw_sp *mlxsw_sp,
						struct mlxsw_sp_vr *vr,
						enum mlxsw_sp_l3proto proto)
{
	struct mlxsw_sp_lpm_tree *lpm_tree;
	struct mlxsw_sp_fib *fib;
	int err;

	lpm_tree = mlxsw_sp->router->lpm.proto_trees[proto];
	fib = kzalloc(sizeof(*fib), GFP_KERNEL);
	if (!fib)
		return ERR_PTR(-ENOMEM);
	err = rhashtable_init(&fib->ht, &mlxsw_sp_fib_ht_params);
	if (err)
		goto err_rhashtable_init;
	INIT_LIST_HEAD(&fib->node_list);
	fib->proto = proto;
	fib->vr = vr;
	fib->lpm_tree = lpm_tree;
	mlxsw_sp_lpm_tree_hold(lpm_tree);
	err = mlxsw_sp_vr_lpm_tree_bind(mlxsw_sp, fib, lpm_tree->id);
	if (err)
		goto err_lpm_tree_bind;
	return fib;

err_lpm_tree_bind:
	mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
err_rhashtable_init:
	kfree(fib);
	return ERR_PTR(err);
}

static void mlxsw_sp_fib_destroy(struct mlxsw_sp *mlxsw_sp,
				 struct mlxsw_sp_fib *fib)
{
	mlxsw_sp_vr_lpm_tree_unbind(mlxsw_sp, fib);
	mlxsw_sp_lpm_tree_put(mlxsw_sp, fib->lpm_tree);
	WARN_ON(!list_empty(&fib->node_list));
	rhashtable_destroy(&fib->ht);
	kfree(fib);
}
static struct mlxsw_sp_lpm_tree *
mlxsw_sp_lpm_tree_find_unused(struct mlxsw_sp *mlxsw_sp)
{
	struct mlxsw_sp_lpm_tree *lpm_tree;
	int i;

	for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
		lpm_tree = &mlxsw_sp->router->lpm.trees[i];
		if (lpm_tree->ref_count == 0)
			return lpm_tree;
	}
	return NULL;
}

static int mlxsw_sp_lpm_tree_alloc(struct mlxsw_sp *mlxsw_sp,
				   struct mlxsw_sp_lpm_tree *lpm_tree)
{
	char ralta_pl[MLXSW_REG_RALTA_LEN];

	mlxsw_reg_ralta_pack(ralta_pl, true,
			     (enum mlxsw_reg_ralxx_protocol) lpm_tree->proto,
			     lpm_tree->id);
	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
}

static void mlxsw_sp_lpm_tree_free(struct mlxsw_sp *mlxsw_sp,
				   struct mlxsw_sp_lpm_tree *lpm_tree)
{
	char ralta_pl[MLXSW_REG_RALTA_LEN];

	mlxsw_reg_ralta_pack(ralta_pl, false,
			     (enum mlxsw_reg_ralxx_protocol) lpm_tree->proto,
			     lpm_tree->id);
	mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralta), ralta_pl);
}

static int
mlxsw_sp_lpm_tree_left_struct_set(struct mlxsw_sp *mlxsw_sp,
				  struct mlxsw_sp_prefix_usage *prefix_usage,
				  struct mlxsw_sp_lpm_tree *lpm_tree)
{
	char ralst_pl[MLXSW_REG_RALST_LEN];
	u8 root_bin = 0;
	u8 prefix;
	u8 last_prefix = MLXSW_REG_RALST_BIN_NO_CHILD;

	mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage)
		root_bin = prefix;

	mlxsw_reg_ralst_pack(ralst_pl, root_bin, lpm_tree->id);
	mlxsw_sp_prefix_usage_for_each(prefix, prefix_usage) {
		if (prefix == 0)
			continue;
		mlxsw_reg_ralst_bin_pack(ralst_pl, prefix, last_prefix,
					 MLXSW_REG_RALST_BIN_NO_CHILD);
		last_prefix = prefix;
	}
	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralst), ralst_pl);
}

static struct mlxsw_sp_lpm_tree *
mlxsw_sp_lpm_tree_create(struct mlxsw_sp *mlxsw_sp,
			 struct mlxsw_sp_prefix_usage *prefix_usage,
			 enum mlxsw_sp_l3proto proto)
{
	struct mlxsw_sp_lpm_tree *lpm_tree;
	int err;

	lpm_tree = mlxsw_sp_lpm_tree_find_unused(mlxsw_sp);
	if (!lpm_tree)
		return ERR_PTR(-EBUSY);
	lpm_tree->proto = proto;
	err = mlxsw_sp_lpm_tree_alloc(mlxsw_sp, lpm_tree);
	if (err)
		return ERR_PTR(err);

	err = mlxsw_sp_lpm_tree_left_struct_set(mlxsw_sp, prefix_usage,
						lpm_tree);
	if (err)
		goto err_left_struct_set;
	memcpy(&lpm_tree->prefix_usage, prefix_usage,
	       sizeof(lpm_tree->prefix_usage));
	memset(&lpm_tree->prefix_ref_count, 0,
	       sizeof(lpm_tree->prefix_ref_count));
	lpm_tree->ref_count = 1;
	return lpm_tree;

err_left_struct_set:
	mlxsw_sp_lpm_tree_free(mlxsw_sp, lpm_tree);
	return ERR_PTR(err);
}

static void mlxsw_sp_lpm_tree_destroy(struct mlxsw_sp *mlxsw_sp,
				      struct mlxsw_sp_lpm_tree *lpm_tree)
{
	mlxsw_sp_lpm_tree_free(mlxsw_sp, lpm_tree);
}

static struct mlxsw_sp_lpm_tree *
mlxsw_sp_lpm_tree_get(struct mlxsw_sp *mlxsw_sp,
		      struct mlxsw_sp_prefix_usage *prefix_usage,
		      enum mlxsw_sp_l3proto proto)
{
	struct mlxsw_sp_lpm_tree *lpm_tree;
	int i;

	for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
		lpm_tree = &mlxsw_sp->router->lpm.trees[i];
		if (lpm_tree->ref_count != 0 &&
		    lpm_tree->proto == proto &&
		    mlxsw_sp_prefix_usage_eq(&lpm_tree->prefix_usage,
					     prefix_usage)) {
			mlxsw_sp_lpm_tree_hold(lpm_tree);
			return lpm_tree;
		}
	}
	return mlxsw_sp_lpm_tree_create(mlxsw_sp, prefix_usage, proto);
}

static void mlxsw_sp_lpm_tree_hold(struct mlxsw_sp_lpm_tree *lpm_tree)
{
	lpm_tree->ref_count++;
}

static void mlxsw_sp_lpm_tree_put(struct mlxsw_sp *mlxsw_sp,
				  struct mlxsw_sp_lpm_tree *lpm_tree)
{
	if (--lpm_tree->ref_count == 0)
		mlxsw_sp_lpm_tree_destroy(mlxsw_sp, lpm_tree);
}
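/* Illustrative sketch, not part of the driver: LPM trees are reference
 * counted and shared between FIBs whose prefix usage matches. A caller that
 * needs a tree for IPv4 routes with /24 and /32 prefixes would do:
 *
 *	struct mlxsw_sp_prefix_usage usage = {};
 *	struct mlxsw_sp_lpm_tree *tree;
 *
 *	mlxsw_sp_prefix_usage_set(&usage, 24);
 *	mlxsw_sp_prefix_usage_set(&usage, 32);
 *	tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &usage,
 *				     MLXSW_SP_L3_PROTO_IPV4);
 *	if (IS_ERR(tree))
 *		return PTR_ERR(tree);
 *	...
 *	mlxsw_sp_lpm_tree_put(mlxsw_sp, tree);
 */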
#define MLXSW_SP_LPM_TREE_MIN 1 /* tree 0 is reserved */

static int mlxsw_sp_lpm_init(struct mlxsw_sp *mlxsw_sp)
{
	struct mlxsw_sp_prefix_usage req_prefix_usage = {{ 0 } };
	struct mlxsw_sp_lpm_tree *lpm_tree;
	u64 max_trees;
	int err, i;

	if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_LPM_TREES))
		return -EIO;

	max_trees = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_LPM_TREES);
	mlxsw_sp->router->lpm.tree_count = max_trees - MLXSW_SP_LPM_TREE_MIN;
	mlxsw_sp->router->lpm.trees = kcalloc(mlxsw_sp->router->lpm.tree_count,
					      sizeof(struct mlxsw_sp_lpm_tree),
					      GFP_KERNEL);
	if (!mlxsw_sp->router->lpm.trees)
		return -ENOMEM;

	for (i = 0; i < mlxsw_sp->router->lpm.tree_count; i++) {
		lpm_tree = &mlxsw_sp->router->lpm.trees[i];
		lpm_tree->id = i + MLXSW_SP_LPM_TREE_MIN;
	}

	lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
					 MLXSW_SP_L3_PROTO_IPV4);
	if (IS_ERR(lpm_tree)) {
		err = PTR_ERR(lpm_tree);
		goto err_ipv4_tree_get;
	}
	mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4] = lpm_tree;

	lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage,
					 MLXSW_SP_L3_PROTO_IPV6);
	if (IS_ERR(lpm_tree)) {
		err = PTR_ERR(lpm_tree);
		goto err_ipv6_tree_get;
	}
	mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV6] = lpm_tree;

	return 0;

err_ipv6_tree_get:
	lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4];
	mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);
err_ipv4_tree_get:
	kfree(mlxsw_sp->router->lpm.trees);
	return err;
}

static void mlxsw_sp_lpm_fini(struct mlxsw_sp *mlxsw_sp)
{
	struct mlxsw_sp_lpm_tree *lpm_tree;

	lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV6];
	mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);

	lpm_tree = mlxsw_sp->router->lpm.proto_trees[MLXSW_SP_L3_PROTO_IPV4];
	mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree);

	kfree(mlxsw_sp->router->lpm.trees);
}

static bool mlxsw_sp_vr_is_used(const struct mlxsw_sp_vr *vr)
{
	return !!vr->fib4 || !!vr->fib6 ||
	       !!vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] ||
	       !!vr->mr_table[MLXSW_SP_L3_PROTO_IPV6];
}

static struct mlxsw_sp_vr *mlxsw_sp_vr_find_unused(struct mlxsw_sp *mlxsw_sp)
{
	struct mlxsw_sp_vr *vr;
	int i;

	for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
		vr = &mlxsw_sp->router->vrs[i];
		if (!mlxsw_sp_vr_is_used(vr))
			return vr;
	}
	return NULL;
}

static int mlxsw_sp_vr_lpm_tree_bind(struct mlxsw_sp *mlxsw_sp,
				     const struct mlxsw_sp_fib *fib, u8 tree_id)
{
	char raltb_pl[MLXSW_REG_RALTB_LEN];

	mlxsw_reg_raltb_pack(raltb_pl, fib->vr->id,
			     (enum mlxsw_reg_ralxx_protocol) fib->proto,
			     tree_id);
	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb), raltb_pl);
}

static int mlxsw_sp_vr_lpm_tree_unbind(struct mlxsw_sp *mlxsw_sp,
				       const struct mlxsw_sp_fib *fib)
{
	char raltb_pl[MLXSW_REG_RALTB_LEN];

	/* Bind to tree 0 which is default */
	mlxsw_reg_raltb_pack(raltb_pl, fib->vr->id,
			     (enum mlxsw_reg_ralxx_protocol) fib->proto, 0);
	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raltb), raltb_pl);
}

static u32 mlxsw_sp_fix_tb_id(u32 tb_id)
{
	/* For our purpose, squash main, default and local tables into one */
	if (tb_id == RT_TABLE_LOCAL || tb_id == RT_TABLE_DEFAULT)
		tb_id = RT_TABLE_MAIN;
	return tb_id;
}
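/* Illustrative, not part of the driver: from the driver's point of view the
 * local and default tables alias the main table, while other table IDs pass
 * through unchanged:
 *
 *	mlxsw_sp_fix_tb_id(RT_TABLE_LOCAL)   == RT_TABLE_MAIN
 *	mlxsw_sp_fix_tb_id(RT_TABLE_DEFAULT) == RT_TABLE_MAIN
 *	mlxsw_sp_fix_tb_id(100)              == 100
 */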
static struct mlxsw_sp_vr *mlxsw_sp_vr_find(struct mlxsw_sp *mlxsw_sp,
					    u32 tb_id)
{
	struct mlxsw_sp_vr *vr;
	int i;

	tb_id = mlxsw_sp_fix_tb_id(tb_id);

	for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
		vr = &mlxsw_sp->router->vrs[i];
		if (mlxsw_sp_vr_is_used(vr) && vr->tb_id == tb_id)
			return vr;
	}
	return NULL;
}

int mlxsw_sp_router_tb_id_vr_id(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
				u16 *vr_id)
{
	struct mlxsw_sp_vr *vr;
	int err = 0;

	mutex_lock(&mlxsw_sp->router->lock);
	vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
	if (!vr) {
		err = -ESRCH;
		goto out;
	}
	*vr_id = vr->id;
out:
	mutex_unlock(&mlxsw_sp->router->lock);
	return err;
}

static struct mlxsw_sp_fib *mlxsw_sp_vr_fib(const struct mlxsw_sp_vr *vr,
					    enum mlxsw_sp_l3proto proto)
{
	switch (proto) {
	case MLXSW_SP_L3_PROTO_IPV4:
		return vr->fib4;
	case MLXSW_SP_L3_PROTO_IPV6:
		return vr->fib6;
	}
	return NULL;
}

static struct mlxsw_sp_vr *mlxsw_sp_vr_create(struct mlxsw_sp *mlxsw_sp,
					      u32 tb_id,
					      struct netlink_ext_ack *extack)
{
	struct mlxsw_sp_mr_table *mr4_table, *mr6_table;
	struct mlxsw_sp_fib *fib4;
	struct mlxsw_sp_fib *fib6;
	struct mlxsw_sp_vr *vr;
	int err;

	vr = mlxsw_sp_vr_find_unused(mlxsw_sp);
	if (!vr) {
		NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported virtual routers");
		return ERR_PTR(-EBUSY);
	}
	fib4 = mlxsw_sp_fib_create(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV4);
	if (IS_ERR(fib4))
		return ERR_CAST(fib4);
	fib6 = mlxsw_sp_fib_create(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV6);
	if (IS_ERR(fib6)) {
		err = PTR_ERR(fib6);
		goto err_fib6_create;
	}
	mr4_table = mlxsw_sp_mr_table_create(mlxsw_sp, vr->id,
					     MLXSW_SP_L3_PROTO_IPV4);
	if (IS_ERR(mr4_table)) {
		err = PTR_ERR(mr4_table);
		goto err_mr4_table_create;
	}
	mr6_table = mlxsw_sp_mr_table_create(mlxsw_sp, vr->id,
					     MLXSW_SP_L3_PROTO_IPV6);
	if (IS_ERR(mr6_table)) {
		err = PTR_ERR(mr6_table);
		goto err_mr6_table_create;
	}

	vr->fib4 = fib4;
	vr->fib6 = fib6;
	vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] = mr4_table;
	vr->mr_table[MLXSW_SP_L3_PROTO_IPV6] = mr6_table;
	vr->tb_id = tb_id;
	return vr;

err_mr6_table_create:
	mlxsw_sp_mr_table_destroy(mr4_table);
err_mr4_table_create:
	mlxsw_sp_fib_destroy(mlxsw_sp, fib6);
err_fib6_create:
	mlxsw_sp_fib_destroy(mlxsw_sp, fib4);
	return ERR_PTR(err);
}

static void mlxsw_sp_vr_destroy(struct mlxsw_sp *mlxsw_sp,
				struct mlxsw_sp_vr *vr)
{
	mlxsw_sp_mr_table_destroy(vr->mr_table[MLXSW_SP_L3_PROTO_IPV6]);
	vr->mr_table[MLXSW_SP_L3_PROTO_IPV6] = NULL;
	mlxsw_sp_mr_table_destroy(vr->mr_table[MLXSW_SP_L3_PROTO_IPV4]);
	vr->mr_table[MLXSW_SP_L3_PROTO_IPV4] = NULL;
	mlxsw_sp_fib_destroy(mlxsw_sp, vr->fib6);
	vr->fib6 = NULL;
	mlxsw_sp_fib_destroy(mlxsw_sp, vr->fib4);
	vr->fib4 = NULL;
}

static struct mlxsw_sp_vr *mlxsw_sp_vr_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
					   struct netlink_ext_ack *extack)
{
	struct mlxsw_sp_vr *vr;

	tb_id = mlxsw_sp_fix_tb_id(tb_id);
	vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
	if (!vr)
		vr = mlxsw_sp_vr_create(mlxsw_sp, tb_id, extack);
	return vr;
}
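/* Illustrative sketch, not part of the driver: virtual routers are looked
 * up (or lazily created) by kernel table ID and destroyed once they hold no
 * RIFs, routes or multicast routes:
 *
 *	struct mlxsw_sp_vr *vr;
 *
 *	vr = mlxsw_sp_vr_get(mlxsw_sp, RT_TABLE_MAIN, NULL);
 *	if (IS_ERR(vr))
 *		return PTR_ERR(vr);
 *	...
 *	mlxsw_sp_vr_put(mlxsw_sp, vr);
 */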
static void mlxsw_sp_vr_put(struct mlxsw_sp *mlxsw_sp, struct mlxsw_sp_vr *vr)
{
	if (!vr->rif_count && list_empty(&vr->fib4->node_list) &&
	    list_empty(&vr->fib6->node_list) &&
	    mlxsw_sp_mr_table_empty(vr->mr_table[MLXSW_SP_L3_PROTO_IPV4]) &&
	    mlxsw_sp_mr_table_empty(vr->mr_table[MLXSW_SP_L3_PROTO_IPV6]))
		mlxsw_sp_vr_destroy(mlxsw_sp, vr);
}

static bool
mlxsw_sp_vr_lpm_tree_should_replace(struct mlxsw_sp_vr *vr,
				    enum mlxsw_sp_l3proto proto, u8 tree_id)
{
	struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto);

	if (!mlxsw_sp_vr_is_used(vr))
		return false;
	if (fib->lpm_tree->id == tree_id)
		return true;
	return false;
}

static int mlxsw_sp_vr_lpm_tree_replace(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_fib *fib,
					struct mlxsw_sp_lpm_tree *new_tree)
{
	struct mlxsw_sp_lpm_tree *old_tree = fib->lpm_tree;
	int err;

	fib->lpm_tree = new_tree;
	mlxsw_sp_lpm_tree_hold(new_tree);
	err = mlxsw_sp_vr_lpm_tree_bind(mlxsw_sp, fib, new_tree->id);
	if (err)
		goto err_tree_bind;
	mlxsw_sp_lpm_tree_put(mlxsw_sp, old_tree);
	return 0;

err_tree_bind:
	mlxsw_sp_lpm_tree_put(mlxsw_sp, new_tree);
	fib->lpm_tree = old_tree;
	return err;
}

static int mlxsw_sp_vrs_lpm_tree_replace(struct mlxsw_sp *mlxsw_sp,
					 struct mlxsw_sp_fib *fib,
					 struct mlxsw_sp_lpm_tree *new_tree)
{
	enum mlxsw_sp_l3proto proto = fib->proto;
	struct mlxsw_sp_lpm_tree *old_tree;
	u8 old_id, new_id = new_tree->id;
	struct mlxsw_sp_vr *vr;
	int i, err;

	old_tree = mlxsw_sp->router->lpm.proto_trees[proto];
	old_id = old_tree->id;

	for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) {
		vr = &mlxsw_sp->router->vrs[i];
		if (!mlxsw_sp_vr_lpm_tree_should_replace(vr, proto, old_id))
			continue;
		err = mlxsw_sp_vr_lpm_tree_replace(mlxsw_sp,
						   mlxsw_sp_vr_fib(vr, proto),
						   new_tree);
		if (err)
			goto err_tree_replace;
	}

	memcpy(new_tree->prefix_ref_count, old_tree->prefix_ref_count,
	       sizeof(new_tree->prefix_ref_count));
	mlxsw_sp->router->lpm.proto_trees[proto] = new_tree;
	mlxsw_sp_lpm_tree_put(mlxsw_sp, old_tree);

	return 0;

err_tree_replace:
	for (i--; i >= 0; i--) {
		vr = &mlxsw_sp->router->vrs[i];
		if (!mlxsw_sp_vr_lpm_tree_should_replace(vr, proto, new_id))
			continue;
		mlxsw_sp_vr_lpm_tree_replace(mlxsw_sp,
					     mlxsw_sp_vr_fib(vr, proto),
					     old_tree);
	}
	return err;
}

static int mlxsw_sp_vrs_init(struct mlxsw_sp *mlxsw_sp)
{
	struct mlxsw_sp_vr *vr;
	u64 max_vrs;
	int i;

	if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_VRS))
		return -EIO;

	max_vrs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS);
	mlxsw_sp->router->vrs = kcalloc(max_vrs, sizeof(struct mlxsw_sp_vr),
					GFP_KERNEL);
	if (!mlxsw_sp->router->vrs)
		return -ENOMEM;

	for (i = 0; i < max_vrs; i++) {
		vr = &mlxsw_sp->router->vrs[i];
		vr->id = i;
	}

	return 0;
}

static void mlxsw_sp_router_fib_flush(struct mlxsw_sp *mlxsw_sp);
static void mlxsw_sp_vrs_fini(struct mlxsw_sp *mlxsw_sp)
{
	/* At this stage we're guaranteed not to have new incoming
	 * FIB notifications and the work queue is free from FIBs
	 * sitting on top of mlxsw netdevs. However, we can still
	 * have other FIBs queued. Flush the queue before flushing
	 * the device's tables. No need for locks, as we're the only
	 * writer.
	 */
	mlxsw_core_flush_owq();
	mlxsw_sp_router_fib_flush(mlxsw_sp);
	kfree(mlxsw_sp->router->vrs);
}

u32 mlxsw_sp_ipip_dev_ul_tb_id(const struct net_device *ol_dev)
{
	struct net_device *d;
	u32 tb_id;

	rcu_read_lock();
	d = mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
	if (d)
		tb_id = l3mdev_fib_table(d) ? : RT_TABLE_MAIN;
	else
		tb_id = RT_TABLE_MAIN;
	rcu_read_unlock();

	return tb_id;
}

static struct mlxsw_sp_rif *
mlxsw_sp_rif_create(struct mlxsw_sp *mlxsw_sp,
		    const struct mlxsw_sp_rif_params *params,
		    struct netlink_ext_ack *extack);

static struct mlxsw_sp_rif_ipip_lb *
mlxsw_sp_ipip_ol_ipip_lb_create(struct mlxsw_sp *mlxsw_sp,
				enum mlxsw_sp_ipip_type ipipt,
				struct net_device *ol_dev,
				struct netlink_ext_ack *extack)
{
	struct mlxsw_sp_rif_params_ipip_lb lb_params;
	const struct mlxsw_sp_ipip_ops *ipip_ops;
	struct mlxsw_sp_rif *rif;

	ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipipt];
	lb_params = (struct mlxsw_sp_rif_params_ipip_lb) {
		.common.dev = ol_dev,
		.common.lag = false,
		.lb_config = ipip_ops->ol_loopback_config(mlxsw_sp, ol_dev),
	};

	rif = mlxsw_sp_rif_create(mlxsw_sp, &lb_params.common, extack);
	if (IS_ERR(rif))
		return ERR_CAST(rif);
	return container_of(rif, struct mlxsw_sp_rif_ipip_lb, common);
}

static struct mlxsw_sp_ipip_entry *
mlxsw_sp_ipip_entry_alloc(struct mlxsw_sp *mlxsw_sp,
			  enum mlxsw_sp_ipip_type ipipt,
			  struct net_device *ol_dev)
{
	const struct mlxsw_sp_ipip_ops *ipip_ops;
	struct mlxsw_sp_ipip_entry *ipip_entry;
	struct mlxsw_sp_ipip_entry *ret = NULL;
	int err;

	ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipipt];
	ipip_entry = kzalloc(sizeof(*ipip_entry), GFP_KERNEL);
	if (!ipip_entry)
		return ERR_PTR(-ENOMEM);

	ipip_entry->ol_lb = mlxsw_sp_ipip_ol_ipip_lb_create(mlxsw_sp, ipipt,
							    ol_dev, NULL);
	if (IS_ERR(ipip_entry->ol_lb)) {
		ret = ERR_CAST(ipip_entry->ol_lb);
		goto err_ol_ipip_lb_create;
	}

	ipip_entry->ipipt = ipipt;
	ipip_entry->ol_dev = ol_dev;
	ipip_entry->parms = ipip_ops->parms_init(ol_dev);

	err = ipip_ops->rem_ip_addr_set(mlxsw_sp, ipip_entry);
	if (err) {
		ret = ERR_PTR(err);
		goto err_rem_ip_addr_set;
	}

	return ipip_entry;

err_rem_ip_addr_set:
	mlxsw_sp_rif_destroy(&ipip_entry->ol_lb->common);
err_ol_ipip_lb_create:
	kfree(ipip_entry);
	return ret;
}

static void mlxsw_sp_ipip_entry_dealloc(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_ipip_entry *ipip_entry)
{
	const struct mlxsw_sp_ipip_ops *ipip_ops =
		mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];

	ipip_ops->rem_ip_addr_unset(mlxsw_sp, ipip_entry);
	mlxsw_sp_rif_destroy(&ipip_entry->ol_lb->common);
	kfree(ipip_entry);
}
static bool
mlxsw_sp_ipip_entry_saddr_matches(struct mlxsw_sp *mlxsw_sp,
				  const enum mlxsw_sp_l3proto ul_proto,
				  union mlxsw_sp_l3addr saddr,
				  u32 ul_tb_id,
				  struct mlxsw_sp_ipip_entry *ipip_entry)
{
	u32 tun_ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
	enum mlxsw_sp_ipip_type ipipt = ipip_entry->ipipt;
	union mlxsw_sp_l3addr tun_saddr;

	if (mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto != ul_proto)
		return false;

	tun_saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ipip_entry->ol_dev);
	return tun_ul_tb_id == ul_tb_id &&
	       mlxsw_sp_l3addr_eq(&tun_saddr, &saddr);
}

static int mlxsw_sp_ipip_decap_parsing_depth_inc(struct mlxsw_sp *mlxsw_sp,
						 enum mlxsw_sp_ipip_type ipipt)
{
	const struct mlxsw_sp_ipip_ops *ipip_ops;

	ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipipt];

	/* Not all tunnels require increasing the default parsing depth
	 * (96 bytes).
	 */
	if (ipip_ops->inc_parsing_depth)
		return mlxsw_sp_parsing_depth_inc(mlxsw_sp);

	return 0;
}

static void mlxsw_sp_ipip_decap_parsing_depth_dec(struct mlxsw_sp *mlxsw_sp,
						  enum mlxsw_sp_ipip_type ipipt)
{
	const struct mlxsw_sp_ipip_ops *ipip_ops =
		mlxsw_sp->router->ipip_ops_arr[ipipt];

	if (ipip_ops->inc_parsing_depth)
		mlxsw_sp_parsing_depth_dec(mlxsw_sp);
}

static int
mlxsw_sp_fib_entry_decap_init(struct mlxsw_sp *mlxsw_sp,
			      struct mlxsw_sp_fib_entry *fib_entry,
			      struct mlxsw_sp_ipip_entry *ipip_entry)
{
	u32 tunnel_index;
	int err;

	err = mlxsw_sp_kvdl_alloc(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
				  1, &tunnel_index);
	if (err)
		return err;

	err = mlxsw_sp_ipip_decap_parsing_depth_inc(mlxsw_sp,
						    ipip_entry->ipipt);
	if (err)
		goto err_parsing_depth_inc;

	ipip_entry->decap_fib_entry = fib_entry;
	fib_entry->decap.ipip_entry = ipip_entry;
	fib_entry->decap.tunnel_index = tunnel_index;

	return 0;

err_parsing_depth_inc:
	/* Free the index allocated above; fib_entry->decap.tunnel_index has
	 * not been assigned yet on this path.
	 */
	mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 1,
			   tunnel_index);
	return err;
}
static void mlxsw_sp_fib_entry_decap_fini(struct mlxsw_sp *mlxsw_sp,
					  struct mlxsw_sp_fib_entry *fib_entry)
{
	enum mlxsw_sp_ipip_type ipipt = fib_entry->decap.ipip_entry->ipipt;

	/* Unlink this node from the IPIP entry that it's the decap entry of. */
	fib_entry->decap.ipip_entry->decap_fib_entry = NULL;
	fib_entry->decap.ipip_entry = NULL;
	mlxsw_sp_ipip_decap_parsing_depth_dec(mlxsw_sp, ipipt);
	mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ,
			   1, fib_entry->decap.tunnel_index);
}

static struct mlxsw_sp_fib_node *
mlxsw_sp_fib_node_lookup(struct mlxsw_sp_fib *fib, const void *addr,
			 size_t addr_len, unsigned char prefix_len);
static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp,
				     struct mlxsw_sp_fib_entry *fib_entry);

static void
mlxsw_sp_ipip_entry_demote_decap(struct mlxsw_sp *mlxsw_sp,
				 struct mlxsw_sp_ipip_entry *ipip_entry)
{
	struct mlxsw_sp_fib_entry *fib_entry = ipip_entry->decap_fib_entry;

	mlxsw_sp_fib_entry_decap_fini(mlxsw_sp, fib_entry);
	fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP;

	mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry);
}

static void
mlxsw_sp_ipip_entry_promote_decap(struct mlxsw_sp *mlxsw_sp,
				  struct mlxsw_sp_ipip_entry *ipip_entry,
				  struct mlxsw_sp_fib_entry *decap_fib_entry)
{
	if (mlxsw_sp_fib_entry_decap_init(mlxsw_sp, decap_fib_entry,
					  ipip_entry))
		return;
	decap_fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP;

	if (mlxsw_sp_fib_entry_update(mlxsw_sp, decap_fib_entry))
		mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
}

static struct mlxsw_sp_fib_entry *
mlxsw_sp_router_ip2me_fib_entry_find(struct mlxsw_sp *mlxsw_sp, u32 tb_id,
				     enum mlxsw_sp_l3proto proto,
				     const union mlxsw_sp_l3addr *addr,
				     enum mlxsw_sp_fib_entry_type type)
{
	struct mlxsw_sp_fib_node *fib_node;
	unsigned char addr_prefix_len;
	struct mlxsw_sp_fib *fib;
	struct mlxsw_sp_vr *vr;
	const void *addrp;
	size_t addr_len;
	u32 addr4;

	vr = mlxsw_sp_vr_find(mlxsw_sp, tb_id);
	if (!vr)
		return NULL;
	fib = mlxsw_sp_vr_fib(vr, proto);

	switch (proto) {
	case MLXSW_SP_L3_PROTO_IPV4:
		addr4 = be32_to_cpu(addr->addr4);
		addrp = &addr4;
		addr_len = 4;
		addr_prefix_len = 32;
		break;
	case MLXSW_SP_L3_PROTO_IPV6:
		addrp = &addr->addr6;
		addr_len = 16;
		addr_prefix_len = 128;
		break;
	default:
		WARN_ON(1);
		return NULL;
	}

	fib_node = mlxsw_sp_fib_node_lookup(fib, addrp, addr_len,
					    addr_prefix_len);
	if (!fib_node || fib_node->fib_entry->type != type)
		return NULL;

	return fib_node->fib_entry;
}
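/* Illustrative sketch, not part of the driver: looking up the local (TRAP)
 * host route for an IPv4 address in the main table, e.g. to check whether a
 * tunnel's local address is already installed. 192.0.2.1 is a documentation
 * address used purely as an example:
 *
 *	union mlxsw_sp_l3addr addr = { .addr4 = cpu_to_be32(0xc0000201) };
 *	struct mlxsw_sp_fib_entry *fib_entry;
 *
 *	fib_entry = mlxsw_sp_router_ip2me_fib_entry_find(mlxsw_sp,
 *					RT_TABLE_MAIN,
 *					MLXSW_SP_L3_PROTO_IPV4, &addr,
 *					MLXSW_SP_FIB_ENTRY_TYPE_TRAP);
 */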
/* Given an IPIP entry, find the corresponding decap route. */
static struct mlxsw_sp_fib_entry *
mlxsw_sp_ipip_entry_find_decap(struct mlxsw_sp *mlxsw_sp,
			       struct mlxsw_sp_ipip_entry *ipip_entry)
{
	struct mlxsw_sp_fib_node *fib_node;
	const struct mlxsw_sp_ipip_ops *ipip_ops;
	unsigned char saddr_prefix_len;
	union mlxsw_sp_l3addr saddr;
	struct mlxsw_sp_fib *ul_fib;
	struct mlxsw_sp_vr *ul_vr;
	const void *saddrp;
	size_t saddr_len;
	u32 ul_tb_id;
	u32 saddr4;

	ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];

	ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ipip_entry->ol_dev);
	ul_vr = mlxsw_sp_vr_find(mlxsw_sp, ul_tb_id);
	if (!ul_vr)
		return NULL;

	ul_fib = mlxsw_sp_vr_fib(ul_vr, ipip_ops->ul_proto);
	saddr = mlxsw_sp_ipip_netdev_saddr(ipip_ops->ul_proto,
					   ipip_entry->ol_dev);

	switch (ipip_ops->ul_proto) {
	case MLXSW_SP_L3_PROTO_IPV4:
		saddr4 = be32_to_cpu(saddr.addr4);
		saddrp = &saddr4;
		saddr_len = 4;
		saddr_prefix_len = 32;
		break;
	case MLXSW_SP_L3_PROTO_IPV6:
		saddrp = &saddr.addr6;
		saddr_len = 16;
		saddr_prefix_len = 128;
		break;
	default:
		WARN_ON(1);
		return NULL;
	}

	fib_node = mlxsw_sp_fib_node_lookup(ul_fib, saddrp, saddr_len,
					    saddr_prefix_len);
	if (!fib_node ||
	    fib_node->fib_entry->type != MLXSW_SP_FIB_ENTRY_TYPE_TRAP)
		return NULL;

	return fib_node->fib_entry;
}

static struct mlxsw_sp_ipip_entry *
mlxsw_sp_ipip_entry_create(struct mlxsw_sp *mlxsw_sp,
			   enum mlxsw_sp_ipip_type ipipt,
			   struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *ipip_entry;

	ipip_entry = mlxsw_sp_ipip_entry_alloc(mlxsw_sp, ipipt, ol_dev);
	if (IS_ERR(ipip_entry))
		return ipip_entry;

	list_add_tail(&ipip_entry->ipip_list_node,
		      &mlxsw_sp->router->ipip_list);

	return ipip_entry;
}

static void
mlxsw_sp_ipip_entry_destroy(struct mlxsw_sp *mlxsw_sp,
			    struct mlxsw_sp_ipip_entry *ipip_entry)
{
	list_del(&ipip_entry->ipip_list_node);
	mlxsw_sp_ipip_entry_dealloc(mlxsw_sp, ipip_entry);
}

static bool
mlxsw_sp_ipip_entry_matches_decap(struct mlxsw_sp *mlxsw_sp,
				  const struct net_device *ul_dev,
				  enum mlxsw_sp_l3proto ul_proto,
				  union mlxsw_sp_l3addr ul_dip,
				  struct mlxsw_sp_ipip_entry *ipip_entry)
{
	u32 ul_tb_id = l3mdev_fib_table(ul_dev) ? : RT_TABLE_MAIN;
	enum mlxsw_sp_ipip_type ipipt = ipip_entry->ipipt;

	if (mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto != ul_proto)
		return false;

	return mlxsw_sp_ipip_entry_saddr_matches(mlxsw_sp, ul_proto, ul_dip,
						 ul_tb_id, ipip_entry);
}
/* Given decap parameters, find the corresponding IPIP entry. */
static struct mlxsw_sp_ipip_entry *
mlxsw_sp_ipip_entry_find_by_decap(struct mlxsw_sp *mlxsw_sp, int ul_dev_ifindex,
				  enum mlxsw_sp_l3proto ul_proto,
				  union mlxsw_sp_l3addr ul_dip)
{
	struct mlxsw_sp_ipip_entry *ipip_entry = NULL;
	struct net_device *ul_dev;

	rcu_read_lock();

	ul_dev = dev_get_by_index_rcu(mlxsw_sp_net(mlxsw_sp), ul_dev_ifindex);
	if (!ul_dev)
		goto out_unlock;

	list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
			    ipip_list_node)
		if (mlxsw_sp_ipip_entry_matches_decap(mlxsw_sp, ul_dev,
						      ul_proto, ul_dip,
						      ipip_entry))
			goto out_unlock;

	rcu_read_unlock();

	return NULL;

out_unlock:
	rcu_read_unlock();
	return ipip_entry;
}

static bool mlxsw_sp_netdev_ipip_type(const struct mlxsw_sp *mlxsw_sp,
				      const struct net_device *dev,
				      enum mlxsw_sp_ipip_type *p_type)
{
	struct mlxsw_sp_router *router = mlxsw_sp->router;
	const struct mlxsw_sp_ipip_ops *ipip_ops;
	enum mlxsw_sp_ipip_type ipipt;

	for (ipipt = 0; ipipt < MLXSW_SP_IPIP_TYPE_MAX; ++ipipt) {
		ipip_ops = router->ipip_ops_arr[ipipt];
		if (dev->type == ipip_ops->dev_type) {
			if (p_type)
				*p_type = ipipt;
			return true;
		}
	}
	return false;
}

static bool mlxsw_sp_netdev_is_ipip_ol(const struct mlxsw_sp *mlxsw_sp,
				       const struct net_device *dev)
{
	return mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL);
}

static struct mlxsw_sp_ipip_entry *
mlxsw_sp_ipip_entry_find_by_ol_dev(struct mlxsw_sp *mlxsw_sp,
				   const struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *ipip_entry;

	list_for_each_entry(ipip_entry, &mlxsw_sp->router->ipip_list,
			    ipip_list_node)
		if (ipip_entry->ol_dev == ol_dev)
			return ipip_entry;

	return NULL;
}

static struct mlxsw_sp_ipip_entry *
mlxsw_sp_ipip_entry_find_by_ul_dev(const struct mlxsw_sp *mlxsw_sp,
				   const struct net_device *ul_dev,
				   struct mlxsw_sp_ipip_entry *start)
{
	struct mlxsw_sp_ipip_entry *ipip_entry;

	ipip_entry = list_prepare_entry(start, &mlxsw_sp->router->ipip_list,
					ipip_list_node);
	list_for_each_entry_continue(ipip_entry, &mlxsw_sp->router->ipip_list,
				     ipip_list_node) {
		struct net_device *ol_dev = ipip_entry->ol_dev;
		struct net_device *ipip_ul_dev;

		rcu_read_lock();
		ipip_ul_dev = mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
		rcu_read_unlock();

		if (ipip_ul_dev == ul_dev)
			return ipip_entry;
	}

	return NULL;
}

static bool mlxsw_sp_netdev_is_ipip_ul(struct mlxsw_sp *mlxsw_sp,
				       const struct net_device *dev)
{
	return mlxsw_sp_ipip_entry_find_by_ul_dev(mlxsw_sp, dev, NULL);
}

static bool mlxsw_sp_netdevice_ipip_can_offload(struct mlxsw_sp *mlxsw_sp,
						const struct net_device *ol_dev,
						enum mlxsw_sp_ipip_type ipipt)
{
	const struct mlxsw_sp_ipip_ops *ops
		= mlxsw_sp->router->ipip_ops_arr[ipipt];

	return ops->can_offload(mlxsw_sp, ol_dev);
}
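/* Illustrative sketch, not part of the driver: classifying a netdevice as
 * an offloadable IPIP overlay before reacting to its events:
 *
 *	enum mlxsw_sp_ipip_type ipipt;
 *
 *	if (mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, &ipipt) &&
 *	    mlxsw_sp_netdevice_ipip_can_offload(mlxsw_sp, dev, ipipt))
 *		;	// the tunnel can be offloaded as type 'ipipt'
 */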
static int mlxsw_sp_netdevice_ipip_ol_reg_event(struct mlxsw_sp *mlxsw_sp,
						struct net_device *ol_dev)
{
	enum mlxsw_sp_ipip_type ipipt = MLXSW_SP_IPIP_TYPE_MAX;
	struct mlxsw_sp_ipip_entry *ipip_entry;
	enum mlxsw_sp_l3proto ul_proto;
	union mlxsw_sp_l3addr saddr;
	u32 ul_tb_id;

	mlxsw_sp_netdev_ipip_type(mlxsw_sp, ol_dev, &ipipt);
	if (mlxsw_sp_netdevice_ipip_can_offload(mlxsw_sp, ol_dev, ipipt)) {
		ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(ol_dev);
		ul_proto = mlxsw_sp->router->ipip_ops_arr[ipipt]->ul_proto;
		saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ol_dev);
		if (!mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp, ul_proto,
							  saddr, ul_tb_id,
							  NULL)) {
			ipip_entry = mlxsw_sp_ipip_entry_create(mlxsw_sp, ipipt,
								ol_dev);
			if (IS_ERR(ipip_entry))
				return PTR_ERR(ipip_entry);
		}
	}

	return 0;
}

static void mlxsw_sp_netdevice_ipip_ol_unreg_event(struct mlxsw_sp *mlxsw_sp,
						   struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *ipip_entry;

	ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (ipip_entry)
		mlxsw_sp_ipip_entry_destroy(mlxsw_sp, ipip_entry);
}

static void
mlxsw_sp_ipip_entry_ol_up_event(struct mlxsw_sp *mlxsw_sp,
				struct mlxsw_sp_ipip_entry *ipip_entry)
{
	struct mlxsw_sp_fib_entry *decap_fib_entry;

	decap_fib_entry = mlxsw_sp_ipip_entry_find_decap(mlxsw_sp, ipip_entry);
	if (decap_fib_entry)
		mlxsw_sp_ipip_entry_promote_decap(mlxsw_sp, ipip_entry,
						  decap_fib_entry);
}

static int
mlxsw_sp_rif_ipip_lb_op(struct mlxsw_sp_rif_ipip_lb *lb_rif, u16 ul_vr_id,
			u16 ul_rif_id, bool enable)
{
	struct mlxsw_sp_rif_ipip_lb_config lb_cf = lb_rif->lb_config;
	enum mlxsw_reg_ritr_loopback_ipip_options ipip_options;
	struct mlxsw_sp_rif *rif = &lb_rif->common;
	struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp;
	char ritr_pl[MLXSW_REG_RITR_LEN];
	struct in6_addr *saddr6;
	u32 saddr4;

	ipip_options = MLXSW_REG_RITR_LOOPBACK_IPIP_OPTIONS_GRE_KEY_PRESET;
	switch (lb_cf.ul_protocol) {
	case MLXSW_SP_L3_PROTO_IPV4:
		saddr4 = be32_to_cpu(lb_cf.saddr.addr4);
		mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_LOOPBACK_IF,
				    rif->rif_index, rif->vr_id, rif->dev->mtu);
		mlxsw_reg_ritr_loopback_ipip4_pack(ritr_pl, lb_cf.lb_ipipt,
						   ipip_options, ul_vr_id,
						   ul_rif_id, saddr4,
						   lb_cf.okey);
		break;

	case MLXSW_SP_L3_PROTO_IPV6:
		saddr6 = &lb_cf.saddr.addr6;
		mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_LOOPBACK_IF,
				    rif->rif_index, rif->vr_id, rif->dev->mtu);
		mlxsw_reg_ritr_loopback_ipip6_pack(ritr_pl, lb_cf.lb_ipipt,
						   ipip_options, ul_vr_id,
						   ul_rif_id, saddr6,
						   lb_cf.okey);
		break;
	}

	return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl);
}

static int mlxsw_sp_netdevice_ipip_ol_update_mtu(struct mlxsw_sp *mlxsw_sp,
						 struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *ipip_entry;
	struct mlxsw_sp_rif_ipip_lb *lb_rif;
	int err = 0;

	ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (ipip_entry) {
		lb_rif = ipip_entry->ol_lb;
		err = mlxsw_sp_rif_ipip_lb_op(lb_rif, lb_rif->ul_vr_id,
					      lb_rif->ul_rif_id, true);
		if (err)
			goto out;
		lb_rif->common.mtu = ol_dev->mtu;
	}

out:
	return err;
}

static void mlxsw_sp_netdevice_ipip_ol_up_event(struct mlxsw_sp *mlxsw_sp,
						struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *ipip_entry;

	ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (ipip_entry)
		mlxsw_sp_ipip_entry_ol_up_event(mlxsw_sp, ipip_entry);
}
static void
mlxsw_sp_ipip_entry_ol_down_event(struct mlxsw_sp *mlxsw_sp,
				  struct mlxsw_sp_ipip_entry *ipip_entry)
{
	if (ipip_entry->decap_fib_entry)
		mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);
}

static void mlxsw_sp_netdevice_ipip_ol_down_event(struct mlxsw_sp *mlxsw_sp,
						  struct net_device *ol_dev)
{
	struct mlxsw_sp_ipip_entry *ipip_entry;

	ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (ipip_entry)
		mlxsw_sp_ipip_entry_ol_down_event(mlxsw_sp, ipip_entry);
}

static void mlxsw_sp_nexthop_rif_migrate(struct mlxsw_sp *mlxsw_sp,
					 struct mlxsw_sp_rif *old_rif,
					 struct mlxsw_sp_rif *new_rif);
static int
mlxsw_sp_ipip_entry_ol_lb_update(struct mlxsw_sp *mlxsw_sp,
				 struct mlxsw_sp_ipip_entry *ipip_entry,
				 bool keep_encap,
				 struct netlink_ext_ack *extack)
{
	struct mlxsw_sp_rif_ipip_lb *old_lb_rif = ipip_entry->ol_lb;
	struct mlxsw_sp_rif_ipip_lb *new_lb_rif;

	new_lb_rif = mlxsw_sp_ipip_ol_ipip_lb_create(mlxsw_sp,
						     ipip_entry->ipipt,
						     ipip_entry->ol_dev,
						     extack);
	if (IS_ERR(new_lb_rif))
		return PTR_ERR(new_lb_rif);
	ipip_entry->ol_lb = new_lb_rif;

	if (keep_encap)
		mlxsw_sp_nexthop_rif_migrate(mlxsw_sp, &old_lb_rif->common,
					     &new_lb_rif->common);

	mlxsw_sp_rif_destroy(&old_lb_rif->common);

	return 0;
}

static void mlxsw_sp_nexthop_rif_update(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_rif *rif);
/**
 * __mlxsw_sp_ipip_entry_update_tunnel - Update offload related to IPIP entry.
 * @mlxsw_sp: mlxsw_sp.
 * @ipip_entry: IPIP entry.
 * @recreate_loopback: Recreates the associated loopback RIF.
 * @keep_encap: Updates next hops that use the tunnel netdevice. This is only
 *              relevant when recreate_loopback is true.
 * @update_nexthops: Updates next hops, keeping the current loopback RIF. This
 *                   is only relevant when recreate_loopback is false.
 * @extack: extack.
 *
 * Return: Non-zero value on failure.
 */
int __mlxsw_sp_ipip_entry_update_tunnel(struct mlxsw_sp *mlxsw_sp,
					struct mlxsw_sp_ipip_entry *ipip_entry,
					bool recreate_loopback,
					bool keep_encap,
					bool update_nexthops,
					struct netlink_ext_ack *extack)
{
	int err;

	/* RIFs can't be edited, so to update loopback, we need to destroy and
	 * recreate it. That creates a window of opportunity where RALUE and
	 * RATR registers end up referencing a RIF that's already gone. RATRs
	 * are handled in mlxsw_sp_ipip_entry_ol_lb_update(), and to take care
	 * of RALUE, demote the decap route back.
	 */
	if (ipip_entry->decap_fib_entry)
		mlxsw_sp_ipip_entry_demote_decap(mlxsw_sp, ipip_entry);

	if (recreate_loopback) {
		err = mlxsw_sp_ipip_entry_ol_lb_update(mlxsw_sp, ipip_entry,
						       keep_encap, extack);
		if (err)
			return err;
	} else if (update_nexthops) {
		mlxsw_sp_nexthop_rif_update(mlxsw_sp,
					    &ipip_entry->ol_lb->common);
	}

	if (ipip_entry->ol_dev->flags & IFF_UP)
		mlxsw_sp_ipip_entry_ol_up_event(mlxsw_sp, ipip_entry);

	return 0;
}

static int mlxsw_sp_netdevice_ipip_ol_vrf_event(struct mlxsw_sp *mlxsw_sp,
						struct net_device *ol_dev,
						struct netlink_ext_ack *extack)
{
	struct mlxsw_sp_ipip_entry *ipip_entry =
		mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);

	if (!ipip_entry)
		return 0;

	return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
						   true, false, false, extack);
}

static int
mlxsw_sp_netdevice_ipip_ul_vrf_event(struct mlxsw_sp *mlxsw_sp,
				     struct mlxsw_sp_ipip_entry *ipip_entry,
				     struct net_device *ul_dev,
				     bool *demote_this,
				     struct netlink_ext_ack *extack)
{
	u32 ul_tb_id = l3mdev_fib_table(ul_dev) ? : RT_TABLE_MAIN;
	enum mlxsw_sp_l3proto ul_proto;
	union mlxsw_sp_l3addr saddr;

	/* Moving underlay to a different VRF might cause local address
	 * conflict, and the conflicting tunnels need to be demoted.
	 */
	ul_proto = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt]->ul_proto;
	saddr = mlxsw_sp_ipip_netdev_saddr(ul_proto, ipip_entry->ol_dev);
	if (mlxsw_sp_ipip_demote_tunnel_by_saddr(mlxsw_sp, ul_proto,
						 saddr, ul_tb_id,
						 ipip_entry)) {
		*demote_this = true;
		return 0;
	}

	return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
						   true, true, false, extack);
}

static int
mlxsw_sp_netdevice_ipip_ul_up_event(struct mlxsw_sp *mlxsw_sp,
				    struct mlxsw_sp_ipip_entry *ipip_entry,
				    struct net_device *ul_dev)
{
	return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
						   false, false, true, NULL);
}

static int
mlxsw_sp_netdevice_ipip_ul_down_event(struct mlxsw_sp *mlxsw_sp,
				      struct mlxsw_sp_ipip_entry *ipip_entry,
				      struct net_device *ul_dev)
{
	/* A down underlay device causes encapsulated packets to not be
	 * forwarded, but decap still works. So refresh next hops without
	 * touching anything else.
	 */
	return __mlxsw_sp_ipip_entry_update_tunnel(mlxsw_sp, ipip_entry,
						   false, false, true, NULL);
}
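/* Illustrative summary, not part of the driver: the flag combinations passed
 * to __mlxsw_sp_ipip_entry_update_tunnel() by the callers above map to three
 * distinct update strategies:
 *
 *	recreate_loopback  keep_encap  update_nexthops  used for
 *	true               false       false            overlay moved to VRF
 *	true               true        false            underlay moved to VRF
 *	false              false       true             underlay up/down
 */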
static int
mlxsw_sp_netdevice_ipip_ol_change_event(struct mlxsw_sp *mlxsw_sp,
					struct net_device *ol_dev,
					struct netlink_ext_ack *extack)
{
	const struct mlxsw_sp_ipip_ops *ipip_ops;
	struct mlxsw_sp_ipip_entry *ipip_entry;
	int err;

	ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, ol_dev);
	if (!ipip_entry)
		/* A change might make a tunnel eligible for offloading, but
		 * that is currently not implemented. What falls to slow path
		 * stays there.
		 */
		return 0;

	/* A change might make a tunnel not eligible for offloading. */
	if (!mlxsw_sp_netdevice_ipip_can_offload(mlxsw_sp, ol_dev,
						 ipip_entry->ipipt)) {
		mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
		return 0;
	}

	ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt];
	err = ipip_ops->ol_netdev_change(mlxsw_sp, ipip_entry, extack);
	return err;
}

void mlxsw_sp_ipip_entry_demote_tunnel(struct mlxsw_sp *mlxsw_sp,
				       struct mlxsw_sp_ipip_entry *ipip_entry)
{
	struct net_device *ol_dev = ipip_entry->ol_dev;

	if (ol_dev->flags & IFF_UP)
		mlxsw_sp_ipip_entry_ol_down_event(mlxsw_sp, ipip_entry);
	mlxsw_sp_ipip_entry_destroy(mlxsw_sp, ipip_entry);
}

/* The configuration where several tunnels have the same local address in the
 * same underlay table needs special treatment in the HW. That is currently not
 * implemented in the driver. This function finds and demotes the first tunnel
 * with a given source address, except the one passed in via the argument
 * `except'.
 */
bool
mlxsw_sp_ipip_demote_tunnel_by_saddr(struct mlxsw_sp *mlxsw_sp,
				     enum mlxsw_sp_l3proto ul_proto,
				     union mlxsw_sp_l3addr saddr,
				     u32 ul_tb_id,
				     const struct mlxsw_sp_ipip_entry *except)
{
	struct mlxsw_sp_ipip_entry *ipip_entry, *tmp;

	list_for_each_entry_safe(ipip_entry, tmp, &mlxsw_sp->router->ipip_list,
				 ipip_list_node) {
		if (ipip_entry != except &&
		    mlxsw_sp_ipip_entry_saddr_matches(mlxsw_sp, ul_proto, saddr,
						      ul_tb_id, ipip_entry)) {
			mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
			return true;
		}
	}

	return false;
}

static void mlxsw_sp_ipip_demote_tunnel_by_ul_netdev(struct mlxsw_sp *mlxsw_sp,
						     struct net_device *ul_dev)
{
	struct mlxsw_sp_ipip_entry *ipip_entry, *tmp;

	list_for_each_entry_safe(ipip_entry, tmp, &mlxsw_sp->router->ipip_list,
				 ipip_list_node) {
		struct net_device *ol_dev = ipip_entry->ol_dev;
		struct net_device *ipip_ul_dev;

		rcu_read_lock();
		ipip_ul_dev = mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev);
		rcu_read_unlock();
		if (ipip_ul_dev == ul_dev)
			mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry);
	}
}

static int mlxsw_sp_netdevice_ipip_ol_event(struct mlxsw_sp *mlxsw_sp,
					    struct net_device *ol_dev,
					    unsigned long event,
					    struct netdev_notifier_info *info)
{
	struct netdev_notifier_changeupper_info *chup;
	struct netlink_ext_ack *extack;
	int err = 0;

	switch (event) {
	case NETDEV_REGISTER:
		err = mlxsw_sp_netdevice_ipip_ol_reg_event(mlxsw_sp, ol_dev);
		break;
	case NETDEV_UNREGISTER:
		mlxsw_sp_netdevice_ipip_ol_unreg_event(mlxsw_sp, ol_dev);
		break;
	case NETDEV_UP:
		mlxsw_sp_netdevice_ipip_ol_up_event(mlxsw_sp, ol_dev);
		break;
	case NETDEV_DOWN:
		mlxsw_sp_netdevice_ipip_ol_down_event(mlxsw_sp, ol_dev);
		break;
	case NETDEV_CHANGEUPPER:
		chup = container_of(info, typeof(*chup), info);
		extack = info->extack;
		if (netif_is_l3_master(chup->upper_dev))
			err = mlxsw_sp_netdevice_ipip_ol_vrf_event(mlxsw_sp,
								   ol_dev,
								   extack);
		break;
	case NETDEV_CHANGE:
		extack = info->extack;
		err = mlxsw_sp_netdevice_ipip_ol_change_event(mlxsw_sp,
							      ol_dev, extack);
		break;
	case NETDEV_CHANGEMTU:
		err = mlxsw_sp_netdevice_ipip_ol_update_mtu(mlxsw_sp, ol_dev);
		break;
	}
	return err;
}
1908 __mlxsw_sp_netdevice_ipip_ul_event(struct mlxsw_sp *mlxsw_sp, 1909 struct mlxsw_sp_ipip_entry *ipip_entry, 1910 struct net_device *ul_dev, 1911 bool *demote_this, 1912 unsigned long event, 1913 struct netdev_notifier_info *info) 1914 { 1915 struct netdev_notifier_changeupper_info *chup; 1916 struct netlink_ext_ack *extack; 1917 1918 switch (event) { 1919 case NETDEV_CHANGEUPPER: 1920 chup = container_of(info, typeof(*chup), info); 1921 extack = info->extack; 1922 if (netif_is_l3_master(chup->upper_dev)) 1923 return mlxsw_sp_netdevice_ipip_ul_vrf_event(mlxsw_sp, 1924 ipip_entry, 1925 ul_dev, 1926 demote_this, 1927 extack); 1928 break; 1929 1930 case NETDEV_UP: 1931 return mlxsw_sp_netdevice_ipip_ul_up_event(mlxsw_sp, ipip_entry, 1932 ul_dev); 1933 case NETDEV_DOWN: 1934 return mlxsw_sp_netdevice_ipip_ul_down_event(mlxsw_sp, 1935 ipip_entry, 1936 ul_dev); 1937 } 1938 return 0; 1939 } 1940 1941 static int 1942 mlxsw_sp_netdevice_ipip_ul_event(struct mlxsw_sp *mlxsw_sp, 1943 struct net_device *ul_dev, 1944 unsigned long event, 1945 struct netdev_notifier_info *info) 1946 { 1947 struct mlxsw_sp_ipip_entry *ipip_entry = NULL; 1948 int err; 1949 1950 while ((ipip_entry = mlxsw_sp_ipip_entry_find_by_ul_dev(mlxsw_sp, 1951 ul_dev, 1952 ipip_entry))) { 1953 struct mlxsw_sp_ipip_entry *prev; 1954 bool demote_this = false; 1955 1956 err = __mlxsw_sp_netdevice_ipip_ul_event(mlxsw_sp, ipip_entry, 1957 ul_dev, &demote_this, 1958 event, info); 1959 if (err) { 1960 mlxsw_sp_ipip_demote_tunnel_by_ul_netdev(mlxsw_sp, 1961 ul_dev); 1962 return err; 1963 } 1964 1965 if (demote_this) { 1966 if (list_is_first(&ipip_entry->ipip_list_node, 1967 &mlxsw_sp->router->ipip_list)) 1968 prev = NULL; 1969 else 1970 /* This can't be cached from previous iteration, 1971 * because that entry could be gone now. 
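* (mlxsw_sp_ipip_entry_demote_tunnel() frees every entry it demotes).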
1972 */ 1973 prev = list_prev_entry(ipip_entry, 1974 ipip_list_node); 1975 mlxsw_sp_ipip_entry_demote_tunnel(mlxsw_sp, ipip_entry); 1976 ipip_entry = prev; 1977 } 1978 } 1979 1980 return 0; 1981 } 1982 1983 int mlxsw_sp_router_nve_promote_decap(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id, 1984 enum mlxsw_sp_l3proto ul_proto, 1985 const union mlxsw_sp_l3addr *ul_sip, 1986 u32 tunnel_index) 1987 { 1988 enum mlxsw_sp_fib_entry_type type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP; 1989 struct mlxsw_sp_router *router = mlxsw_sp->router; 1990 struct mlxsw_sp_fib_entry *fib_entry; 1991 int err = 0; 1992 1993 mutex_lock(&mlxsw_sp->router->lock); 1994 1995 if (WARN_ON_ONCE(router->nve_decap_config.valid)) { 1996 err = -EINVAL; 1997 goto out; 1998 } 1999 2000 router->nve_decap_config.ul_tb_id = ul_tb_id; 2001 router->nve_decap_config.tunnel_index = tunnel_index; 2002 router->nve_decap_config.ul_proto = ul_proto; 2003 router->nve_decap_config.ul_sip = *ul_sip; 2004 router->nve_decap_config.valid = true; 2005 2006 /* It is valid to create a tunnel with a local IP and only later 2007 * assign this IP address to a local interface 2008 */ 2009 fib_entry = mlxsw_sp_router_ip2me_fib_entry_find(mlxsw_sp, ul_tb_id, 2010 ul_proto, ul_sip, 2011 type); 2012 if (!fib_entry) 2013 goto out; 2014 2015 fib_entry->decap.tunnel_index = tunnel_index; 2016 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP; 2017 2018 err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry); 2019 if (err) 2020 goto err_fib_entry_update; 2021 2022 goto out; 2023 2024 err_fib_entry_update: 2025 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP; 2026 mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry); 2027 out: 2028 mutex_unlock(&mlxsw_sp->router->lock); 2029 return err; 2030 } 2031 2032 void mlxsw_sp_router_nve_demote_decap(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id, 2033 enum mlxsw_sp_l3proto ul_proto, 2034 const union mlxsw_sp_l3addr *ul_sip) 2035 { 2036 enum mlxsw_sp_fib_entry_type type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP; 2037 struct mlxsw_sp_router *router = mlxsw_sp->router; 2038 struct mlxsw_sp_fib_entry *fib_entry; 2039 2040 mutex_lock(&mlxsw_sp->router->lock); 2041 2042 if (WARN_ON_ONCE(!router->nve_decap_config.valid)) 2043 goto out; 2044 2045 router->nve_decap_config.valid = false; 2046 2047 fib_entry = mlxsw_sp_router_ip2me_fib_entry_find(mlxsw_sp, ul_tb_id, 2048 ul_proto, ul_sip, 2049 type); 2050 if (!fib_entry) 2051 goto out; 2052 2053 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP; 2054 mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry); 2055 out: 2056 mutex_unlock(&mlxsw_sp->router->lock); 2057 } 2058 2059 static bool mlxsw_sp_router_nve_is_decap(struct mlxsw_sp *mlxsw_sp, 2060 u32 ul_tb_id, 2061 enum mlxsw_sp_l3proto ul_proto, 2062 const union mlxsw_sp_l3addr *ul_sip) 2063 { 2064 struct mlxsw_sp_router *router = mlxsw_sp->router; 2065 2066 return router->nve_decap_config.valid && 2067 router->nve_decap_config.ul_tb_id == ul_tb_id && 2068 router->nve_decap_config.ul_proto == ul_proto && 2069 !memcmp(&router->nve_decap_config.ul_sip, ul_sip, 2070 sizeof(*ul_sip)); 2071 } 2072 2073 struct mlxsw_sp_neigh_key { 2074 struct neighbour *n; 2075 }; 2076 2077 struct mlxsw_sp_neigh_entry { 2078 struct list_head rif_list_node; 2079 struct rhash_head ht_node; 2080 struct mlxsw_sp_neigh_key key; 2081 u16 rif; 2082 bool connected; 2083 unsigned char ha[ETH_ALEN]; 2084 struct list_head nexthop_list; /* list of nexthops using 2085 * this neigh entry 2086 */ 2087 struct list_head nexthop_neighs_list_node; 2088 unsigned int counter_index; 2089 bool counter_valid; 2090 }; 
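/* Driver neighbour entries live in a hash table keyed by the kernel's struct neighbour pointer (struct mlxsw_sp_neigh_key), so a given kernel neighbour maps to at most one driver entry. */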
2091 2092 static const struct rhashtable_params mlxsw_sp_neigh_ht_params = { 2093 .key_offset = offsetof(struct mlxsw_sp_neigh_entry, key), 2094 .head_offset = offsetof(struct mlxsw_sp_neigh_entry, ht_node), 2095 .key_len = sizeof(struct mlxsw_sp_neigh_key), 2096 }; 2097 2098 struct mlxsw_sp_neigh_entry * 2099 mlxsw_sp_rif_neigh_next(struct mlxsw_sp_rif *rif, 2100 struct mlxsw_sp_neigh_entry *neigh_entry) 2101 { 2102 if (!neigh_entry) { 2103 if (list_empty(&rif->neigh_list)) 2104 return NULL; 2105 else 2106 return list_first_entry(&rif->neigh_list, 2107 typeof(*neigh_entry), 2108 rif_list_node); 2109 } 2110 if (list_is_last(&neigh_entry->rif_list_node, &rif->neigh_list)) 2111 return NULL; 2112 return list_next_entry(neigh_entry, rif_list_node); 2113 } 2114 2115 int mlxsw_sp_neigh_entry_type(struct mlxsw_sp_neigh_entry *neigh_entry) 2116 { 2117 return neigh_entry->key.n->tbl->family; 2118 } 2119 2120 unsigned char * 2121 mlxsw_sp_neigh_entry_ha(struct mlxsw_sp_neigh_entry *neigh_entry) 2122 { 2123 return neigh_entry->ha; 2124 } 2125 2126 u32 mlxsw_sp_neigh4_entry_dip(struct mlxsw_sp_neigh_entry *neigh_entry) 2127 { 2128 struct neighbour *n; 2129 2130 n = neigh_entry->key.n; 2131 return ntohl(*((__be32 *) n->primary_key)); 2132 } 2133 2134 struct in6_addr * 2135 mlxsw_sp_neigh6_entry_dip(struct mlxsw_sp_neigh_entry *neigh_entry) 2136 { 2137 struct neighbour *n; 2138 2139 n = neigh_entry->key.n; 2140 return (struct in6_addr *) &n->primary_key; 2141 } 2142 2143 int mlxsw_sp_neigh_counter_get(struct mlxsw_sp *mlxsw_sp, 2144 struct mlxsw_sp_neigh_entry *neigh_entry, 2145 u64 *p_counter) 2146 { 2147 if (!neigh_entry->counter_valid) 2148 return -EINVAL; 2149 2150 return mlxsw_sp_flow_counter_get(mlxsw_sp, neigh_entry->counter_index, 2151 p_counter, NULL); 2152 } 2153 2154 static struct mlxsw_sp_neigh_entry * 2155 mlxsw_sp_neigh_entry_alloc(struct mlxsw_sp *mlxsw_sp, struct neighbour *n, 2156 u16 rif) 2157 { 2158 struct mlxsw_sp_neigh_entry *neigh_entry; 2159 2160 neigh_entry = kzalloc(sizeof(*neigh_entry), GFP_KERNEL); 2161 if (!neigh_entry) 2162 return NULL; 2163 2164 neigh_entry->key.n = n; 2165 neigh_entry->rif = rif; 2166 INIT_LIST_HEAD(&neigh_entry->nexthop_list); 2167 2168 return neigh_entry; 2169 } 2170 2171 static void mlxsw_sp_neigh_entry_free(struct mlxsw_sp_neigh_entry *neigh_entry) 2172 { 2173 kfree(neigh_entry); 2174 } 2175 2176 static int 2177 mlxsw_sp_neigh_entry_insert(struct mlxsw_sp *mlxsw_sp, 2178 struct mlxsw_sp_neigh_entry *neigh_entry) 2179 { 2180 return rhashtable_insert_fast(&mlxsw_sp->router->neigh_ht, 2181 &neigh_entry->ht_node, 2182 mlxsw_sp_neigh_ht_params); 2183 } 2184 2185 static void 2186 mlxsw_sp_neigh_entry_remove(struct mlxsw_sp *mlxsw_sp, 2187 struct mlxsw_sp_neigh_entry *neigh_entry) 2188 { 2189 rhashtable_remove_fast(&mlxsw_sp->router->neigh_ht, 2190 &neigh_entry->ht_node, 2191 mlxsw_sp_neigh_ht_params); 2192 } 2193 2194 static bool 2195 mlxsw_sp_neigh_counter_should_alloc(struct mlxsw_sp *mlxsw_sp, 2196 struct mlxsw_sp_neigh_entry *neigh_entry) 2197 { 2198 struct devlink *devlink; 2199 const char *table_name; 2200 2201 switch (mlxsw_sp_neigh_entry_type(neigh_entry)) { 2202 case AF_INET: 2203 table_name = MLXSW_SP_DPIPE_TABLE_NAME_HOST4; 2204 break; 2205 case AF_INET6: 2206 table_name = MLXSW_SP_DPIPE_TABLE_NAME_HOST6; 2207 break; 2208 default: 2209 WARN_ON(1); 2210 return false; 2211 } 2212 2213 devlink = priv_to_devlink(mlxsw_sp->core); 2214 return devlink_dpipe_table_counter_enabled(devlink, table_name); 2215 } 2216 2217 static void 2218 
mlxsw_sp_neigh_counter_alloc(struct mlxsw_sp *mlxsw_sp, 2219 struct mlxsw_sp_neigh_entry *neigh_entry) 2220 { 2221 if (!mlxsw_sp_neigh_counter_should_alloc(mlxsw_sp, neigh_entry)) 2222 return; 2223 2224 if (mlxsw_sp_flow_counter_alloc(mlxsw_sp, &neigh_entry->counter_index)) 2225 return; 2226 2227 neigh_entry->counter_valid = true; 2228 } 2229 2230 static void 2231 mlxsw_sp_neigh_counter_free(struct mlxsw_sp *mlxsw_sp, 2232 struct mlxsw_sp_neigh_entry *neigh_entry) 2233 { 2234 if (!neigh_entry->counter_valid) 2235 return; 2236 mlxsw_sp_flow_counter_free(mlxsw_sp, 2237 neigh_entry->counter_index); 2238 neigh_entry->counter_valid = false; 2239 } 2240 2241 static struct mlxsw_sp_neigh_entry * 2242 mlxsw_sp_neigh_entry_create(struct mlxsw_sp *mlxsw_sp, struct neighbour *n) 2243 { 2244 struct mlxsw_sp_neigh_entry *neigh_entry; 2245 struct mlxsw_sp_rif *rif; 2246 int err; 2247 2248 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, n->dev); 2249 if (!rif) 2250 return ERR_PTR(-EINVAL); 2251 2252 neigh_entry = mlxsw_sp_neigh_entry_alloc(mlxsw_sp, n, rif->rif_index); 2253 if (!neigh_entry) 2254 return ERR_PTR(-ENOMEM); 2255 2256 err = mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry); 2257 if (err) 2258 goto err_neigh_entry_insert; 2259 2260 mlxsw_sp_neigh_counter_alloc(mlxsw_sp, neigh_entry); 2261 atomic_inc(&mlxsw_sp->router->neighs_update.neigh_count); 2262 list_add(&neigh_entry->rif_list_node, &rif->neigh_list); 2263 2264 return neigh_entry; 2265 2266 err_neigh_entry_insert: 2267 mlxsw_sp_neigh_entry_free(neigh_entry); 2268 return ERR_PTR(err); 2269 } 2270 2271 static void 2272 mlxsw_sp_neigh_entry_destroy(struct mlxsw_sp *mlxsw_sp, 2273 struct mlxsw_sp_neigh_entry *neigh_entry) 2274 { 2275 list_del(&neigh_entry->rif_list_node); 2276 atomic_dec(&mlxsw_sp->router->neighs_update.neigh_count); 2277 mlxsw_sp_neigh_counter_free(mlxsw_sp, neigh_entry); 2278 mlxsw_sp_neigh_entry_remove(mlxsw_sp, neigh_entry); 2279 mlxsw_sp_neigh_entry_free(neigh_entry); 2280 } 2281 2282 static struct mlxsw_sp_neigh_entry * 2283 mlxsw_sp_neigh_entry_lookup(struct mlxsw_sp *mlxsw_sp, struct neighbour *n) 2284 { 2285 struct mlxsw_sp_neigh_key key; 2286 2287 key.n = n; 2288 return rhashtable_lookup_fast(&mlxsw_sp->router->neigh_ht, 2289 &key, mlxsw_sp_neigh_ht_params); 2290 } 2291 2292 static void 2293 mlxsw_sp_router_neighs_update_interval_init(struct mlxsw_sp *mlxsw_sp) 2294 { 2295 unsigned long interval; 2296 2297 #if IS_ENABLED(CONFIG_IPV6) 2298 interval = min_t(unsigned long, 2299 NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME), 2300 NEIGH_VAR(&nd_tbl.parms, DELAY_PROBE_TIME)); 2301 #else 2302 interval = NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME); 2303 #endif 2304 mlxsw_sp->router->neighs_update.interval = jiffies_to_msecs(interval); 2305 } 2306 2307 static void mlxsw_sp_router_neigh_ent_ipv4_process(struct mlxsw_sp *mlxsw_sp, 2308 char *rauhtd_pl, 2309 int ent_index) 2310 { 2311 u64 max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); 2312 struct net_device *dev; 2313 struct neighbour *n; 2314 __be32 dipn; 2315 u32 dip; 2316 u16 rif; 2317 2318 mlxsw_reg_rauhtd_ent_ipv4_unpack(rauhtd_pl, ent_index, &rif, &dip); 2319 2320 if (WARN_ON_ONCE(rif >= max_rifs)) 2321 return; 2322 if (!mlxsw_sp->router->rifs[rif]) { 2323 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n"); 2324 return; 2325 } 2326 2327 dipn = htonl(dip); 2328 dev = mlxsw_sp->router->rifs[rif]->dev; 2329 n = neigh_lookup(&arp_tbl, &dipn, dev); 2330 if (!n) 2331 return; 2332 2333 netdev_dbg(dev, "Updating neighbour with IP=%pI4h\n", 
&dip); 2334 neigh_event_send(n, NULL); 2335 neigh_release(n); 2336 } 2337 2338 #if IS_ENABLED(CONFIG_IPV6) 2339 static void mlxsw_sp_router_neigh_ent_ipv6_process(struct mlxsw_sp *mlxsw_sp, 2340 char *rauhtd_pl, 2341 int rec_index) 2342 { 2343 struct net_device *dev; 2344 struct neighbour *n; 2345 struct in6_addr dip; 2346 u16 rif; 2347 2348 mlxsw_reg_rauhtd_ent_ipv6_unpack(rauhtd_pl, rec_index, &rif, 2349 (char *) &dip); 2350 2351 if (!mlxsw_sp->router->rifs[rif]) { 2352 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n"); 2353 return; 2354 } 2355 2356 dev = mlxsw_sp->router->rifs[rif]->dev; 2357 n = neigh_lookup(&nd_tbl, &dip, dev); 2358 if (!n) 2359 return; 2360 2361 netdev_dbg(dev, "Updating neighbour with IP=%pI6c\n", &dip); 2362 neigh_event_send(n, NULL); 2363 neigh_release(n); 2364 } 2365 #else 2366 static void mlxsw_sp_router_neigh_ent_ipv6_process(struct mlxsw_sp *mlxsw_sp, 2367 char *rauhtd_pl, 2368 int rec_index) 2369 { 2370 } 2371 #endif 2372 2373 static void mlxsw_sp_router_neigh_rec_ipv4_process(struct mlxsw_sp *mlxsw_sp, 2374 char *rauhtd_pl, 2375 int rec_index) 2376 { 2377 u8 num_entries; 2378 int i; 2379 2380 num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl, 2381 rec_index); 2382 /* Hardware starts counting at 0, so add 1. */ 2383 num_entries++; 2384 2385 /* Each record consists of several neighbour entries. */ 2386 for (i = 0; i < num_entries; i++) { 2387 int ent_index; 2388 2389 ent_index = rec_index * MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC + i; 2390 mlxsw_sp_router_neigh_ent_ipv4_process(mlxsw_sp, rauhtd_pl, 2391 ent_index); 2392 } 2393 2394 } 2395 2396 static void mlxsw_sp_router_neigh_rec_ipv6_process(struct mlxsw_sp *mlxsw_sp, 2397 char *rauhtd_pl, 2398 int rec_index) 2399 { 2400 /* One record contains one entry. */ 2401 mlxsw_sp_router_neigh_ent_ipv6_process(mlxsw_sp, rauhtd_pl, 2402 rec_index); 2403 } 2404 2405 static void mlxsw_sp_router_neigh_rec_process(struct mlxsw_sp *mlxsw_sp, 2406 char *rauhtd_pl, int rec_index) 2407 { 2408 switch (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, rec_index)) { 2409 case MLXSW_REG_RAUHTD_TYPE_IPV4: 2410 mlxsw_sp_router_neigh_rec_ipv4_process(mlxsw_sp, rauhtd_pl, 2411 rec_index); 2412 break; 2413 case MLXSW_REG_RAUHTD_TYPE_IPV6: 2414 mlxsw_sp_router_neigh_rec_ipv6_process(mlxsw_sp, rauhtd_pl, 2415 rec_index); 2416 break; 2417 } 2418 } 2419 2420 static bool mlxsw_sp_router_rauhtd_is_full(char *rauhtd_pl) 2421 { 2422 u8 num_rec, last_rec_index, num_entries; 2423 2424 num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl); 2425 last_rec_index = num_rec - 1; 2426 2427 if (num_rec < MLXSW_REG_RAUHTD_REC_MAX_NUM) 2428 return false; 2429 if (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, last_rec_index) == 2430 MLXSW_REG_RAUHTD_TYPE_IPV6) 2431 return true; 2432 2433 num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl, 2434 last_rec_index); 2435 if (++num_entries == MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC) 2436 return true; 2437 return false; 2438 } 2439 2440 static int 2441 __mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp, 2442 char *rauhtd_pl, 2443 enum mlxsw_reg_rauhtd_type type) 2444 { 2445 int i, num_rec; 2446 int err; 2447 2448 /* Ensure the RIF we read from the device does not change mid-dump. 
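* The router lock is held across the whole RAUHTD dump below for that reason.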
*/ 2449 mutex_lock(&mlxsw_sp->router->lock); 2450 do { 2451 mlxsw_reg_rauhtd_pack(rauhtd_pl, type); 2452 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(rauhtd), 2453 rauhtd_pl); 2454 if (err) { 2455 dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Failed to dump neighbour table\n"); 2456 break; 2457 } 2458 num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl); 2459 for (i = 0; i < num_rec; i++) 2460 mlxsw_sp_router_neigh_rec_process(mlxsw_sp, rauhtd_pl, 2461 i); 2462 } while (mlxsw_sp_router_rauhtd_is_full(rauhtd_pl)); 2463 mutex_unlock(&mlxsw_sp->router->lock); 2464 2465 return err; 2466 } 2467 2468 static int mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp) 2469 { 2470 enum mlxsw_reg_rauhtd_type type; 2471 char *rauhtd_pl; 2472 int err; 2473 2474 if (!atomic_read(&mlxsw_sp->router->neighs_update.neigh_count)) 2475 return 0; 2476 2477 rauhtd_pl = kmalloc(MLXSW_REG_RAUHTD_LEN, GFP_KERNEL); 2478 if (!rauhtd_pl) 2479 return -ENOMEM; 2480 2481 type = MLXSW_REG_RAUHTD_TYPE_IPV4; 2482 err = __mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp, rauhtd_pl, type); 2483 if (err) 2484 goto out; 2485 2486 type = MLXSW_REG_RAUHTD_TYPE_IPV6; 2487 err = __mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp, rauhtd_pl, type); 2488 out: 2489 kfree(rauhtd_pl); 2490 return err; 2491 } 2492 2493 static void mlxsw_sp_router_neighs_update_nh(struct mlxsw_sp *mlxsw_sp) 2494 { 2495 struct mlxsw_sp_neigh_entry *neigh_entry; 2496 2497 mutex_lock(&mlxsw_sp->router->lock); 2498 list_for_each_entry(neigh_entry, &mlxsw_sp->router->nexthop_neighs_list, 2499 nexthop_neighs_list_node) 2500 /* If this neigh has nexthops, make the kernel think this neigh 2501 * is active regardless of the traffic. 2502 */ 2503 neigh_event_send(neigh_entry->key.n, NULL); 2504 mutex_unlock(&mlxsw_sp->router->lock); 2505 } 2506 2507 static void 2508 mlxsw_sp_router_neighs_update_work_schedule(struct mlxsw_sp *mlxsw_sp) 2509 { 2510 unsigned long interval = mlxsw_sp->router->neighs_update.interval; 2511 2512 mlxsw_core_schedule_dw(&mlxsw_sp->router->neighs_update.dw, 2513 msecs_to_jiffies(interval)); 2514 } 2515 2516 static void mlxsw_sp_router_neighs_update_work(struct work_struct *work) 2517 { 2518 struct mlxsw_sp_router *router; 2519 int err; 2520 2521 router = container_of(work, struct mlxsw_sp_router, 2522 neighs_update.dw.work); 2523 err = mlxsw_sp_router_neighs_update_rauhtd(router->mlxsw_sp); 2524 if (err) 2525 dev_err(router->mlxsw_sp->bus_info->dev, "Could not update kernel for neigh activity\n"); 2526 2527 mlxsw_sp_router_neighs_update_nh(router->mlxsw_sp); 2528 2529 mlxsw_sp_router_neighs_update_work_schedule(router->mlxsw_sp); 2530 } 2531 2532 static void mlxsw_sp_router_probe_unresolved_nexthops(struct work_struct *work) 2533 { 2534 struct mlxsw_sp_neigh_entry *neigh_entry; 2535 struct mlxsw_sp_router *router; 2536 2537 router = container_of(work, struct mlxsw_sp_router, 2538 nexthop_probe_dw.work); 2539 /* Iterate over nexthop neighbours, find those that are unresolved and 2540 * send ARP on them. This solves the chicken-and-egg problem where a 2541 * nexthop would not get offloaded until its neighbour is resolved, but 2542 * the neighbour would never get resolved as long as traffic is flowing 2543 * in HW using a different nexthop.
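* For example, when only one neighbour of an ECMP group is resolved, the device may keep hashing all flows to that resolved nexthop, so the remaining neighbours would never be probed by traffic.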
2544 */ 2545 mutex_lock(&router->lock); 2546 list_for_each_entry(neigh_entry, &router->nexthop_neighs_list, 2547 nexthop_neighs_list_node) 2548 if (!neigh_entry->connected) 2549 neigh_event_send(neigh_entry->key.n, NULL); 2550 mutex_unlock(&router->lock); 2551 2552 mlxsw_core_schedule_dw(&router->nexthop_probe_dw, 2553 MLXSW_SP_UNRESOLVED_NH_PROBE_INTERVAL); 2554 } 2555 2556 static void 2557 mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp, 2558 struct mlxsw_sp_neigh_entry *neigh_entry, 2559 bool removing, bool dead); 2560 2561 static enum mlxsw_reg_rauht_op mlxsw_sp_rauht_op(bool adding) 2562 { 2563 return adding ? MLXSW_REG_RAUHT_OP_WRITE_ADD : 2564 MLXSW_REG_RAUHT_OP_WRITE_DELETE; 2565 } 2566 2567 static int 2568 mlxsw_sp_router_neigh_entry_op4(struct mlxsw_sp *mlxsw_sp, 2569 struct mlxsw_sp_neigh_entry *neigh_entry, 2570 enum mlxsw_reg_rauht_op op) 2571 { 2572 struct neighbour *n = neigh_entry->key.n; 2573 u32 dip = ntohl(*((__be32 *) n->primary_key)); 2574 char rauht_pl[MLXSW_REG_RAUHT_LEN]; 2575 2576 mlxsw_reg_rauht_pack4(rauht_pl, op, neigh_entry->rif, neigh_entry->ha, 2577 dip); 2578 if (neigh_entry->counter_valid) 2579 mlxsw_reg_rauht_pack_counter(rauht_pl, 2580 neigh_entry->counter_index); 2581 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), rauht_pl); 2582 } 2583 2584 static int 2585 mlxsw_sp_router_neigh_entry_op6(struct mlxsw_sp *mlxsw_sp, 2586 struct mlxsw_sp_neigh_entry *neigh_entry, 2587 enum mlxsw_reg_rauht_op op) 2588 { 2589 struct neighbour *n = neigh_entry->key.n; 2590 char rauht_pl[MLXSW_REG_RAUHT_LEN]; 2591 const char *dip = n->primary_key; 2592 2593 mlxsw_reg_rauht_pack6(rauht_pl, op, neigh_entry->rif, neigh_entry->ha, 2594 dip); 2595 if (neigh_entry->counter_valid) 2596 mlxsw_reg_rauht_pack_counter(rauht_pl, 2597 neigh_entry->counter_index); 2598 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), rauht_pl); 2599 } 2600 2601 bool mlxsw_sp_neigh_ipv6_ignore(struct mlxsw_sp_neigh_entry *neigh_entry) 2602 { 2603 struct neighbour *n = neigh_entry->key.n; 2604 2605 /* Packets with a link-local destination address are trapped 2606 * after LPM lookup and never reach the neighbour table, so 2607 * there is no need to program such neighbours to the device. 
2608 */ 2609 if (ipv6_addr_type((struct in6_addr *) &n->primary_key) & 2610 IPV6_ADDR_LINKLOCAL) 2611 return true; 2612 return false; 2613 } 2614 2615 static void 2616 mlxsw_sp_neigh_entry_update(struct mlxsw_sp *mlxsw_sp, 2617 struct mlxsw_sp_neigh_entry *neigh_entry, 2618 bool adding) 2619 { 2620 enum mlxsw_reg_rauht_op op = mlxsw_sp_rauht_op(adding); 2621 int err; 2622 2623 if (!adding && !neigh_entry->connected) 2624 return; 2625 neigh_entry->connected = adding; 2626 if (neigh_entry->key.n->tbl->family == AF_INET) { 2627 err = mlxsw_sp_router_neigh_entry_op4(mlxsw_sp, neigh_entry, 2628 op); 2629 if (err) 2630 return; 2631 } else if (neigh_entry->key.n->tbl->family == AF_INET6) { 2632 if (mlxsw_sp_neigh_ipv6_ignore(neigh_entry)) 2633 return; 2634 err = mlxsw_sp_router_neigh_entry_op6(mlxsw_sp, neigh_entry, 2635 op); 2636 if (err) 2637 return; 2638 } else { 2639 WARN_ON_ONCE(1); 2640 return; 2641 } 2642 2643 if (adding) 2644 neigh_entry->key.n->flags |= NTF_OFFLOADED; 2645 else 2646 neigh_entry->key.n->flags &= ~NTF_OFFLOADED; 2647 } 2648 2649 void 2650 mlxsw_sp_neigh_entry_counter_update(struct mlxsw_sp *mlxsw_sp, 2651 struct mlxsw_sp_neigh_entry *neigh_entry, 2652 bool adding) 2653 { 2654 if (adding) 2655 mlxsw_sp_neigh_counter_alloc(mlxsw_sp, neigh_entry); 2656 else 2657 mlxsw_sp_neigh_counter_free(mlxsw_sp, neigh_entry); 2658 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, true); 2659 } 2660 2661 struct mlxsw_sp_netevent_work { 2662 struct work_struct work; 2663 struct mlxsw_sp *mlxsw_sp; 2664 struct neighbour *n; 2665 }; 2666 2667 static void mlxsw_sp_router_neigh_event_work(struct work_struct *work) 2668 { 2669 struct mlxsw_sp_netevent_work *net_work = 2670 container_of(work, struct mlxsw_sp_netevent_work, work); 2671 struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp; 2672 struct mlxsw_sp_neigh_entry *neigh_entry; 2673 struct neighbour *n = net_work->n; 2674 unsigned char ha[ETH_ALEN]; 2675 bool entry_connected; 2676 u8 nud_state, dead; 2677 2678 /* If these parameters are changed after we release the lock, 2679 * then we are guaranteed to receive another event letting us 2680 * know about it. 
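* It is therefore safe to act on the snapshot of ha, nud_state and dead taken under the read lock below.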
2681 */ 2682 read_lock_bh(&n->lock); 2683 memcpy(ha, n->ha, ETH_ALEN); 2684 nud_state = n->nud_state; 2685 dead = n->dead; 2686 read_unlock_bh(&n->lock); 2687 2688 mutex_lock(&mlxsw_sp->router->lock); 2689 mlxsw_sp_span_respin(mlxsw_sp); 2690 2691 entry_connected = nud_state & NUD_VALID && !dead; 2692 neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, n); 2693 if (!entry_connected && !neigh_entry) 2694 goto out; 2695 if (!neigh_entry) { 2696 neigh_entry = mlxsw_sp_neigh_entry_create(mlxsw_sp, n); 2697 if (IS_ERR(neigh_entry)) 2698 goto out; 2699 } 2700 2701 if (neigh_entry->connected && entry_connected && 2702 !memcmp(neigh_entry->ha, ha, ETH_ALEN)) 2703 goto out; 2704 2705 memcpy(neigh_entry->ha, ha, ETH_ALEN); 2706 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, entry_connected); 2707 mlxsw_sp_nexthop_neigh_update(mlxsw_sp, neigh_entry, !entry_connected, 2708 dead); 2709 2710 if (!neigh_entry->connected && list_empty(&neigh_entry->nexthop_list)) 2711 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry); 2712 2713 out: 2714 mutex_unlock(&mlxsw_sp->router->lock); 2715 neigh_release(n); 2716 kfree(net_work); 2717 } 2718 2719 static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp); 2720 2721 static void mlxsw_sp_router_mp_hash_event_work(struct work_struct *work) 2722 { 2723 struct mlxsw_sp_netevent_work *net_work = 2724 container_of(work, struct mlxsw_sp_netevent_work, work); 2725 struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp; 2726 2727 mlxsw_sp_mp_hash_init(mlxsw_sp); 2728 kfree(net_work); 2729 } 2730 2731 static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp); 2732 2733 static void mlxsw_sp_router_update_priority_work(struct work_struct *work) 2734 { 2735 struct mlxsw_sp_netevent_work *net_work = 2736 container_of(work, struct mlxsw_sp_netevent_work, work); 2737 struct mlxsw_sp *mlxsw_sp = net_work->mlxsw_sp; 2738 2739 __mlxsw_sp_router_init(mlxsw_sp); 2740 kfree(net_work); 2741 } 2742 2743 static int mlxsw_sp_router_schedule_work(struct net *net, 2744 struct notifier_block *nb, 2745 void (*cb)(struct work_struct *)) 2746 { 2747 struct mlxsw_sp_netevent_work *net_work; 2748 struct mlxsw_sp_router *router; 2749 2750 router = container_of(nb, struct mlxsw_sp_router, netevent_nb); 2751 if (!net_eq(net, mlxsw_sp_net(router->mlxsw_sp))) 2752 return NOTIFY_DONE; 2753 2754 net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC); 2755 if (!net_work) 2756 return NOTIFY_BAD; 2757 2758 INIT_WORK(&net_work->work, cb); 2759 net_work->mlxsw_sp = router->mlxsw_sp; 2760 mlxsw_core_schedule_work(&net_work->work); 2761 return NOTIFY_DONE; 2762 } 2763 2764 static int mlxsw_sp_router_netevent_event(struct notifier_block *nb, 2765 unsigned long event, void *ptr) 2766 { 2767 struct mlxsw_sp_netevent_work *net_work; 2768 struct mlxsw_sp_port *mlxsw_sp_port; 2769 struct mlxsw_sp *mlxsw_sp; 2770 unsigned long interval; 2771 struct neigh_parms *p; 2772 struct neighbour *n; 2773 2774 switch (event) { 2775 case NETEVENT_DELAY_PROBE_TIME_UPDATE: 2776 p = ptr; 2777 2778 /* We don't care about changes in the default table. */ 2779 if (!p->dev || (p->tbl->family != AF_INET && 2780 p->tbl->family != AF_INET6)) 2781 return NOTIFY_DONE; 2782 2783 /* We are in atomic context and can't take RTNL mutex, 2784 * so use RCU variant to walk the device chain. 
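* mlxsw_sp_port_lower_dev_hold() takes a reference on the port, which is dropped via mlxsw_sp_port_dev_put() once the interval has been updated.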
2785 */ 2786 mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(p->dev); 2787 if (!mlxsw_sp_port) 2788 return NOTIFY_DONE; 2789 2790 mlxsw_sp = mlxsw_sp_port->mlxsw_sp; 2791 interval = jiffies_to_msecs(NEIGH_VAR(p, DELAY_PROBE_TIME)); 2792 mlxsw_sp->router->neighs_update.interval = interval; 2793 2794 mlxsw_sp_port_dev_put(mlxsw_sp_port); 2795 break; 2796 case NETEVENT_NEIGH_UPDATE: 2797 n = ptr; 2798 2799 if (n->tbl->family != AF_INET && n->tbl->family != AF_INET6) 2800 return NOTIFY_DONE; 2801 2802 mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(n->dev); 2803 if (!mlxsw_sp_port) 2804 return NOTIFY_DONE; 2805 2806 net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC); 2807 if (!net_work) { 2808 mlxsw_sp_port_dev_put(mlxsw_sp_port); 2809 return NOTIFY_BAD; 2810 } 2811 2812 INIT_WORK(&net_work->work, mlxsw_sp_router_neigh_event_work); 2813 net_work->mlxsw_sp = mlxsw_sp_port->mlxsw_sp; 2814 net_work->n = n; 2815 2816 /* Take a reference to ensure the neighbour won't be 2817 * destructed until we drop the reference in delayed 2818 * work. 2819 */ 2820 neigh_clone(n); 2821 mlxsw_core_schedule_work(&net_work->work); 2822 mlxsw_sp_port_dev_put(mlxsw_sp_port); 2823 break; 2824 case NETEVENT_IPV4_MPATH_HASH_UPDATE: 2825 case NETEVENT_IPV6_MPATH_HASH_UPDATE: 2826 return mlxsw_sp_router_schedule_work(ptr, nb, 2827 mlxsw_sp_router_mp_hash_event_work); 2828 2829 case NETEVENT_IPV4_FWD_UPDATE_PRIORITY_UPDATE: 2830 return mlxsw_sp_router_schedule_work(ptr, nb, 2831 mlxsw_sp_router_update_priority_work); 2832 } 2833 2834 return NOTIFY_DONE; 2835 } 2836 2837 static int mlxsw_sp_neigh_init(struct mlxsw_sp *mlxsw_sp) 2838 { 2839 int err; 2840 2841 err = rhashtable_init(&mlxsw_sp->router->neigh_ht, 2842 &mlxsw_sp_neigh_ht_params); 2843 if (err) 2844 return err; 2845 2846 /* Initialize the polling interval according to the default 2847 * table. 
2848 */ 2849 mlxsw_sp_router_neighs_update_interval_init(mlxsw_sp); 2850 2851 /* Create the delayed works for the activity_update */ 2852 INIT_DELAYED_WORK(&mlxsw_sp->router->neighs_update.dw, 2853 mlxsw_sp_router_neighs_update_work); 2854 INIT_DELAYED_WORK(&mlxsw_sp->router->nexthop_probe_dw, 2855 mlxsw_sp_router_probe_unresolved_nexthops); 2856 atomic_set(&mlxsw_sp->router->neighs_update.neigh_count, 0); 2857 mlxsw_core_schedule_dw(&mlxsw_sp->router->neighs_update.dw, 0); 2858 mlxsw_core_schedule_dw(&mlxsw_sp->router->nexthop_probe_dw, 0); 2859 return 0; 2860 } 2861 2862 static void mlxsw_sp_neigh_fini(struct mlxsw_sp *mlxsw_sp) 2863 { 2864 cancel_delayed_work_sync(&mlxsw_sp->router->neighs_update.dw); 2865 cancel_delayed_work_sync(&mlxsw_sp->router->nexthop_probe_dw); 2866 rhashtable_destroy(&mlxsw_sp->router->neigh_ht); 2867 } 2868 2869 static void mlxsw_sp_neigh_rif_gone_sync(struct mlxsw_sp *mlxsw_sp, 2870 struct mlxsw_sp_rif *rif) 2871 { 2872 struct mlxsw_sp_neigh_entry *neigh_entry, *tmp; 2873 2874 list_for_each_entry_safe(neigh_entry, tmp, &rif->neigh_list, 2875 rif_list_node) { 2876 mlxsw_sp_neigh_entry_update(mlxsw_sp, neigh_entry, false); 2877 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry); 2878 } 2879 } 2880 2881 enum mlxsw_sp_nexthop_type { 2882 MLXSW_SP_NEXTHOP_TYPE_ETH, 2883 MLXSW_SP_NEXTHOP_TYPE_IPIP, 2884 }; 2885 2886 enum mlxsw_sp_nexthop_action { 2887 /* Nexthop forwards packets to an egress RIF */ 2888 MLXSW_SP_NEXTHOP_ACTION_FORWARD, 2889 /* Nexthop discards packets */ 2890 MLXSW_SP_NEXTHOP_ACTION_DISCARD, 2891 /* Nexthop traps packets */ 2892 MLXSW_SP_NEXTHOP_ACTION_TRAP, 2893 }; 2894 2895 struct mlxsw_sp_nexthop_key { 2896 struct fib_nh *fib_nh; 2897 }; 2898 2899 struct mlxsw_sp_nexthop { 2900 struct list_head neigh_list_node; /* member of neigh entry list */ 2901 struct list_head rif_list_node; 2902 struct list_head router_list_node; 2903 struct mlxsw_sp_nexthop_group_info *nhgi; /* pointer back to the group 2904 * this nexthop belongs to 2905 */ 2906 struct rhash_head ht_node; 2907 struct neigh_table *neigh_tbl; 2908 struct mlxsw_sp_nexthop_key key; 2909 unsigned char gw_addr[sizeof(struct in6_addr)]; 2910 int ifindex; 2911 int nh_weight; 2912 int norm_nh_weight; 2913 int num_adj_entries; 2914 struct mlxsw_sp_rif *rif; 2915 u8 should_offload:1, /* set indicates this nexthop should be written 2916 * to the adjacency table. 2917 */ 2918 offloaded:1, /* set indicates this nexthop was written to the 2919 * adjacency table. 2920 */ 2921 update:1; /* set indicates this nexthop should be updated in the 2922 * adjacency table (f.e., its MAC changed). 
2923 */ 2924 enum mlxsw_sp_nexthop_action action; 2925 enum mlxsw_sp_nexthop_type type; 2926 union { 2927 struct mlxsw_sp_neigh_entry *neigh_entry; 2928 struct mlxsw_sp_ipip_entry *ipip_entry; 2929 }; 2930 unsigned int counter_index; 2931 bool counter_valid; 2932 }; 2933 2934 enum mlxsw_sp_nexthop_group_type { 2935 MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV4, 2936 MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6, 2937 MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ, 2938 }; 2939 2940 struct mlxsw_sp_nexthop_group_info { 2941 struct mlxsw_sp_nexthop_group *nh_grp; 2942 u32 adj_index; 2943 u16 ecmp_size; 2944 u16 count; 2945 int sum_norm_weight; 2946 u8 adj_index_valid:1, 2947 gateway:1, /* routes using the group use a gateway */ 2948 is_resilient:1; 2949 struct list_head list; /* member in nh_res_grp_list */ 2950 struct mlxsw_sp_nexthop nexthops[0]; 2951 #define nh_rif nexthops[0].rif 2952 }; 2953 2954 struct mlxsw_sp_nexthop_group_vr_key { 2955 u16 vr_id; 2956 enum mlxsw_sp_l3proto proto; 2957 }; 2958 2959 struct mlxsw_sp_nexthop_group_vr_entry { 2960 struct list_head list; /* member in vr_list */ 2961 struct rhash_head ht_node; /* member in vr_ht */ 2962 refcount_t ref_count; 2963 struct mlxsw_sp_nexthop_group_vr_key key; 2964 }; 2965 2966 struct mlxsw_sp_nexthop_group { 2967 struct rhash_head ht_node; 2968 struct list_head fib_list; /* list of fib entries that use this group */ 2969 union { 2970 struct { 2971 struct fib_info *fi; 2972 } ipv4; 2973 struct { 2974 u32 id; 2975 } obj; 2976 }; 2977 struct mlxsw_sp_nexthop_group_info *nhgi; 2978 struct list_head vr_list; 2979 struct rhashtable vr_ht; 2980 enum mlxsw_sp_nexthop_group_type type; 2981 bool can_destroy; 2982 }; 2983 2984 void mlxsw_sp_nexthop_counter_alloc(struct mlxsw_sp *mlxsw_sp, 2985 struct mlxsw_sp_nexthop *nh) 2986 { 2987 struct devlink *devlink; 2988 2989 devlink = priv_to_devlink(mlxsw_sp->core); 2990 if (!devlink_dpipe_table_counter_enabled(devlink, 2991 MLXSW_SP_DPIPE_TABLE_NAME_ADJ)) 2992 return; 2993 2994 if (mlxsw_sp_flow_counter_alloc(mlxsw_sp, &nh->counter_index)) 2995 return; 2996 2997 nh->counter_valid = true; 2998 } 2999 3000 void mlxsw_sp_nexthop_counter_free(struct mlxsw_sp *mlxsw_sp, 3001 struct mlxsw_sp_nexthop *nh) 3002 { 3003 if (!nh->counter_valid) 3004 return; 3005 mlxsw_sp_flow_counter_free(mlxsw_sp, nh->counter_index); 3006 nh->counter_valid = false; 3007 } 3008 3009 int mlxsw_sp_nexthop_counter_get(struct mlxsw_sp *mlxsw_sp, 3010 struct mlxsw_sp_nexthop *nh, u64 *p_counter) 3011 { 3012 if (!nh->counter_valid) 3013 return -EINVAL; 3014 3015 return mlxsw_sp_flow_counter_get(mlxsw_sp, nh->counter_index, 3016 p_counter, NULL); 3017 } 3018 3019 struct mlxsw_sp_nexthop *mlxsw_sp_nexthop_next(struct mlxsw_sp_router *router, 3020 struct mlxsw_sp_nexthop *nh) 3021 { 3022 if (!nh) { 3023 if (list_empty(&router->nexthop_list)) 3024 return NULL; 3025 else 3026 return list_first_entry(&router->nexthop_list, 3027 typeof(*nh), router_list_node); 3028 } 3029 if (list_is_last(&nh->router_list_node, &router->nexthop_list)) 3030 return NULL; 3031 return list_next_entry(nh, router_list_node); 3032 } 3033 3034 bool mlxsw_sp_nexthop_is_forward(const struct mlxsw_sp_nexthop *nh) 3035 { 3036 return nh->offloaded && nh->action == MLXSW_SP_NEXTHOP_ACTION_FORWARD; 3037 } 3038 3039 unsigned char *mlxsw_sp_nexthop_ha(struct mlxsw_sp_nexthop *nh) 3040 { 3041 if (nh->type != MLXSW_SP_NEXTHOP_TYPE_ETH || 3042 !mlxsw_sp_nexthop_is_forward(nh)) 3043 return NULL; 3044 return nh->neigh_entry->ha; 3045 } 3046 3047 int mlxsw_sp_nexthop_indexes(struct mlxsw_sp_nexthop *nh, u32 
*p_adj_index, 3048 u32 *p_adj_size, u32 *p_adj_hash_index) 3049 { 3050 struct mlxsw_sp_nexthop_group_info *nhgi = nh->nhgi; 3051 u32 adj_hash_index = 0; 3052 int i; 3053 3054 if (!nh->offloaded || !nhgi->adj_index_valid) 3055 return -EINVAL; 3056 3057 *p_adj_index = nhgi->adj_index; 3058 *p_adj_size = nhgi->ecmp_size; 3059 3060 for (i = 0; i < nhgi->count; i++) { 3061 struct mlxsw_sp_nexthop *nh_iter = &nhgi->nexthops[i]; 3062 3063 if (nh_iter == nh) 3064 break; 3065 if (nh_iter->offloaded) 3066 adj_hash_index += nh_iter->num_adj_entries; 3067 } 3068 3069 *p_adj_hash_index = adj_hash_index; 3070 return 0; 3071 } 3072 3073 struct mlxsw_sp_rif *mlxsw_sp_nexthop_rif(struct mlxsw_sp_nexthop *nh) 3074 { 3075 return nh->rif; 3076 } 3077 3078 bool mlxsw_sp_nexthop_group_has_ipip(struct mlxsw_sp_nexthop *nh) 3079 { 3080 struct mlxsw_sp_nexthop_group_info *nhgi = nh->nhgi; 3081 int i; 3082 3083 for (i = 0; i < nhgi->count; i++) { 3084 struct mlxsw_sp_nexthop *nh_iter = &nhgi->nexthops[i]; 3085 3086 if (nh_iter->type == MLXSW_SP_NEXTHOP_TYPE_IPIP) 3087 return true; 3088 } 3089 return false; 3090 } 3091 3092 static const struct rhashtable_params mlxsw_sp_nexthop_group_vr_ht_params = { 3093 .key_offset = offsetof(struct mlxsw_sp_nexthop_group_vr_entry, key), 3094 .head_offset = offsetof(struct mlxsw_sp_nexthop_group_vr_entry, ht_node), 3095 .key_len = sizeof(struct mlxsw_sp_nexthop_group_vr_key), 3096 .automatic_shrinking = true, 3097 }; 3098 3099 static struct mlxsw_sp_nexthop_group_vr_entry * 3100 mlxsw_sp_nexthop_group_vr_entry_lookup(struct mlxsw_sp_nexthop_group *nh_grp, 3101 const struct mlxsw_sp_fib *fib) 3102 { 3103 struct mlxsw_sp_nexthop_group_vr_key key; 3104 3105 memset(&key, 0, sizeof(key)); 3106 key.vr_id = fib->vr->id; 3107 key.proto = fib->proto; 3108 return rhashtable_lookup_fast(&nh_grp->vr_ht, &key, 3109 mlxsw_sp_nexthop_group_vr_ht_params); 3110 } 3111 3112 static int 3113 mlxsw_sp_nexthop_group_vr_entry_create(struct mlxsw_sp_nexthop_group *nh_grp, 3114 const struct mlxsw_sp_fib *fib) 3115 { 3116 struct mlxsw_sp_nexthop_group_vr_entry *vr_entry; 3117 int err; 3118 3119 vr_entry = kzalloc(sizeof(*vr_entry), GFP_KERNEL); 3120 if (!vr_entry) 3121 return -ENOMEM; 3122 3123 vr_entry->key.vr_id = fib->vr->id; 3124 vr_entry->key.proto = fib->proto; 3125 refcount_set(&vr_entry->ref_count, 1); 3126 3127 err = rhashtable_insert_fast(&nh_grp->vr_ht, &vr_entry->ht_node, 3128 mlxsw_sp_nexthop_group_vr_ht_params); 3129 if (err) 3130 goto err_hashtable_insert; 3131 3132 list_add(&vr_entry->list, &nh_grp->vr_list); 3133 3134 return 0; 3135 3136 err_hashtable_insert: 3137 kfree(vr_entry); 3138 return err; 3139 } 3140 3141 static void 3142 mlxsw_sp_nexthop_group_vr_entry_destroy(struct mlxsw_sp_nexthop_group *nh_grp, 3143 struct mlxsw_sp_nexthop_group_vr_entry *vr_entry) 3144 { 3145 list_del(&vr_entry->list); 3146 rhashtable_remove_fast(&nh_grp->vr_ht, &vr_entry->ht_node, 3147 mlxsw_sp_nexthop_group_vr_ht_params); 3148 kfree(vr_entry); 3149 } 3150 3151 static int 3152 mlxsw_sp_nexthop_group_vr_link(struct mlxsw_sp_nexthop_group *nh_grp, 3153 const struct mlxsw_sp_fib *fib) 3154 { 3155 struct mlxsw_sp_nexthop_group_vr_entry *vr_entry; 3156 3157 vr_entry = mlxsw_sp_nexthop_group_vr_entry_lookup(nh_grp, fib); 3158 if (vr_entry) { 3159 refcount_inc(&vr_entry->ref_count); 3160 return 0; 3161 } 3162 3163 return mlxsw_sp_nexthop_group_vr_entry_create(nh_grp, fib); 3164 } 3165 3166 static void 3167 mlxsw_sp_nexthop_group_vr_unlink(struct mlxsw_sp_nexthop_group *nh_grp, 3168 const struct mlxsw_sp_fib *fib) 
3169 { 3170 struct mlxsw_sp_nexthop_group_vr_entry *vr_entry; 3171 3172 vr_entry = mlxsw_sp_nexthop_group_vr_entry_lookup(nh_grp, fib); 3173 if (WARN_ON_ONCE(!vr_entry)) 3174 return; 3175 3176 if (!refcount_dec_and_test(&vr_entry->ref_count)) 3177 return; 3178 3179 mlxsw_sp_nexthop_group_vr_entry_destroy(nh_grp, vr_entry); 3180 } 3181 3182 struct mlxsw_sp_nexthop_group_cmp_arg { 3183 enum mlxsw_sp_nexthop_group_type type; 3184 union { 3185 struct fib_info *fi; 3186 struct mlxsw_sp_fib6_entry *fib6_entry; 3187 u32 id; 3188 }; 3189 }; 3190 3191 static bool 3192 mlxsw_sp_nexthop6_group_has_nexthop(const struct mlxsw_sp_nexthop_group *nh_grp, 3193 const struct in6_addr *gw, int ifindex, 3194 int weight) 3195 { 3196 int i; 3197 3198 for (i = 0; i < nh_grp->nhgi->count; i++) { 3199 const struct mlxsw_sp_nexthop *nh; 3200 3201 nh = &nh_grp->nhgi->nexthops[i]; 3202 if (nh->ifindex == ifindex && nh->nh_weight == weight && 3203 ipv6_addr_equal(gw, (struct in6_addr *) nh->gw_addr)) 3204 return true; 3205 } 3206 3207 return false; 3208 } 3209 3210 static bool 3211 mlxsw_sp_nexthop6_group_cmp(const struct mlxsw_sp_nexthop_group *nh_grp, 3212 const struct mlxsw_sp_fib6_entry *fib6_entry) 3213 { 3214 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 3215 3216 if (nh_grp->nhgi->count != fib6_entry->nrt6) 3217 return false; 3218 3219 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) { 3220 struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh; 3221 struct in6_addr *gw; 3222 int ifindex, weight; 3223 3224 ifindex = fib6_nh->fib_nh_dev->ifindex; 3225 weight = fib6_nh->fib_nh_weight; 3226 gw = &fib6_nh->fib_nh_gw6; 3227 if (!mlxsw_sp_nexthop6_group_has_nexthop(nh_grp, gw, ifindex, 3228 weight)) 3229 return false; 3230 } 3231 3232 return true; 3233 } 3234 3235 static int 3236 mlxsw_sp_nexthop_group_cmp(struct rhashtable_compare_arg *arg, const void *ptr) 3237 { 3238 const struct mlxsw_sp_nexthop_group_cmp_arg *cmp_arg = arg->key; 3239 const struct mlxsw_sp_nexthop_group *nh_grp = ptr; 3240 3241 if (nh_grp->type != cmp_arg->type) 3242 return 1; 3243 3244 switch (cmp_arg->type) { 3245 case MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV4: 3246 return cmp_arg->fi != nh_grp->ipv4.fi; 3247 case MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6: 3248 return !mlxsw_sp_nexthop6_group_cmp(nh_grp, 3249 cmp_arg->fib6_entry); 3250 case MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ: 3251 return cmp_arg->id != nh_grp->obj.id; 3252 default: 3253 WARN_ON(1); 3254 return 1; 3255 } 3256 } 3257 3258 static u32 mlxsw_sp_nexthop_group_hash_obj(const void *data, u32 len, u32 seed) 3259 { 3260 const struct mlxsw_sp_nexthop_group *nh_grp = data; 3261 const struct mlxsw_sp_nexthop *nh; 3262 struct fib_info *fi; 3263 unsigned int val; 3264 int i; 3265 3266 switch (nh_grp->type) { 3267 case MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV4: 3268 fi = nh_grp->ipv4.fi; 3269 return jhash(&fi, sizeof(fi), seed); 3270 case MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6: 3271 val = nh_grp->nhgi->count; 3272 for (i = 0; i < nh_grp->nhgi->count; i++) { 3273 nh = &nh_grp->nhgi->nexthops[i]; 3274 val ^= jhash(&nh->ifindex, sizeof(nh->ifindex), seed); 3275 val ^= jhash(&nh->gw_addr, sizeof(nh->gw_addr), seed); 3276 } 3277 return jhash(&val, sizeof(val), seed); 3278 case MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ: 3279 return jhash(&nh_grp->obj.id, sizeof(nh_grp->obj.id), seed); 3280 default: 3281 WARN_ON(1); 3282 return 0; 3283 } 3284 } 3285 3286 static u32 3287 mlxsw_sp_nexthop6_group_hash(struct mlxsw_sp_fib6_entry *fib6_entry, u32 seed) 3288 { 3289 unsigned int val = fib6_entry->nrt6; 3290 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 3291 3292 
list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) { 3293 struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh; 3294 struct net_device *dev = fib6_nh->fib_nh_dev; 3295 struct in6_addr *gw = &fib6_nh->fib_nh_gw6; 3296 3297 val ^= jhash(&dev->ifindex, sizeof(dev->ifindex), seed); 3298 val ^= jhash(gw, sizeof(*gw), seed); 3299 } 3300 3301 return jhash(&val, sizeof(val), seed); 3302 } 3303 3304 static u32 3305 mlxsw_sp_nexthop_group_hash(const void *data, u32 len, u32 seed) 3306 { 3307 const struct mlxsw_sp_nexthop_group_cmp_arg *cmp_arg = data; 3308 3309 switch (cmp_arg->type) { 3310 case MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV4: 3311 return jhash(&cmp_arg->fi, sizeof(cmp_arg->fi), seed); 3312 case MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6: 3313 return mlxsw_sp_nexthop6_group_hash(cmp_arg->fib6_entry, seed); 3314 case MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ: 3315 return jhash(&cmp_arg->id, sizeof(cmp_arg->id), seed); 3316 default: 3317 WARN_ON(1); 3318 return 0; 3319 } 3320 } 3321 3322 static const struct rhashtable_params mlxsw_sp_nexthop_group_ht_params = { 3323 .head_offset = offsetof(struct mlxsw_sp_nexthop_group, ht_node), 3324 .hashfn = mlxsw_sp_nexthop_group_hash, 3325 .obj_hashfn = mlxsw_sp_nexthop_group_hash_obj, 3326 .obj_cmpfn = mlxsw_sp_nexthop_group_cmp, 3327 }; 3328 3329 static int mlxsw_sp_nexthop_group_insert(struct mlxsw_sp *mlxsw_sp, 3330 struct mlxsw_sp_nexthop_group *nh_grp) 3331 { 3332 if (nh_grp->type == MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6 && 3333 !nh_grp->nhgi->gateway) 3334 return 0; 3335 3336 return rhashtable_insert_fast(&mlxsw_sp->router->nexthop_group_ht, 3337 &nh_grp->ht_node, 3338 mlxsw_sp_nexthop_group_ht_params); 3339 } 3340 3341 static void mlxsw_sp_nexthop_group_remove(struct mlxsw_sp *mlxsw_sp, 3342 struct mlxsw_sp_nexthop_group *nh_grp) 3343 { 3344 if (nh_grp->type == MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6 && 3345 !nh_grp->nhgi->gateway) 3346 return; 3347 3348 rhashtable_remove_fast(&mlxsw_sp->router->nexthop_group_ht, 3349 &nh_grp->ht_node, 3350 mlxsw_sp_nexthop_group_ht_params); 3351 } 3352 3353 static struct mlxsw_sp_nexthop_group * 3354 mlxsw_sp_nexthop4_group_lookup(struct mlxsw_sp *mlxsw_sp, 3355 struct fib_info *fi) 3356 { 3357 struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg; 3358 3359 cmp_arg.type = MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV4; 3360 cmp_arg.fi = fi; 3361 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht, 3362 &cmp_arg, 3363 mlxsw_sp_nexthop_group_ht_params); 3364 } 3365 3366 static struct mlxsw_sp_nexthop_group * 3367 mlxsw_sp_nexthop6_group_lookup(struct mlxsw_sp *mlxsw_sp, 3368 struct mlxsw_sp_fib6_entry *fib6_entry) 3369 { 3370 struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg; 3371 3372 cmp_arg.type = MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6; 3373 cmp_arg.fib6_entry = fib6_entry; 3374 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht, 3375 &cmp_arg, 3376 mlxsw_sp_nexthop_group_ht_params); 3377 } 3378 3379 static const struct rhashtable_params mlxsw_sp_nexthop_ht_params = { 3380 .key_offset = offsetof(struct mlxsw_sp_nexthop, key), 3381 .head_offset = offsetof(struct mlxsw_sp_nexthop, ht_node), 3382 .key_len = sizeof(struct mlxsw_sp_nexthop_key), 3383 }; 3384 3385 static int mlxsw_sp_nexthop_insert(struct mlxsw_sp *mlxsw_sp, 3386 struct mlxsw_sp_nexthop *nh) 3387 { 3388 return rhashtable_insert_fast(&mlxsw_sp->router->nexthop_ht, 3389 &nh->ht_node, mlxsw_sp_nexthop_ht_params); 3390 } 3391 3392 static void mlxsw_sp_nexthop_remove(struct mlxsw_sp *mlxsw_sp, 3393 struct mlxsw_sp_nexthop *nh) 3394 { 3395 
rhashtable_remove_fast(&mlxsw_sp->router->nexthop_ht, &nh->ht_node, 3396 mlxsw_sp_nexthop_ht_params); 3397 } 3398 3399 static struct mlxsw_sp_nexthop * 3400 mlxsw_sp_nexthop_lookup(struct mlxsw_sp *mlxsw_sp, 3401 struct mlxsw_sp_nexthop_key key) 3402 { 3403 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_ht, &key, 3404 mlxsw_sp_nexthop_ht_params); 3405 } 3406 3407 static int mlxsw_sp_adj_index_mass_update_vr(struct mlxsw_sp *mlxsw_sp, 3408 enum mlxsw_sp_l3proto proto, 3409 u16 vr_id, 3410 u32 adj_index, u16 ecmp_size, 3411 u32 new_adj_index, 3412 u16 new_ecmp_size) 3413 { 3414 char raleu_pl[MLXSW_REG_RALEU_LEN]; 3415 3416 mlxsw_reg_raleu_pack(raleu_pl, 3417 (enum mlxsw_reg_ralxx_protocol) proto, vr_id, 3418 adj_index, ecmp_size, new_adj_index, 3419 new_ecmp_size); 3420 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raleu), raleu_pl); 3421 } 3422 3423 static int mlxsw_sp_adj_index_mass_update(struct mlxsw_sp *mlxsw_sp, 3424 struct mlxsw_sp_nexthop_group *nh_grp, 3425 u32 old_adj_index, u16 old_ecmp_size) 3426 { 3427 struct mlxsw_sp_nexthop_group_info *nhgi = nh_grp->nhgi; 3428 struct mlxsw_sp_nexthop_group_vr_entry *vr_entry; 3429 int err; 3430 3431 list_for_each_entry(vr_entry, &nh_grp->vr_list, list) { 3432 err = mlxsw_sp_adj_index_mass_update_vr(mlxsw_sp, 3433 vr_entry->key.proto, 3434 vr_entry->key.vr_id, 3435 old_adj_index, 3436 old_ecmp_size, 3437 nhgi->adj_index, 3438 nhgi->ecmp_size); 3439 if (err) 3440 goto err_mass_update_vr; 3441 } 3442 return 0; 3443 3444 err_mass_update_vr: 3445 list_for_each_entry_continue_reverse(vr_entry, &nh_grp->vr_list, list) 3446 mlxsw_sp_adj_index_mass_update_vr(mlxsw_sp, vr_entry->key.proto, 3447 vr_entry->key.vr_id, 3448 nhgi->adj_index, 3449 nhgi->ecmp_size, 3450 old_adj_index, old_ecmp_size); 3451 return err; 3452 } 3453 3454 static int __mlxsw_sp_nexthop_eth_update(struct mlxsw_sp *mlxsw_sp, 3455 u32 adj_index, 3456 struct mlxsw_sp_nexthop *nh, 3457 bool force, char *ratr_pl) 3458 { 3459 struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry; 3460 enum mlxsw_reg_ratr_op op; 3461 u16 rif_index; 3462 3463 rif_index = nh->rif ? nh->rif->rif_index : 3464 mlxsw_sp->router->lb_rif_index; 3465 op = force ? 
MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY : 3466 MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY_ON_ACTIVITY; 3467 mlxsw_reg_ratr_pack(ratr_pl, op, true, MLXSW_REG_RATR_TYPE_ETHERNET, 3468 adj_index, rif_index); 3469 switch (nh->action) { 3470 case MLXSW_SP_NEXTHOP_ACTION_FORWARD: 3471 mlxsw_reg_ratr_eth_entry_pack(ratr_pl, neigh_entry->ha); 3472 break; 3473 case MLXSW_SP_NEXTHOP_ACTION_DISCARD: 3474 mlxsw_reg_ratr_trap_action_set(ratr_pl, 3475 MLXSW_REG_RATR_TRAP_ACTION_DISCARD_ERRORS); 3476 break; 3477 case MLXSW_SP_NEXTHOP_ACTION_TRAP: 3478 mlxsw_reg_ratr_trap_action_set(ratr_pl, 3479 MLXSW_REG_RATR_TRAP_ACTION_TRAP); 3480 mlxsw_reg_ratr_trap_id_set(ratr_pl, MLXSW_TRAP_ID_RTR_EGRESS0); 3481 break; 3482 default: 3483 WARN_ON_ONCE(1); 3484 return -EINVAL; 3485 } 3486 if (nh->counter_valid) 3487 mlxsw_reg_ratr_counter_pack(ratr_pl, nh->counter_index, true); 3488 else 3489 mlxsw_reg_ratr_counter_pack(ratr_pl, 0, false); 3490 3491 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl); 3492 } 3493 3494 int mlxsw_sp_nexthop_eth_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index, 3495 struct mlxsw_sp_nexthop *nh, bool force, 3496 char *ratr_pl) 3497 { 3498 int i; 3499 3500 for (i = 0; i < nh->num_adj_entries; i++) { 3501 int err; 3502 3503 err = __mlxsw_sp_nexthop_eth_update(mlxsw_sp, adj_index + i, 3504 nh, force, ratr_pl); 3505 if (err) 3506 return err; 3507 } 3508 3509 return 0; 3510 } 3511 3512 static int __mlxsw_sp_nexthop_ipip_update(struct mlxsw_sp *mlxsw_sp, 3513 u32 adj_index, 3514 struct mlxsw_sp_nexthop *nh, 3515 bool force, char *ratr_pl) 3516 { 3517 const struct mlxsw_sp_ipip_ops *ipip_ops; 3518 3519 ipip_ops = mlxsw_sp->router->ipip_ops_arr[nh->ipip_entry->ipipt]; 3520 return ipip_ops->nexthop_update(mlxsw_sp, adj_index, nh->ipip_entry, 3521 force, ratr_pl); 3522 } 3523 3524 static int mlxsw_sp_nexthop_ipip_update(struct mlxsw_sp *mlxsw_sp, 3525 u32 adj_index, 3526 struct mlxsw_sp_nexthop *nh, bool force, 3527 char *ratr_pl) 3528 { 3529 int i; 3530 3531 for (i = 0; i < nh->num_adj_entries; i++) { 3532 int err; 3533 3534 err = __mlxsw_sp_nexthop_ipip_update(mlxsw_sp, adj_index + i, 3535 nh, force, ratr_pl); 3536 if (err) 3537 return err; 3538 } 3539 3540 return 0; 3541 } 3542 3543 static int mlxsw_sp_nexthop_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index, 3544 struct mlxsw_sp_nexthop *nh, bool force, 3545 char *ratr_pl) 3546 { 3547 /* When action is discard or trap, the nexthop must be 3548 * programmed as an Ethernet nexthop. 
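* This is why the dispatch below sends discard and trap nexthops through mlxsw_sp_nexthop_eth_update() even when their type is IP-in-IP.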
3549 */ 3550 if (nh->type == MLXSW_SP_NEXTHOP_TYPE_ETH || 3551 nh->action == MLXSW_SP_NEXTHOP_ACTION_DISCARD || 3552 nh->action == MLXSW_SP_NEXTHOP_ACTION_TRAP) 3553 return mlxsw_sp_nexthop_eth_update(mlxsw_sp, adj_index, nh, 3554 force, ratr_pl); 3555 else 3556 return mlxsw_sp_nexthop_ipip_update(mlxsw_sp, adj_index, nh, 3557 force, ratr_pl); 3558 } 3559 3560 static int 3561 mlxsw_sp_nexthop_group_update(struct mlxsw_sp *mlxsw_sp, 3562 struct mlxsw_sp_nexthop_group_info *nhgi, 3563 bool reallocate) 3564 { 3565 char ratr_pl[MLXSW_REG_RATR_LEN]; 3566 u32 adj_index = nhgi->adj_index; /* base */ 3567 struct mlxsw_sp_nexthop *nh; 3568 int i; 3569 3570 for (i = 0; i < nhgi->count; i++) { 3571 nh = &nhgi->nexthops[i]; 3572 3573 if (!nh->should_offload) { 3574 nh->offloaded = 0; 3575 continue; 3576 } 3577 3578 if (nh->update || reallocate) { 3579 int err = 0; 3580 3581 err = mlxsw_sp_nexthop_update(mlxsw_sp, adj_index, nh, 3582 true, ratr_pl); 3583 if (err) 3584 return err; 3585 nh->update = 0; 3586 nh->offloaded = 1; 3587 } 3588 adj_index += nh->num_adj_entries; 3589 } 3590 return 0; 3591 } 3592 3593 static int 3594 mlxsw_sp_nexthop_fib_entries_update(struct mlxsw_sp *mlxsw_sp, 3595 struct mlxsw_sp_nexthop_group *nh_grp) 3596 { 3597 struct mlxsw_sp_fib_entry *fib_entry; 3598 int err; 3599 3600 list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) { 3601 err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry); 3602 if (err) 3603 return err; 3604 } 3605 return 0; 3606 } 3607 3608 struct mlxsw_sp_adj_grp_size_range { 3609 u16 start; /* Inclusive */ 3610 u16 end; /* Inclusive */ 3611 }; 3612 3613 /* Ordered by range start value */ 3614 static const struct mlxsw_sp_adj_grp_size_range 3615 mlxsw_sp1_adj_grp_size_ranges[] = { 3616 { .start = 1, .end = 64 }, 3617 { .start = 512, .end = 512 }, 3618 { .start = 1024, .end = 1024 }, 3619 { .start = 2048, .end = 2048 }, 3620 { .start = 4096, .end = 4096 }, 3621 }; 3622 3623 /* Ordered by range start value */ 3624 static const struct mlxsw_sp_adj_grp_size_range 3625 mlxsw_sp2_adj_grp_size_ranges[] = { 3626 { .start = 1, .end = 128 }, 3627 { .start = 256, .end = 256 }, 3628 { .start = 512, .end = 512 }, 3629 { .start = 1024, .end = 1024 }, 3630 { .start = 2048, .end = 2048 }, 3631 { .start = 4096, .end = 4096 }, 3632 }; 3633 3634 static void mlxsw_sp_adj_grp_size_round_up(const struct mlxsw_sp *mlxsw_sp, 3635 u16 *p_adj_grp_size) 3636 { 3637 int i; 3638 3639 for (i = 0; i < mlxsw_sp->router->adj_grp_size_ranges_count; i++) { 3640 const struct mlxsw_sp_adj_grp_size_range *size_range; 3641 3642 size_range = &mlxsw_sp->router->adj_grp_size_ranges[i]; 3643 3644 if (*p_adj_grp_size >= size_range->start && 3645 *p_adj_grp_size <= size_range->end) 3646 return; 3647 3648 if (*p_adj_grp_size <= size_range->end) { 3649 *p_adj_grp_size = size_range->end; 3650 return; 3651 } 3652 } 3653 } 3654 3655 static void mlxsw_sp_adj_grp_size_round_down(const struct mlxsw_sp *mlxsw_sp, 3656 u16 *p_adj_grp_size, 3657 unsigned int alloc_size) 3658 { 3659 int i; 3660 3661 for (i = mlxsw_sp->router->adj_grp_size_ranges_count - 1; i >= 0; i--) { 3662 const struct mlxsw_sp_adj_grp_size_range *size_range; 3663 3664 size_range = &mlxsw_sp->router->adj_grp_size_ranges[i]; 3665 3666 if (alloc_size >= size_range->end) { 3667 *p_adj_grp_size = size_range->end; 3668 return; 3669 } 3670 } 3671 } 3672 3673 static int mlxsw_sp_fix_adj_grp_size(struct mlxsw_sp *mlxsw_sp, 3674 u16 *p_adj_grp_size) 3675 { 3676 unsigned int alloc_size; 3677 int err; 3678 3679 /* Round up the requested 
group size to the next size supported 3680 * by the device and make sure the request can be satisfied. 3681 */ 3682 mlxsw_sp_adj_grp_size_round_up(mlxsw_sp, p_adj_grp_size); 3683 err = mlxsw_sp_kvdl_alloc_count_query(mlxsw_sp, 3684 MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 3685 *p_adj_grp_size, &alloc_size); 3686 if (err) 3687 return err; 3688 /* It is possible the allocation results in more allocated 3689 * entries than requested. Try to use as much of them as 3690 * possible. 3691 */ 3692 mlxsw_sp_adj_grp_size_round_down(mlxsw_sp, p_adj_grp_size, alloc_size); 3693 3694 return 0; 3695 } 3696 3697 static void 3698 mlxsw_sp_nexthop_group_normalize(struct mlxsw_sp_nexthop_group_info *nhgi) 3699 { 3700 int i, g = 0, sum_norm_weight = 0; 3701 struct mlxsw_sp_nexthop *nh; 3702 3703 for (i = 0; i < nhgi->count; i++) { 3704 nh = &nhgi->nexthops[i]; 3705 3706 if (!nh->should_offload) 3707 continue; 3708 if (g > 0) 3709 g = gcd(nh->nh_weight, g); 3710 else 3711 g = nh->nh_weight; 3712 } 3713 3714 for (i = 0; i < nhgi->count; i++) { 3715 nh = &nhgi->nexthops[i]; 3716 3717 if (!nh->should_offload) 3718 continue; 3719 nh->norm_nh_weight = nh->nh_weight / g; 3720 sum_norm_weight += nh->norm_nh_weight; 3721 } 3722 3723 nhgi->sum_norm_weight = sum_norm_weight; 3724 } 3725 3726 static void 3727 mlxsw_sp_nexthop_group_rebalance(struct mlxsw_sp_nexthop_group_info *nhgi) 3728 { 3729 int i, weight = 0, lower_bound = 0; 3730 int total = nhgi->sum_norm_weight; 3731 u16 ecmp_size = nhgi->ecmp_size; 3732 3733 for (i = 0; i < nhgi->count; i++) { 3734 struct mlxsw_sp_nexthop *nh = &nhgi->nexthops[i]; 3735 int upper_bound; 3736 3737 if (!nh->should_offload) 3738 continue; 3739 weight += nh->norm_nh_weight; 3740 upper_bound = DIV_ROUND_CLOSEST(ecmp_size * weight, total); 3741 nh->num_adj_entries = upper_bound - lower_bound; 3742 lower_bound = upper_bound; 3743 } 3744 } 3745 3746 static struct mlxsw_sp_nexthop * 3747 mlxsw_sp_rt6_nexthop(struct mlxsw_sp_nexthop_group *nh_grp, 3748 const struct mlxsw_sp_rt6 *mlxsw_sp_rt6); 3749 3750 static void 3751 mlxsw_sp_nexthop4_group_offload_refresh(struct mlxsw_sp *mlxsw_sp, 3752 struct mlxsw_sp_nexthop_group *nh_grp) 3753 { 3754 int i; 3755 3756 for (i = 0; i < nh_grp->nhgi->count; i++) { 3757 struct mlxsw_sp_nexthop *nh = &nh_grp->nhgi->nexthops[i]; 3758 3759 if (nh->offloaded) 3760 nh->key.fib_nh->fib_nh_flags |= RTNH_F_OFFLOAD; 3761 else 3762 nh->key.fib_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD; 3763 } 3764 } 3765 3766 static void 3767 __mlxsw_sp_nexthop6_group_offload_refresh(struct mlxsw_sp_nexthop_group *nh_grp, 3768 struct mlxsw_sp_fib6_entry *fib6_entry) 3769 { 3770 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 3771 3772 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) { 3773 struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh; 3774 struct mlxsw_sp_nexthop *nh; 3775 3776 nh = mlxsw_sp_rt6_nexthop(nh_grp, mlxsw_sp_rt6); 3777 if (nh && nh->offloaded) 3778 fib6_nh->fib_nh_flags |= RTNH_F_OFFLOAD; 3779 else 3780 fib6_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD; 3781 } 3782 } 3783 3784 static void 3785 mlxsw_sp_nexthop6_group_offload_refresh(struct mlxsw_sp *mlxsw_sp, 3786 struct mlxsw_sp_nexthop_group *nh_grp) 3787 { 3788 struct mlxsw_sp_fib6_entry *fib6_entry; 3789 3790 /* Unfortunately, in IPv6 the route and the nexthop are described by 3791 * the same struct, so we need to iterate over all the routes using the 3792 * nexthop group and set / clear the offload indication for them. 
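* Each route carries its own fib6_nh, whose RTNH_F_OFFLOAD flag is set or cleared individually by __mlxsw_sp_nexthop6_group_offload_refresh().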
3793 */ 3794 list_for_each_entry(fib6_entry, &nh_grp->fib_list, 3795 common.nexthop_group_node) 3796 __mlxsw_sp_nexthop6_group_offload_refresh(nh_grp, fib6_entry); 3797 } 3798 3799 static void 3800 mlxsw_sp_nexthop_bucket_offload_refresh(struct mlxsw_sp *mlxsw_sp, 3801 const struct mlxsw_sp_nexthop *nh, 3802 u16 bucket_index) 3803 { 3804 struct mlxsw_sp_nexthop_group *nh_grp = nh->nhgi->nh_grp; 3805 bool offload = false, trap = false; 3806 3807 if (nh->offloaded) { 3808 if (nh->action == MLXSW_SP_NEXTHOP_ACTION_TRAP) 3809 trap = true; 3810 else 3811 offload = true; 3812 } 3813 nexthop_bucket_set_hw_flags(mlxsw_sp_net(mlxsw_sp), nh_grp->obj.id, 3814 bucket_index, offload, trap); 3815 } 3816 3817 static void 3818 mlxsw_sp_nexthop_obj_group_offload_refresh(struct mlxsw_sp *mlxsw_sp, 3819 struct mlxsw_sp_nexthop_group *nh_grp) 3820 { 3821 int i; 3822 3823 /* Do not update the flags if the nexthop group is being destroyed 3824 * since: 3825 * 1. The nexthop object is being deleted, in which case the flags are 3826 * irrelevant. 3827 * 2. The nexthop group was replaced by a newer group, in which case 3828 * the flags of the nexthop object were already updated based on the 3829 * new group. 3830 */ 3831 if (nh_grp->can_destroy) 3832 return; 3833 3834 nexthop_set_hw_flags(mlxsw_sp_net(mlxsw_sp), nh_grp->obj.id, 3835 nh_grp->nhgi->adj_index_valid, false); 3836 3837 /* Update flags of individual nexthop buckets in case of a resilient 3838 * nexthop group. 3839 */ 3840 if (!nh_grp->nhgi->is_resilient) 3841 return; 3842 3843 for (i = 0; i < nh_grp->nhgi->count; i++) { 3844 struct mlxsw_sp_nexthop *nh = &nh_grp->nhgi->nexthops[i]; 3845 3846 mlxsw_sp_nexthop_bucket_offload_refresh(mlxsw_sp, nh, i); 3847 } 3848 } 3849 3850 static void 3851 mlxsw_sp_nexthop_group_offload_refresh(struct mlxsw_sp *mlxsw_sp, 3852 struct mlxsw_sp_nexthop_group *nh_grp) 3853 { 3854 switch (nh_grp->type) { 3855 case MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV4: 3856 mlxsw_sp_nexthop4_group_offload_refresh(mlxsw_sp, nh_grp); 3857 break; 3858 case MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6: 3859 mlxsw_sp_nexthop6_group_offload_refresh(mlxsw_sp, nh_grp); 3860 break; 3861 case MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ: 3862 mlxsw_sp_nexthop_obj_group_offload_refresh(mlxsw_sp, nh_grp); 3863 break; 3864 } 3865 } 3866 3867 static int 3868 mlxsw_sp_nexthop_group_refresh(struct mlxsw_sp *mlxsw_sp, 3869 struct mlxsw_sp_nexthop_group *nh_grp) 3870 { 3871 struct mlxsw_sp_nexthop_group_info *nhgi = nh_grp->nhgi; 3872 u16 ecmp_size, old_ecmp_size; 3873 struct mlxsw_sp_nexthop *nh; 3874 bool offload_change = false; 3875 u32 adj_index; 3876 bool old_adj_index_valid; 3877 u32 old_adj_index; 3878 int i, err2, err; 3879 3880 if (!nhgi->gateway) 3881 return mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp); 3882 3883 for (i = 0; i < nhgi->count; i++) { 3884 nh = &nhgi->nexthops[i]; 3885 3886 if (nh->should_offload != nh->offloaded) { 3887 offload_change = true; 3888 if (nh->should_offload) 3889 nh->update = 1; 3890 } 3891 } 3892 if (!offload_change) { 3893 /* Nothing was added or removed, so no need to reallocate. Just 3894 * update MAC on existing adjacency indexes. 3895 */ 3896 err = mlxsw_sp_nexthop_group_update(mlxsw_sp, nhgi, false); 3897 if (err) { 3898 dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n"); 3899 goto set_trap; 3900 } 3901 /* Flags of individual nexthop buckets might need to be 3902 * updated.
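* This is the case for resilient groups, where a nexthop can switch between the forward and trap actions without the group being reallocated.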
3903 */ 3904 mlxsw_sp_nexthop_group_offload_refresh(mlxsw_sp, nh_grp); 3905 return 0; 3906 } 3907 mlxsw_sp_nexthop_group_normalize(nhgi); 3908 if (!nhgi->sum_norm_weight) { 3909 /* No neigh of this group is connected, so we just set 3910 * the trap and let everything flow through the kernel. 3911 */ 3912 err = 0; 3913 goto set_trap; 3914 } 3915 3916 ecmp_size = nhgi->sum_norm_weight; 3917 err = mlxsw_sp_fix_adj_grp_size(mlxsw_sp, &ecmp_size); 3918 if (err) 3919 /* No valid allocation size available. */ 3920 goto set_trap; 3921 3922 err = mlxsw_sp_kvdl_alloc(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 3923 ecmp_size, &adj_index); 3924 if (err) { 3925 /* We ran out of KVD linear space, just set the 3926 * trap and let everything flow through the kernel. 3927 */ 3928 dev_warn(mlxsw_sp->bus_info->dev, "Failed to allocate KVD linear area for nexthop group.\n"); 3929 goto set_trap; 3930 } 3931 old_adj_index_valid = nhgi->adj_index_valid; 3932 old_adj_index = nhgi->adj_index; 3933 old_ecmp_size = nhgi->ecmp_size; 3934 nhgi->adj_index_valid = 1; 3935 nhgi->adj_index = adj_index; 3936 nhgi->ecmp_size = ecmp_size; 3937 mlxsw_sp_nexthop_group_rebalance(nhgi); 3938 err = mlxsw_sp_nexthop_group_update(mlxsw_sp, nhgi, true); 3939 if (err) { 3940 dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n"); 3941 goto set_trap; 3942 } 3943 3944 mlxsw_sp_nexthop_group_offload_refresh(mlxsw_sp, nh_grp); 3945 3946 if (!old_adj_index_valid) { 3947 /* The trap was set for fib entries, so we have to call 3948 * fib entry update to unset it and use adjacency index. 3949 */ 3950 err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp); 3951 if (err) { 3952 dev_warn(mlxsw_sp->bus_info->dev, "Failed to add adjacency index to fib entries.\n"); 3953 goto set_trap; 3954 } 3955 return 0; 3956 } 3957 3958 err = mlxsw_sp_adj_index_mass_update(mlxsw_sp, nh_grp, 3959 old_adj_index, old_ecmp_size); 3960 mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 3961 old_ecmp_size, old_adj_index); 3962 if (err) { 3963 dev_warn(mlxsw_sp->bus_info->dev, "Failed to mass-update adjacency index for nexthop group.\n"); 3964 goto set_trap; 3965 } 3966 3967 return 0; 3968 3969 set_trap: 3970 old_adj_index_valid = nhgi->adj_index_valid; 3971 nhgi->adj_index_valid = 0; 3972 for (i = 0; i < nhgi->count; i++) { 3973 nh = &nhgi->nexthops[i]; 3974 nh->offloaded = 0; 3975 } 3976 err2 = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp); 3977 if (err2) 3978 dev_warn(mlxsw_sp->bus_info->dev, "Failed to set traps for fib entries.\n"); 3979 mlxsw_sp_nexthop_group_offload_refresh(mlxsw_sp, nh_grp); 3980 if (old_adj_index_valid) 3981 mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 3982 nhgi->ecmp_size, nhgi->adj_index); 3983 return err; 3984 } 3985 3986 static void __mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp_nexthop *nh, 3987 bool removing) 3988 { 3989 if (!removing) { 3990 nh->action = MLXSW_SP_NEXTHOP_ACTION_FORWARD; 3991 nh->should_offload = 1; 3992 } else if (nh->nhgi->is_resilient) { 3993 nh->action = MLXSW_SP_NEXTHOP_ACTION_TRAP; 3994 nh->should_offload = 1; 3995 } else { 3996 nh->should_offload = 0; 3997 } 3998 nh->update = 1; 3999 } 4000 4001 static int 4002 mlxsw_sp_nexthop_dead_neigh_replace(struct mlxsw_sp *mlxsw_sp, 4003 struct mlxsw_sp_neigh_entry *neigh_entry) 4004 { 4005 struct neighbour *n, *old_n = neigh_entry->key.n; 4006 struct mlxsw_sp_nexthop *nh; 4007 bool entry_connected; 4008 u8 nud_state, dead; 4009 int err; 4010 4011 nh = list_first_entry(&neigh_entry->nexthop_list, 4012 struct
mlxsw_sp_nexthop, neigh_list_node); 4013 4014 n = neigh_lookup(nh->neigh_tbl, &nh->gw_addr, nh->rif->dev); 4015 if (!n) { 4016 n = neigh_create(nh->neigh_tbl, &nh->gw_addr, nh->rif->dev); 4017 if (IS_ERR(n)) 4018 return PTR_ERR(n); 4019 neigh_event_send(n, NULL); 4020 } 4021 4022 mlxsw_sp_neigh_entry_remove(mlxsw_sp, neigh_entry); 4023 neigh_entry->key.n = n; 4024 err = mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry); 4025 if (err) 4026 goto err_neigh_entry_insert; 4027 4028 read_lock_bh(&n->lock); 4029 nud_state = n->nud_state; 4030 dead = n->dead; 4031 read_unlock_bh(&n->lock); 4032 entry_connected = nud_state & NUD_VALID && !dead; 4033 4034 list_for_each_entry(nh, &neigh_entry->nexthop_list, 4035 neigh_list_node) { 4036 neigh_release(old_n); 4037 neigh_clone(n); 4038 __mlxsw_sp_nexthop_neigh_update(nh, !entry_connected); 4039 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nhgi->nh_grp); 4040 } 4041 4042 neigh_release(n); 4043 4044 return 0; 4045 4046 err_neigh_entry_insert: 4047 neigh_entry->key.n = old_n; 4048 mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry); 4049 neigh_release(n); 4050 return err; 4051 } 4052 4053 static void 4054 mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp, 4055 struct mlxsw_sp_neigh_entry *neigh_entry, 4056 bool removing, bool dead) 4057 { 4058 struct mlxsw_sp_nexthop *nh; 4059 4060 if (list_empty(&neigh_entry->nexthop_list)) 4061 return; 4062 4063 if (dead) { 4064 int err; 4065 4066 err = mlxsw_sp_nexthop_dead_neigh_replace(mlxsw_sp, 4067 neigh_entry); 4068 if (err) 4069 dev_err(mlxsw_sp->bus_info->dev, "Failed to replace dead neigh\n"); 4070 return; 4071 } 4072 4073 list_for_each_entry(nh, &neigh_entry->nexthop_list, 4074 neigh_list_node) { 4075 __mlxsw_sp_nexthop_neigh_update(nh, removing); 4076 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nhgi->nh_grp); 4077 } 4078 } 4079 4080 static void mlxsw_sp_nexthop_rif_init(struct mlxsw_sp_nexthop *nh, 4081 struct mlxsw_sp_rif *rif) 4082 { 4083 if (nh->rif) 4084 return; 4085 4086 nh->rif = rif; 4087 list_add(&nh->rif_list_node, &rif->nexthop_list); 4088 } 4089 4090 static void mlxsw_sp_nexthop_rif_fini(struct mlxsw_sp_nexthop *nh) 4091 { 4092 if (!nh->rif) 4093 return; 4094 4095 list_del(&nh->rif_list_node); 4096 nh->rif = NULL; 4097 } 4098 4099 static int mlxsw_sp_nexthop_neigh_init(struct mlxsw_sp *mlxsw_sp, 4100 struct mlxsw_sp_nexthop *nh) 4101 { 4102 struct mlxsw_sp_neigh_entry *neigh_entry; 4103 struct neighbour *n; 4104 u8 nud_state, dead; 4105 int err; 4106 4107 if (!nh->nhgi->gateway || nh->neigh_entry) 4108 return 0; 4109 4110 /* Take a reference of neigh here ensuring that neigh would 4111 * not be destructed before the nexthop entry is finished. 4112 * The reference is taken either in neigh_lookup() or 4113 * in neigh_create() in case n is not found. 
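* The reference is released in mlxsw_sp_nexthop_neigh_fini() when the nexthop is de-initialized.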
4114 */ 4115 n = neigh_lookup(nh->neigh_tbl, &nh->gw_addr, nh->rif->dev); 4116 if (!n) { 4117 n = neigh_create(nh->neigh_tbl, &nh->gw_addr, nh->rif->dev); 4118 if (IS_ERR(n)) 4119 return PTR_ERR(n); 4120 neigh_event_send(n, NULL); 4121 } 4122 neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, n); 4123 if (!neigh_entry) { 4124 neigh_entry = mlxsw_sp_neigh_entry_create(mlxsw_sp, n); 4125 if (IS_ERR(neigh_entry)) { 4126 err = -EINVAL; 4127 goto err_neigh_entry_create; 4128 } 4129 } 4130 4131 /* If that is the first nexthop connected to that neigh, add to 4132 * nexthop_neighs_list 4133 */ 4134 if (list_empty(&neigh_entry->nexthop_list)) 4135 list_add_tail(&neigh_entry->nexthop_neighs_list_node, 4136 &mlxsw_sp->router->nexthop_neighs_list); 4137 4138 nh->neigh_entry = neigh_entry; 4139 list_add_tail(&nh->neigh_list_node, &neigh_entry->nexthop_list); 4140 read_lock_bh(&n->lock); 4141 nud_state = n->nud_state; 4142 dead = n->dead; 4143 read_unlock_bh(&n->lock); 4144 __mlxsw_sp_nexthop_neigh_update(nh, !(nud_state & NUD_VALID && !dead)); 4145 4146 return 0; 4147 4148 err_neigh_entry_create: 4149 neigh_release(n); 4150 return err; 4151 } 4152 4153 static void mlxsw_sp_nexthop_neigh_fini(struct mlxsw_sp *mlxsw_sp, 4154 struct mlxsw_sp_nexthop *nh) 4155 { 4156 struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry; 4157 struct neighbour *n; 4158 4159 if (!neigh_entry) 4160 return; 4161 n = neigh_entry->key.n; 4162 4163 __mlxsw_sp_nexthop_neigh_update(nh, true); 4164 list_del(&nh->neigh_list_node); 4165 nh->neigh_entry = NULL; 4166 4167 /* If that is the last nexthop connected to that neigh, remove from 4168 * nexthop_neighs_list 4169 */ 4170 if (list_empty(&neigh_entry->nexthop_list)) 4171 list_del(&neigh_entry->nexthop_neighs_list_node); 4172 4173 if (!neigh_entry->connected && list_empty(&neigh_entry->nexthop_list)) 4174 mlxsw_sp_neigh_entry_destroy(mlxsw_sp, neigh_entry); 4175 4176 neigh_release(n); 4177 } 4178 4179 static bool mlxsw_sp_ipip_netdev_ul_up(struct net_device *ol_dev) 4180 { 4181 struct net_device *ul_dev; 4182 bool is_up; 4183 4184 rcu_read_lock(); 4185 ul_dev = mlxsw_sp_ipip_netdev_ul_dev_get(ol_dev); 4186 is_up = ul_dev ? 
(ul_dev->flags & IFF_UP) : true; 4187 rcu_read_unlock(); 4188 4189 return is_up; 4190 } 4191 4192 static void mlxsw_sp_nexthop_ipip_init(struct mlxsw_sp *mlxsw_sp, 4193 struct mlxsw_sp_nexthop *nh, 4194 struct mlxsw_sp_ipip_entry *ipip_entry) 4195 { 4196 bool removing; 4197 4198 if (!nh->nhgi->gateway || nh->ipip_entry) 4199 return; 4200 4201 nh->ipip_entry = ipip_entry; 4202 removing = !mlxsw_sp_ipip_netdev_ul_up(ipip_entry->ol_dev); 4203 __mlxsw_sp_nexthop_neigh_update(nh, removing); 4204 mlxsw_sp_nexthop_rif_init(nh, &ipip_entry->ol_lb->common); 4205 } 4206 4207 static void mlxsw_sp_nexthop_ipip_fini(struct mlxsw_sp *mlxsw_sp, 4208 struct mlxsw_sp_nexthop *nh) 4209 { 4210 struct mlxsw_sp_ipip_entry *ipip_entry = nh->ipip_entry; 4211 4212 if (!ipip_entry) 4213 return; 4214 4215 __mlxsw_sp_nexthop_neigh_update(nh, true); 4216 nh->ipip_entry = NULL; 4217 } 4218 4219 static bool mlxsw_sp_nexthop4_ipip_type(const struct mlxsw_sp *mlxsw_sp, 4220 const struct fib_nh *fib_nh, 4221 enum mlxsw_sp_ipip_type *p_ipipt) 4222 { 4223 struct net_device *dev = fib_nh->fib_nh_dev; 4224 4225 return dev && 4226 fib_nh->nh_parent->fib_type == RTN_UNICAST && 4227 mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, p_ipipt); 4228 } 4229 4230 static int mlxsw_sp_nexthop_type_init(struct mlxsw_sp *mlxsw_sp, 4231 struct mlxsw_sp_nexthop *nh, 4232 const struct net_device *dev) 4233 { 4234 const struct mlxsw_sp_ipip_ops *ipip_ops; 4235 struct mlxsw_sp_ipip_entry *ipip_entry; 4236 struct mlxsw_sp_rif *rif; 4237 int err; 4238 4239 ipip_entry = mlxsw_sp_ipip_entry_find_by_ol_dev(mlxsw_sp, dev); 4240 if (ipip_entry) { 4241 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt]; 4242 if (ipip_ops->can_offload(mlxsw_sp, dev)) { 4243 nh->type = MLXSW_SP_NEXTHOP_TYPE_IPIP; 4244 mlxsw_sp_nexthop_ipip_init(mlxsw_sp, nh, ipip_entry); 4245 return 0; 4246 } 4247 } 4248 4249 nh->type = MLXSW_SP_NEXTHOP_TYPE_ETH; 4250 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 4251 if (!rif) 4252 return 0; 4253 4254 mlxsw_sp_nexthop_rif_init(nh, rif); 4255 err = mlxsw_sp_nexthop_neigh_init(mlxsw_sp, nh); 4256 if (err) 4257 goto err_neigh_init; 4258 4259 return 0; 4260 4261 err_neigh_init: 4262 mlxsw_sp_nexthop_rif_fini(nh); 4263 return err; 4264 } 4265 4266 static void mlxsw_sp_nexthop_type_fini(struct mlxsw_sp *mlxsw_sp, 4267 struct mlxsw_sp_nexthop *nh) 4268 { 4269 switch (nh->type) { 4270 case MLXSW_SP_NEXTHOP_TYPE_ETH: 4271 mlxsw_sp_nexthop_neigh_fini(mlxsw_sp, nh); 4272 mlxsw_sp_nexthop_rif_fini(nh); 4273 break; 4274 case MLXSW_SP_NEXTHOP_TYPE_IPIP: 4275 mlxsw_sp_nexthop_rif_fini(nh); 4276 mlxsw_sp_nexthop_ipip_fini(mlxsw_sp, nh); 4277 break; 4278 } 4279 } 4280 4281 static int mlxsw_sp_nexthop4_init(struct mlxsw_sp *mlxsw_sp, 4282 struct mlxsw_sp_nexthop_group *nh_grp, 4283 struct mlxsw_sp_nexthop *nh, 4284 struct fib_nh *fib_nh) 4285 { 4286 struct net_device *dev = fib_nh->fib_nh_dev; 4287 struct in_device *in_dev; 4288 int err; 4289 4290 nh->nhgi = nh_grp->nhgi; 4291 nh->key.fib_nh = fib_nh; 4292 #ifdef CONFIG_IP_ROUTE_MULTIPATH 4293 nh->nh_weight = fib_nh->fib_nh_weight; 4294 #else 4295 nh->nh_weight = 1; 4296 #endif 4297 memcpy(&nh->gw_addr, &fib_nh->fib_nh_gw4, sizeof(fib_nh->fib_nh_gw4)); 4298 nh->neigh_tbl = &arp_tbl; 4299 err = mlxsw_sp_nexthop_insert(mlxsw_sp, nh); 4300 if (err) 4301 return err; 4302 4303 mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh); 4304 list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list); 4305 4306 if (!dev) 4307 return 0; 4308 nh->ifindex = dev->ifindex; 4309 4310 rcu_read_lock(); 4311 in_dev = 
__in_dev_get_rcu(dev); 4312 if (in_dev && IN_DEV_IGNORE_ROUTES_WITH_LINKDOWN(in_dev) && 4313 fib_nh->fib_nh_flags & RTNH_F_LINKDOWN) { 4314 rcu_read_unlock(); 4315 return 0; 4316 } 4317 rcu_read_unlock(); 4318 4319 err = mlxsw_sp_nexthop_type_init(mlxsw_sp, nh, dev); 4320 if (err) 4321 goto err_nexthop_neigh_init; 4322 4323 return 0; 4324 4325 err_nexthop_neigh_init: 4326 list_del(&nh->router_list_node); 4327 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh); 4328 mlxsw_sp_nexthop_remove(mlxsw_sp, nh); 4329 return err; 4330 } 4331 4332 static void mlxsw_sp_nexthop4_fini(struct mlxsw_sp *mlxsw_sp, 4333 struct mlxsw_sp_nexthop *nh) 4334 { 4335 mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh); 4336 list_del(&nh->router_list_node); 4337 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh); 4338 mlxsw_sp_nexthop_remove(mlxsw_sp, nh); 4339 } 4340 4341 static void mlxsw_sp_nexthop4_event(struct mlxsw_sp *mlxsw_sp, 4342 unsigned long event, struct fib_nh *fib_nh) 4343 { 4344 struct mlxsw_sp_nexthop_key key; 4345 struct mlxsw_sp_nexthop *nh; 4346 4347 key.fib_nh = fib_nh; 4348 nh = mlxsw_sp_nexthop_lookup(mlxsw_sp, key); 4349 if (!nh) 4350 return; 4351 4352 switch (event) { 4353 case FIB_EVENT_NH_ADD: 4354 mlxsw_sp_nexthop_type_init(mlxsw_sp, nh, fib_nh->fib_nh_dev); 4355 break; 4356 case FIB_EVENT_NH_DEL: 4357 mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh); 4358 break; 4359 } 4360 4361 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nhgi->nh_grp); 4362 } 4363 4364 static void mlxsw_sp_nexthop_rif_update(struct mlxsw_sp *mlxsw_sp, 4365 struct mlxsw_sp_rif *rif) 4366 { 4367 struct mlxsw_sp_nexthop *nh; 4368 bool removing; 4369 4370 list_for_each_entry(nh, &rif->nexthop_list, rif_list_node) { 4371 switch (nh->type) { 4372 case MLXSW_SP_NEXTHOP_TYPE_ETH: 4373 removing = false; 4374 break; 4375 case MLXSW_SP_NEXTHOP_TYPE_IPIP: 4376 removing = !mlxsw_sp_ipip_netdev_ul_up(rif->dev); 4377 break; 4378 default: 4379 WARN_ON(1); 4380 continue; 4381 } 4382 4383 __mlxsw_sp_nexthop_neigh_update(nh, removing); 4384 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nhgi->nh_grp); 4385 } 4386 } 4387 4388 static void mlxsw_sp_nexthop_rif_migrate(struct mlxsw_sp *mlxsw_sp, 4389 struct mlxsw_sp_rif *old_rif, 4390 struct mlxsw_sp_rif *new_rif) 4391 { 4392 struct mlxsw_sp_nexthop *nh; 4393 4394 list_splice_init(&old_rif->nexthop_list, &new_rif->nexthop_list); 4395 list_for_each_entry(nh, &new_rif->nexthop_list, rif_list_node) 4396 nh->rif = new_rif; 4397 mlxsw_sp_nexthop_rif_update(mlxsw_sp, new_rif); 4398 } 4399 4400 static void mlxsw_sp_nexthop_rif_gone_sync(struct mlxsw_sp *mlxsw_sp, 4401 struct mlxsw_sp_rif *rif) 4402 { 4403 struct mlxsw_sp_nexthop *nh, *tmp; 4404 4405 list_for_each_entry_safe(nh, tmp, &rif->nexthop_list, rif_list_node) { 4406 mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh); 4407 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nhgi->nh_grp); 4408 } 4409 } 4410 4411 static int mlxsw_sp_adj_trap_entry_init(struct mlxsw_sp *mlxsw_sp) 4412 { 4413 enum mlxsw_reg_ratr_trap_action trap_action; 4414 char ratr_pl[MLXSW_REG_RATR_LEN]; 4415 int err; 4416 4417 err = mlxsw_sp_kvdl_alloc(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 1, 4418 &mlxsw_sp->router->adj_trap_index); 4419 if (err) 4420 return err; 4421 4422 trap_action = MLXSW_REG_RATR_TRAP_ACTION_TRAP; 4423 mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY, true, 4424 MLXSW_REG_RATR_TYPE_ETHERNET, 4425 mlxsw_sp->router->adj_trap_index, 4426 mlxsw_sp->router->lb_rif_index); 4427 mlxsw_reg_ratr_trap_action_set(ratr_pl, trap_action); 4428 mlxsw_reg_ratr_trap_id_set(ratr_pl, 
MLXSW_TRAP_ID_RTR_EGRESS0); 4429 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl); 4430 if (err) 4431 goto err_ratr_write; 4432 4433 return 0; 4434 4435 err_ratr_write: 4436 mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 1, 4437 mlxsw_sp->router->adj_trap_index); 4438 return err; 4439 } 4440 4441 static void mlxsw_sp_adj_trap_entry_fini(struct mlxsw_sp *mlxsw_sp) 4442 { 4443 mlxsw_sp_kvdl_free(mlxsw_sp, MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 1, 4444 mlxsw_sp->router->adj_trap_index); 4445 } 4446 4447 static int mlxsw_sp_nexthop_group_inc(struct mlxsw_sp *mlxsw_sp) 4448 { 4449 int err; 4450 4451 if (refcount_inc_not_zero(&mlxsw_sp->router->num_groups)) 4452 return 0; 4453 4454 err = mlxsw_sp_adj_trap_entry_init(mlxsw_sp); 4455 if (err) 4456 return err; 4457 4458 refcount_set(&mlxsw_sp->router->num_groups, 1); 4459 4460 return 0; 4461 } 4462 4463 static void mlxsw_sp_nexthop_group_dec(struct mlxsw_sp *mlxsw_sp) 4464 { 4465 if (!refcount_dec_and_test(&mlxsw_sp->router->num_groups)) 4466 return; 4467 4468 mlxsw_sp_adj_trap_entry_fini(mlxsw_sp); 4469 } 4470 4471 static void 4472 mlxsw_sp_nh_grp_activity_get(struct mlxsw_sp *mlxsw_sp, 4473 const struct mlxsw_sp_nexthop_group *nh_grp, 4474 unsigned long *activity) 4475 { 4476 char *ratrad_pl; 4477 int i, err; 4478 4479 ratrad_pl = kmalloc(MLXSW_REG_RATRAD_LEN, GFP_KERNEL); 4480 if (!ratrad_pl) 4481 return; 4482 4483 mlxsw_reg_ratrad_pack(ratrad_pl, nh_grp->nhgi->adj_index, 4484 nh_grp->nhgi->count); 4485 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ratrad), ratrad_pl); 4486 if (err) 4487 goto out; 4488 4489 for (i = 0; i < nh_grp->nhgi->count; i++) { 4490 if (!mlxsw_reg_ratrad_activity_vector_get(ratrad_pl, i)) 4491 continue; 4492 bitmap_set(activity, i, 1); 4493 } 4494 4495 out: 4496 kfree(ratrad_pl); 4497 } 4498 4499 #define MLXSW_SP_NH_GRP_ACTIVITY_UPDATE_INTERVAL 1000 /* ms */ 4500 4501 static void 4502 mlxsw_sp_nh_grp_activity_update(struct mlxsw_sp *mlxsw_sp, 4503 const struct mlxsw_sp_nexthop_group *nh_grp) 4504 { 4505 unsigned long *activity; 4506 4507 activity = bitmap_zalloc(nh_grp->nhgi->count, GFP_KERNEL); 4508 if (!activity) 4509 return; 4510 4511 mlxsw_sp_nh_grp_activity_get(mlxsw_sp, nh_grp, activity); 4512 nexthop_res_grp_activity_update(mlxsw_sp_net(mlxsw_sp), nh_grp->obj.id, 4513 nh_grp->nhgi->count, activity); 4514 4515 bitmap_free(activity); 4516 } 4517 4518 static void 4519 mlxsw_sp_nh_grp_activity_work_schedule(struct mlxsw_sp *mlxsw_sp) 4520 { 4521 unsigned int interval = MLXSW_SP_NH_GRP_ACTIVITY_UPDATE_INTERVAL; 4522 4523 mlxsw_core_schedule_dw(&mlxsw_sp->router->nh_grp_activity_dw, 4524 msecs_to_jiffies(interval)); 4525 } 4526 4527 static void mlxsw_sp_nh_grp_activity_work(struct work_struct *work) 4528 { 4529 struct mlxsw_sp_nexthop_group_info *nhgi; 4530 struct mlxsw_sp_router *router; 4531 bool reschedule = false; 4532 4533 router = container_of(work, struct mlxsw_sp_router, 4534 nh_grp_activity_dw.work); 4535 4536 mutex_lock(&router->lock); 4537 4538 list_for_each_entry(nhgi, &router->nh_res_grp_list, list) { 4539 mlxsw_sp_nh_grp_activity_update(router->mlxsw_sp, nhgi->nh_grp); 4540 reschedule = true; 4541 } 4542 4543 mutex_unlock(&router->lock); 4544 4545 if (!reschedule) 4546 return; 4547 mlxsw_sp_nh_grp_activity_work_schedule(router->mlxsw_sp); 4548 } 4549 4550 static int 4551 mlxsw_sp_nexthop_obj_single_validate(struct mlxsw_sp *mlxsw_sp, 4552 const struct nh_notifier_single_info *nh, 4553 struct netlink_ext_ack *extack) 4554 { 4555 int err = -EINVAL; 4556 4557 if (nh->is_fdb) 4558 
NL_SET_ERR_MSG_MOD(extack, "FDB nexthops are not supported"); 4559 else if (nh->has_encap) 4560 NL_SET_ERR_MSG_MOD(extack, "Encapsulating nexthops are not supported"); 4561 else 4562 err = 0; 4563 4564 return err; 4565 } 4566 4567 static int 4568 mlxsw_sp_nexthop_obj_group_entry_validate(struct mlxsw_sp *mlxsw_sp, 4569 const struct nh_notifier_single_info *nh, 4570 struct netlink_ext_ack *extack) 4571 { 4572 int err; 4573 4574 err = mlxsw_sp_nexthop_obj_single_validate(mlxsw_sp, nh, extack); 4575 if (err) 4576 return err; 4577 4578 /* Device only nexthops with an IPIP device are programmed as 4579 * encapsulating adjacency entries. 4580 */ 4581 if (!nh->gw_family && !nh->is_reject && 4582 !mlxsw_sp_netdev_ipip_type(mlxsw_sp, nh->dev, NULL)) { 4583 NL_SET_ERR_MSG_MOD(extack, "Nexthop group entry does not have a gateway"); 4584 return -EINVAL; 4585 } 4586 4587 return 0; 4588 } 4589 4590 static int 4591 mlxsw_sp_nexthop_obj_group_validate(struct mlxsw_sp *mlxsw_sp, 4592 const struct nh_notifier_grp_info *nh_grp, 4593 struct netlink_ext_ack *extack) 4594 { 4595 int i; 4596 4597 if (nh_grp->is_fdb) { 4598 NL_SET_ERR_MSG_MOD(extack, "FDB nexthop groups are not supported"); 4599 return -EINVAL; 4600 } 4601 4602 for (i = 0; i < nh_grp->num_nh; i++) { 4603 const struct nh_notifier_single_info *nh; 4604 int err; 4605 4606 nh = &nh_grp->nh_entries[i].nh; 4607 err = mlxsw_sp_nexthop_obj_group_entry_validate(mlxsw_sp, nh, 4608 extack); 4609 if (err) 4610 return err; 4611 } 4612 4613 return 0; 4614 } 4615 4616 static int 4617 mlxsw_sp_nexthop_obj_res_group_size_validate(struct mlxsw_sp *mlxsw_sp, 4618 const struct nh_notifier_res_table_info *nh_res_table, 4619 struct netlink_ext_ack *extack) 4620 { 4621 unsigned int alloc_size; 4622 bool valid_size = false; 4623 int err, i; 4624 4625 if (nh_res_table->num_nh_buckets < 32) { 4626 NL_SET_ERR_MSG_MOD(extack, "Minimum number of buckets is 32"); 4627 return -EINVAL; 4628 } 4629 4630 for (i = 0; i < mlxsw_sp->router->adj_grp_size_ranges_count; i++) { 4631 const struct mlxsw_sp_adj_grp_size_range *size_range; 4632 4633 size_range = &mlxsw_sp->router->adj_grp_size_ranges[i]; 4634 4635 if (nh_res_table->num_nh_buckets >= size_range->start && 4636 nh_res_table->num_nh_buckets <= size_range->end) { 4637 valid_size = true; 4638 break; 4639 } 4640 } 4641 4642 if (!valid_size) { 4643 NL_SET_ERR_MSG_MOD(extack, "Invalid number of buckets"); 4644 return -EINVAL; 4645 } 4646 4647 err = mlxsw_sp_kvdl_alloc_count_query(mlxsw_sp, 4648 MLXSW_SP_KVDL_ENTRY_TYPE_ADJ, 4649 nh_res_table->num_nh_buckets, 4650 &alloc_size); 4651 if (err || nh_res_table->num_nh_buckets != alloc_size) { 4652 NL_SET_ERR_MSG_MOD(extack, "Number of buckets does not fit allocation size of any KVDL partition"); 4653 return -EINVAL; 4654 } 4655 4656 return 0; 4657 } 4658 4659 static int 4660 mlxsw_sp_nexthop_obj_res_group_validate(struct mlxsw_sp *mlxsw_sp, 4661 const struct nh_notifier_res_table_info *nh_res_table, 4662 struct netlink_ext_ack *extack) 4663 { 4664 int err; 4665 u16 i; 4666 4667 err = mlxsw_sp_nexthop_obj_res_group_size_validate(mlxsw_sp, 4668 nh_res_table, 4669 extack); 4670 if (err) 4671 return err; 4672 4673 for (i = 0; i < nh_res_table->num_nh_buckets; i++) { 4674 const struct nh_notifier_single_info *nh; 4675 int err; 4676 4677 nh = &nh_res_table->nhs[i]; 4678 err = mlxsw_sp_nexthop_obj_group_entry_validate(mlxsw_sp, nh, 4679 extack); 4680 if (err) 4681 return err; 4682 } 4683 4684 return 0; 4685 } 4686 4687 static int mlxsw_sp_nexthop_obj_validate(struct mlxsw_sp *mlxsw_sp, 4688 
unsigned long event, 4689 struct nh_notifier_info *info) 4690 { 4691 struct nh_notifier_single_info *nh; 4692 4693 if (event != NEXTHOP_EVENT_REPLACE && 4694 event != NEXTHOP_EVENT_RES_TABLE_PRE_REPLACE && 4695 event != NEXTHOP_EVENT_BUCKET_REPLACE) 4696 return 0; 4697 4698 switch (info->type) { 4699 case NH_NOTIFIER_INFO_TYPE_SINGLE: 4700 return mlxsw_sp_nexthop_obj_single_validate(mlxsw_sp, info->nh, 4701 info->extack); 4702 case NH_NOTIFIER_INFO_TYPE_GRP: 4703 return mlxsw_sp_nexthop_obj_group_validate(mlxsw_sp, 4704 info->nh_grp, 4705 info->extack); 4706 case NH_NOTIFIER_INFO_TYPE_RES_TABLE: 4707 return mlxsw_sp_nexthop_obj_res_group_validate(mlxsw_sp, 4708 info->nh_res_table, 4709 info->extack); 4710 case NH_NOTIFIER_INFO_TYPE_RES_BUCKET: 4711 nh = &info->nh_res_bucket->new_nh; 4712 return mlxsw_sp_nexthop_obj_group_entry_validate(mlxsw_sp, nh, 4713 info->extack); 4714 default: 4715 NL_SET_ERR_MSG_MOD(info->extack, "Unsupported nexthop type"); 4716 return -EOPNOTSUPP; 4717 } 4718 } 4719 4720 static bool mlxsw_sp_nexthop_obj_is_gateway(struct mlxsw_sp *mlxsw_sp, 4721 const struct nh_notifier_info *info) 4722 { 4723 const struct net_device *dev; 4724 4725 switch (info->type) { 4726 case NH_NOTIFIER_INFO_TYPE_SINGLE: 4727 dev = info->nh->dev; 4728 return info->nh->gw_family || info->nh->is_reject || 4729 mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL); 4730 case NH_NOTIFIER_INFO_TYPE_GRP: 4731 case NH_NOTIFIER_INFO_TYPE_RES_TABLE: 4732 /* Already validated earlier. */ 4733 return true; 4734 default: 4735 return false; 4736 } 4737 } 4738 4739 static void mlxsw_sp_nexthop_obj_blackhole_init(struct mlxsw_sp *mlxsw_sp, 4740 struct mlxsw_sp_nexthop *nh) 4741 { 4742 u16 lb_rif_index = mlxsw_sp->router->lb_rif_index; 4743 4744 nh->action = MLXSW_SP_NEXTHOP_ACTION_DISCARD; 4745 nh->should_offload = 1; 4746 /* While nexthops that discard packets do not forward packets 4747 * via an egress RIF, they still need to be programmed using a 4748 * valid RIF, so use the loopback RIF created during init. 4749 */ 4750 nh->rif = mlxsw_sp->router->rifs[lb_rif_index]; 4751 } 4752 4753 static void mlxsw_sp_nexthop_obj_blackhole_fini(struct mlxsw_sp *mlxsw_sp, 4754 struct mlxsw_sp_nexthop *nh) 4755 { 4756 nh->rif = NULL; 4757 nh->should_offload = 0; 4758 } 4759 4760 static int 4761 mlxsw_sp_nexthop_obj_init(struct mlxsw_sp *mlxsw_sp, 4762 struct mlxsw_sp_nexthop_group *nh_grp, 4763 struct mlxsw_sp_nexthop *nh, 4764 struct nh_notifier_single_info *nh_obj, int weight) 4765 { 4766 struct net_device *dev = nh_obj->dev; 4767 int err; 4768 4769 nh->nhgi = nh_grp->nhgi; 4770 nh->nh_weight = weight; 4771 4772 switch (nh_obj->gw_family) { 4773 case AF_INET: 4774 memcpy(&nh->gw_addr, &nh_obj->ipv4, sizeof(nh_obj->ipv4)); 4775 nh->neigh_tbl = &arp_tbl; 4776 break; 4777 case AF_INET6: 4778 memcpy(&nh->gw_addr, &nh_obj->ipv6, sizeof(nh_obj->ipv6)); 4779 #if IS_ENABLED(CONFIG_IPV6) 4780 nh->neigh_tbl = &nd_tbl; 4781 #endif 4782 break; 4783 } 4784 4785 mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh); 4786 list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list); 4787 nh->ifindex = dev->ifindex; 4788 4789 err = mlxsw_sp_nexthop_type_init(mlxsw_sp, nh, dev); 4790 if (err) 4791 goto err_type_init; 4792 4793 if (nh_obj->is_reject) 4794 mlxsw_sp_nexthop_obj_blackhole_init(mlxsw_sp, nh); 4795 4796 /* In a resilient nexthop group, all the nexthops must be written to 4797 * the adjacency table. Even if they do not have a valid neighbour or 4798 * RIF. 
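* Such nexthops are programmed with a trap action, so that packets hitting their adjacency entries are punted to the CPU instead of being forwarded using invalid forwarding information.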
4799 */ 4800 if (nh_grp->nhgi->is_resilient && !nh->should_offload) { 4801 nh->action = MLXSW_SP_NEXTHOP_ACTION_TRAP; 4802 nh->should_offload = 1; 4803 } 4804 4805 return 0; 4806 4807 err_type_init: 4808 list_del(&nh->router_list_node); 4809 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh); 4810 return err; 4811 } 4812 4813 static void mlxsw_sp_nexthop_obj_fini(struct mlxsw_sp *mlxsw_sp, 4814 struct mlxsw_sp_nexthop *nh) 4815 { 4816 if (nh->action == MLXSW_SP_NEXTHOP_ACTION_DISCARD) 4817 mlxsw_sp_nexthop_obj_blackhole_fini(mlxsw_sp, nh); 4818 mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh); 4819 list_del(&nh->router_list_node); 4820 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh); 4821 nh->should_offload = 0; 4822 } 4823 4824 static int 4825 mlxsw_sp_nexthop_obj_group_info_init(struct mlxsw_sp *mlxsw_sp, 4826 struct mlxsw_sp_nexthop_group *nh_grp, 4827 struct nh_notifier_info *info) 4828 { 4829 struct mlxsw_sp_nexthop_group_info *nhgi; 4830 struct mlxsw_sp_nexthop *nh; 4831 bool is_resilient = false; 4832 unsigned int nhs; 4833 int err, i; 4834 4835 switch (info->type) { 4836 case NH_NOTIFIER_INFO_TYPE_SINGLE: 4837 nhs = 1; 4838 break; 4839 case NH_NOTIFIER_INFO_TYPE_GRP: 4840 nhs = info->nh_grp->num_nh; 4841 break; 4842 case NH_NOTIFIER_INFO_TYPE_RES_TABLE: 4843 nhs = info->nh_res_table->num_nh_buckets; 4844 is_resilient = true; 4845 break; 4846 default: 4847 return -EINVAL; 4848 } 4849 4850 nhgi = kzalloc(struct_size(nhgi, nexthops, nhs), GFP_KERNEL); 4851 if (!nhgi) 4852 return -ENOMEM; 4853 nh_grp->nhgi = nhgi; 4854 nhgi->nh_grp = nh_grp; 4855 nhgi->gateway = mlxsw_sp_nexthop_obj_is_gateway(mlxsw_sp, info); 4856 nhgi->is_resilient = is_resilient; 4857 nhgi->count = nhs; 4858 for (i = 0; i < nhgi->count; i++) { 4859 struct nh_notifier_single_info *nh_obj; 4860 int weight; 4861 4862 nh = &nhgi->nexthops[i]; 4863 switch (info->type) { 4864 case NH_NOTIFIER_INFO_TYPE_SINGLE: 4865 nh_obj = info->nh; 4866 weight = 1; 4867 break; 4868 case NH_NOTIFIER_INFO_TYPE_GRP: 4869 nh_obj = &info->nh_grp->nh_entries[i].nh; 4870 weight = info->nh_grp->nh_entries[i].weight; 4871 break; 4872 case NH_NOTIFIER_INFO_TYPE_RES_TABLE: 4873 nh_obj = &info->nh_res_table->nhs[i]; 4874 weight = 1; 4875 break; 4876 default: 4877 err = -EINVAL; 4878 goto err_nexthop_obj_init; 4879 } 4880 err = mlxsw_sp_nexthop_obj_init(mlxsw_sp, nh_grp, nh, nh_obj, 4881 weight); 4882 if (err) 4883 goto err_nexthop_obj_init; 4884 } 4885 err = mlxsw_sp_nexthop_group_inc(mlxsw_sp); 4886 if (err) 4887 goto err_group_inc; 4888 err = mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp); 4889 if (err) { 4890 NL_SET_ERR_MSG_MOD(info->extack, "Failed to write adjacency entries to the device"); 4891 goto err_group_refresh; 4892 } 4893 4894 /* Add resilient nexthop groups to a list so that the activity of their 4895 * nexthop buckets will be periodically queried and cleared. 
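* The delayed work is scheduled when the first resilient group is added and cancelled once the last one is removed.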
4896 */ 4897 if (nhgi->is_resilient) { 4898 if (list_empty(&mlxsw_sp->router->nh_res_grp_list)) 4899 mlxsw_sp_nh_grp_activity_work_schedule(mlxsw_sp); 4900 list_add(&nhgi->list, &mlxsw_sp->router->nh_res_grp_list); 4901 } 4902 4903 return 0; 4904 4905 err_group_refresh: 4906 mlxsw_sp_nexthop_group_dec(mlxsw_sp); 4907 err_group_inc: 4908 i = nhgi->count; 4909 err_nexthop_obj_init: 4910 for (i--; i >= 0; i--) { 4911 nh = &nhgi->nexthops[i]; 4912 mlxsw_sp_nexthop_obj_fini(mlxsw_sp, nh); 4913 } 4914 kfree(nhgi); 4915 return err; 4916 } 4917 4918 static void 4919 mlxsw_sp_nexthop_obj_group_info_fini(struct mlxsw_sp *mlxsw_sp, 4920 struct mlxsw_sp_nexthop_group *nh_grp) 4921 { 4922 struct mlxsw_sp_nexthop_group_info *nhgi = nh_grp->nhgi; 4923 struct mlxsw_sp_router *router = mlxsw_sp->router; 4924 int i; 4925 4926 if (nhgi->is_resilient) { 4927 list_del(&nhgi->list); 4928 if (list_empty(&mlxsw_sp->router->nh_res_grp_list)) 4929 cancel_delayed_work(&router->nh_grp_activity_dw); 4930 } 4931 4932 mlxsw_sp_nexthop_group_dec(mlxsw_sp); 4933 for (i = nhgi->count - 1; i >= 0; i--) { 4934 struct mlxsw_sp_nexthop *nh = &nhgi->nexthops[i]; 4935 4936 mlxsw_sp_nexthop_obj_fini(mlxsw_sp, nh); 4937 } 4938 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp); 4939 WARN_ON_ONCE(nhgi->adj_index_valid); 4940 kfree(nhgi); 4941 } 4942 4943 static struct mlxsw_sp_nexthop_group * 4944 mlxsw_sp_nexthop_obj_group_create(struct mlxsw_sp *mlxsw_sp, 4945 struct nh_notifier_info *info) 4946 { 4947 struct mlxsw_sp_nexthop_group *nh_grp; 4948 int err; 4949 4950 nh_grp = kzalloc(sizeof(*nh_grp), GFP_KERNEL); 4951 if (!nh_grp) 4952 return ERR_PTR(-ENOMEM); 4953 INIT_LIST_HEAD(&nh_grp->vr_list); 4954 err = rhashtable_init(&nh_grp->vr_ht, 4955 &mlxsw_sp_nexthop_group_vr_ht_params); 4956 if (err) 4957 goto err_nexthop_group_vr_ht_init; 4958 INIT_LIST_HEAD(&nh_grp->fib_list); 4959 nh_grp->type = MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ; 4960 nh_grp->obj.id = info->id; 4961 4962 err = mlxsw_sp_nexthop_obj_group_info_init(mlxsw_sp, nh_grp, info); 4963 if (err) 4964 goto err_nexthop_group_info_init; 4965 4966 nh_grp->can_destroy = false; 4967 4968 return nh_grp; 4969 4970 err_nexthop_group_info_init: 4971 rhashtable_destroy(&nh_grp->vr_ht); 4972 err_nexthop_group_vr_ht_init: 4973 kfree(nh_grp); 4974 return ERR_PTR(err); 4975 } 4976 4977 static void 4978 mlxsw_sp_nexthop_obj_group_destroy(struct mlxsw_sp *mlxsw_sp, 4979 struct mlxsw_sp_nexthop_group *nh_grp) 4980 { 4981 if (!nh_grp->can_destroy) 4982 return; 4983 mlxsw_sp_nexthop_obj_group_info_fini(mlxsw_sp, nh_grp); 4984 WARN_ON_ONCE(!list_empty(&nh_grp->fib_list)); 4985 WARN_ON_ONCE(!list_empty(&nh_grp->vr_list)); 4986 rhashtable_destroy(&nh_grp->vr_ht); 4987 kfree(nh_grp); 4988 } 4989 4990 static struct mlxsw_sp_nexthop_group * 4991 mlxsw_sp_nexthop_obj_group_lookup(struct mlxsw_sp *mlxsw_sp, u32 id) 4992 { 4993 struct mlxsw_sp_nexthop_group_cmp_arg cmp_arg; 4994 4995 cmp_arg.type = MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ; 4996 cmp_arg.id = id; 4997 return rhashtable_lookup_fast(&mlxsw_sp->router->nexthop_group_ht, 4998 &cmp_arg, 4999 mlxsw_sp_nexthop_group_ht_params); 5000 } 5001 5002 static int mlxsw_sp_nexthop_obj_group_add(struct mlxsw_sp *mlxsw_sp, 5003 struct mlxsw_sp_nexthop_group *nh_grp) 5004 { 5005 return mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp); 5006 } 5007 5008 static int 5009 mlxsw_sp_nexthop_obj_group_replace(struct mlxsw_sp *mlxsw_sp, 5010 struct mlxsw_sp_nexthop_group *nh_grp, 5011 struct mlxsw_sp_nexthop_group *old_nh_grp, 5012 struct netlink_ext_ack *extack) 5013 { 5014 struct 
mlxsw_sp_nexthop_group_info *old_nhgi = old_nh_grp->nhgi; 5015 struct mlxsw_sp_nexthop_group_info *new_nhgi = nh_grp->nhgi; 5016 int err; 5017 5018 old_nh_grp->nhgi = new_nhgi; 5019 new_nhgi->nh_grp = old_nh_grp; 5020 nh_grp->nhgi = old_nhgi; 5021 old_nhgi->nh_grp = nh_grp; 5022 5023 if (old_nhgi->adj_index_valid && new_nhgi->adj_index_valid) { 5024 /* Both the old adjacency index and the new one are valid. 5025 * Routes are currently using the old one. Tell the device to 5026 * replace the old adjacency index with the new one. 5027 */ 5028 err = mlxsw_sp_adj_index_mass_update(mlxsw_sp, old_nh_grp, 5029 old_nhgi->adj_index, 5030 old_nhgi->ecmp_size); 5031 if (err) { 5032 NL_SET_ERR_MSG_MOD(extack, "Failed to replace old adjacency index with new one"); 5033 goto err_out; 5034 } 5035 } else if (old_nhgi->adj_index_valid && !new_nhgi->adj_index_valid) { 5036 /* The old adjacency index is valid, while the new one is not. 5037 * Iterate over all the routes using the group and change them 5038 * to trap packets to the CPU. 5039 */ 5040 err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, old_nh_grp); 5041 if (err) { 5042 NL_SET_ERR_MSG_MOD(extack, "Failed to update routes to trap packets"); 5043 goto err_out; 5044 } 5045 } else if (!old_nhgi->adj_index_valid && new_nhgi->adj_index_valid) { 5046 /* The old adjacency index is invalid, while the new one is. 5047 * Iterate over all the routes using the group and change them 5048 * to forward packets using the new valid index. 5049 */ 5050 err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, old_nh_grp); 5051 if (err) { 5052 NL_SET_ERR_MSG_MOD(extack, "Failed to update routes to forward packets"); 5053 goto err_out; 5054 } 5055 } 5056 5057 /* Make sure the flags are set / cleared based on the new nexthop group 5058 * information. 5059 */ 5060 mlxsw_sp_nexthop_obj_group_offload_refresh(mlxsw_sp, old_nh_grp); 5061 5062 /* At this point 'nh_grp' is just a shell that is not used by anyone 5063 * and its nexthop group info is the old info that was just replaced 5064 * with the new one. Remove it. 
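* Since the group infos were swapped at the start of this function, destroying 'nh_grp' releases the replaced info, while the routes keep using 'old_nh_grp', now backed by the new info.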
5065 */ 5066 nh_grp->can_destroy = true; 5067 mlxsw_sp_nexthop_obj_group_destroy(mlxsw_sp, nh_grp); 5068 5069 return 0; 5070 5071 err_out: 5072 old_nhgi->nh_grp = old_nh_grp; 5073 nh_grp->nhgi = new_nhgi; 5074 new_nhgi->nh_grp = nh_grp; 5075 old_nh_grp->nhgi = old_nhgi; 5076 return err; 5077 } 5078 5079 static int mlxsw_sp_nexthop_obj_new(struct mlxsw_sp *mlxsw_sp, 5080 struct nh_notifier_info *info) 5081 { 5082 struct mlxsw_sp_nexthop_group *nh_grp, *old_nh_grp; 5083 struct netlink_ext_ack *extack = info->extack; 5084 int err; 5085 5086 nh_grp = mlxsw_sp_nexthop_obj_group_create(mlxsw_sp, info); 5087 if (IS_ERR(nh_grp)) 5088 return PTR_ERR(nh_grp); 5089 5090 old_nh_grp = mlxsw_sp_nexthop_obj_group_lookup(mlxsw_sp, info->id); 5091 if (!old_nh_grp) 5092 err = mlxsw_sp_nexthop_obj_group_add(mlxsw_sp, nh_grp); 5093 else 5094 err = mlxsw_sp_nexthop_obj_group_replace(mlxsw_sp, nh_grp, 5095 old_nh_grp, extack); 5096 5097 if (err) { 5098 nh_grp->can_destroy = true; 5099 mlxsw_sp_nexthop_obj_group_destroy(mlxsw_sp, nh_grp); 5100 } 5101 5102 return err; 5103 } 5104 5105 static void mlxsw_sp_nexthop_obj_del(struct mlxsw_sp *mlxsw_sp, 5106 struct nh_notifier_info *info) 5107 { 5108 struct mlxsw_sp_nexthop_group *nh_grp; 5109 5110 nh_grp = mlxsw_sp_nexthop_obj_group_lookup(mlxsw_sp, info->id); 5111 if (!nh_grp) 5112 return; 5113 5114 nh_grp->can_destroy = true; 5115 mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp); 5116 5117 /* If the group still has routes using it, then defer the delete 5118 * operation until the last route using it is deleted. 5119 */ 5120 if (!list_empty(&nh_grp->fib_list)) 5121 return; 5122 mlxsw_sp_nexthop_obj_group_destroy(mlxsw_sp, nh_grp); 5123 } 5124 5125 static int mlxsw_sp_nexthop_obj_bucket_query(struct mlxsw_sp *mlxsw_sp, 5126 u32 adj_index, char *ratr_pl) 5127 { 5128 MLXSW_REG_ZERO(ratr, ratr_pl); 5129 mlxsw_reg_ratr_op_set(ratr_pl, MLXSW_REG_RATR_OP_QUERY_READ); 5130 mlxsw_reg_ratr_adjacency_index_low_set(ratr_pl, adj_index); 5131 mlxsw_reg_ratr_adjacency_index_high_set(ratr_pl, adj_index >> 16); 5132 5133 return mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl); 5134 } 5135 5136 static int mlxsw_sp_nexthop_obj_bucket_compare(char *ratr_pl, char *ratr_pl_new) 5137 { 5138 /* Clear the opcode and activity on both the old and new payload as 5139 * they are irrelevant for the comparison. 5140 */ 5141 mlxsw_reg_ratr_op_set(ratr_pl, MLXSW_REG_RATR_OP_QUERY_READ); 5142 mlxsw_reg_ratr_a_set(ratr_pl, 0); 5143 mlxsw_reg_ratr_op_set(ratr_pl_new, MLXSW_REG_RATR_OP_QUERY_READ); 5144 mlxsw_reg_ratr_a_set(ratr_pl_new, 0); 5145 5146 /* If the contents of the adjacency entry are consistent with the 5147 * replacement request, then replacement was successful. 5148 */ 5149 if (!memcmp(ratr_pl, ratr_pl_new, MLXSW_REG_RATR_LEN)) 5150 return 0; 5151 5152 return -EINVAL; 5153 } 5154 5155 static int 5156 mlxsw_sp_nexthop_obj_bucket_adj_update(struct mlxsw_sp *mlxsw_sp, 5157 struct mlxsw_sp_nexthop *nh, 5158 struct nh_notifier_info *info) 5159 { 5160 u16 bucket_index = info->nh_res_bucket->bucket_index; 5161 struct netlink_ext_ack *extack = info->extack; 5162 bool force = info->nh_res_bucket->force; 5163 char ratr_pl_new[MLXSW_REG_RATR_LEN]; 5164 char ratr_pl[MLXSW_REG_RATR_LEN]; 5165 u32 adj_index; 5166 int err; 5167 5168 /* No point in trying an atomic replacement if the idle timer interval 5169 * is smaller than the interval in which we query and clear activity. 
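* The reported activity could then be stale by the time the entry is overwritten, so fall back to a forced replacement instead.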
5170 */ 5171 if (!force && info->nh_res_bucket->idle_timer_ms < 5172 MLXSW_SP_NH_GRP_ACTIVITY_UPDATE_INTERVAL) 5173 force = true; 5174 5175 adj_index = nh->nhgi->adj_index + bucket_index; 5176 err = mlxsw_sp_nexthop_update(mlxsw_sp, adj_index, nh, force, ratr_pl); 5177 if (err) { 5178 NL_SET_ERR_MSG_MOD(extack, "Failed to overwrite nexthop bucket"); 5179 return err; 5180 } 5181 5182 if (!force) { 5183 err = mlxsw_sp_nexthop_obj_bucket_query(mlxsw_sp, adj_index, 5184 ratr_pl_new); 5185 if (err) { 5186 NL_SET_ERR_MSG_MOD(extack, "Failed to query nexthop bucket state after replacement. State might be inconsistent"); 5187 return err; 5188 } 5189 5190 err = mlxsw_sp_nexthop_obj_bucket_compare(ratr_pl, ratr_pl_new); 5191 if (err) { 5192 NL_SET_ERR_MSG_MOD(extack, "Nexthop bucket was not replaced because it was active during replacement"); 5193 return err; 5194 } 5195 } 5196 5197 nh->update = 0; 5198 nh->offloaded = 1; 5199 mlxsw_sp_nexthop_bucket_offload_refresh(mlxsw_sp, nh, bucket_index); 5200 5201 return 0; 5202 } 5203 5204 static int mlxsw_sp_nexthop_obj_bucket_replace(struct mlxsw_sp *mlxsw_sp, 5205 struct nh_notifier_info *info) 5206 { 5207 u16 bucket_index = info->nh_res_bucket->bucket_index; 5208 struct netlink_ext_ack *extack = info->extack; 5209 struct mlxsw_sp_nexthop_group_info *nhgi; 5210 struct nh_notifier_single_info *nh_obj; 5211 struct mlxsw_sp_nexthop_group *nh_grp; 5212 struct mlxsw_sp_nexthop *nh; 5213 int err; 5214 5215 nh_grp = mlxsw_sp_nexthop_obj_group_lookup(mlxsw_sp, info->id); 5216 if (!nh_grp) { 5217 NL_SET_ERR_MSG_MOD(extack, "Nexthop group was not found"); 5218 return -EINVAL; 5219 } 5220 5221 nhgi = nh_grp->nhgi; 5222 5223 if (bucket_index >= nhgi->count) { 5224 NL_SET_ERR_MSG_MOD(extack, "Nexthop bucket index out of range"); 5225 return -EINVAL; 5226 } 5227 5228 nh = &nhgi->nexthops[bucket_index]; 5229 mlxsw_sp_nexthop_obj_fini(mlxsw_sp, nh); 5230 5231 nh_obj = &info->nh_res_bucket->new_nh; 5232 err = mlxsw_sp_nexthop_obj_init(mlxsw_sp, nh_grp, nh, nh_obj, 1); 5233 if (err) { 5234 NL_SET_ERR_MSG_MOD(extack, "Failed to initialize nexthop object for nexthop bucket replacement"); 5235 goto err_nexthop_obj_init; 5236 } 5237 5238 err = mlxsw_sp_nexthop_obj_bucket_adj_update(mlxsw_sp, nh, info); 5239 if (err) 5240 goto err_nexthop_obj_bucket_adj_update; 5241 5242 return 0; 5243 5244 err_nexthop_obj_bucket_adj_update: 5245 mlxsw_sp_nexthop_obj_fini(mlxsw_sp, nh); 5246 err_nexthop_obj_init: 5247 nh_obj = &info->nh_res_bucket->old_nh; 5248 mlxsw_sp_nexthop_obj_init(mlxsw_sp, nh_grp, nh, nh_obj, 1); 5249 /* The old adjacency entry was not overwritten */ 5250 nh->update = 0; 5251 nh->offloaded = 1; 5252 return err; 5253 } 5254 5255 static int mlxsw_sp_nexthop_obj_event(struct notifier_block *nb, 5256 unsigned long event, void *ptr) 5257 { 5258 struct nh_notifier_info *info = ptr; 5259 struct mlxsw_sp_router *router; 5260 int err = 0; 5261 5262 router = container_of(nb, struct mlxsw_sp_router, nexthop_nb); 5263 err = mlxsw_sp_nexthop_obj_validate(router->mlxsw_sp, event, info); 5264 if (err) 5265 goto out; 5266 5267 mutex_lock(&router->lock); 5268 5269 switch (event) { 5270 case NEXTHOP_EVENT_REPLACE: 5271 err = mlxsw_sp_nexthop_obj_new(router->mlxsw_sp, info); 5272 break; 5273 case NEXTHOP_EVENT_DEL: 5274 mlxsw_sp_nexthop_obj_del(router->mlxsw_sp, info); 5275 break; 5276 case NEXTHOP_EVENT_BUCKET_REPLACE: 5277 err = mlxsw_sp_nexthop_obj_bucket_replace(router->mlxsw_sp, 5278 info); 5279 break; 5280 default: 5281 break; 5282 } 5283 5284 mutex_unlock(&router->lock); 5285 5286 
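/* Notifier callbacks cannot return a plain errno, so encode it with notifier_from_errno(). */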
out: 5287 return notifier_from_errno(err); 5288 } 5289 5290 static bool mlxsw_sp_fi_is_gateway(const struct mlxsw_sp *mlxsw_sp, 5291 struct fib_info *fi) 5292 { 5293 const struct fib_nh *nh = fib_info_nh(fi, 0); 5294 5295 return nh->fib_nh_gw_family || 5296 mlxsw_sp_nexthop4_ipip_type(mlxsw_sp, nh, NULL); 5297 } 5298 5299 static int 5300 mlxsw_sp_nexthop4_group_info_init(struct mlxsw_sp *mlxsw_sp, 5301 struct mlxsw_sp_nexthop_group *nh_grp) 5302 { 5303 unsigned int nhs = fib_info_num_path(nh_grp->ipv4.fi); 5304 struct mlxsw_sp_nexthop_group_info *nhgi; 5305 struct mlxsw_sp_nexthop *nh; 5306 int err, i; 5307 5308 nhgi = kzalloc(struct_size(nhgi, nexthops, nhs), GFP_KERNEL); 5309 if (!nhgi) 5310 return -ENOMEM; 5311 nh_grp->nhgi = nhgi; 5312 nhgi->nh_grp = nh_grp; 5313 nhgi->gateway = mlxsw_sp_fi_is_gateway(mlxsw_sp, nh_grp->ipv4.fi); 5314 nhgi->count = nhs; 5315 for (i = 0; i < nhgi->count; i++) { 5316 struct fib_nh *fib_nh; 5317 5318 nh = &nhgi->nexthops[i]; 5319 fib_nh = fib_info_nh(nh_grp->ipv4.fi, i); 5320 err = mlxsw_sp_nexthop4_init(mlxsw_sp, nh_grp, nh, fib_nh); 5321 if (err) 5322 goto err_nexthop4_init; 5323 } 5324 err = mlxsw_sp_nexthop_group_inc(mlxsw_sp); 5325 if (err) 5326 goto err_group_inc; 5327 err = mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp); 5328 if (err) 5329 goto err_group_refresh; 5330 5331 return 0; 5332 5333 err_group_refresh: 5334 mlxsw_sp_nexthop_group_dec(mlxsw_sp); 5335 err_group_inc: 5336 i = nhgi->count; 5337 err_nexthop4_init: 5338 for (i--; i >= 0; i--) { 5339 nh = &nhgi->nexthops[i]; 5340 mlxsw_sp_nexthop4_fini(mlxsw_sp, nh); 5341 } 5342 kfree(nhgi); 5343 return err; 5344 } 5345 5346 static void 5347 mlxsw_sp_nexthop4_group_info_fini(struct mlxsw_sp *mlxsw_sp, 5348 struct mlxsw_sp_nexthop_group *nh_grp) 5349 { 5350 struct mlxsw_sp_nexthop_group_info *nhgi = nh_grp->nhgi; 5351 int i; 5352 5353 mlxsw_sp_nexthop_group_dec(mlxsw_sp); 5354 for (i = nhgi->count - 1; i >= 0; i--) { 5355 struct mlxsw_sp_nexthop *nh = &nhgi->nexthops[i]; 5356 5357 mlxsw_sp_nexthop4_fini(mlxsw_sp, nh); 5358 } 5359 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp); 5360 WARN_ON_ONCE(nhgi->adj_index_valid); 5361 kfree(nhgi); 5362 } 5363 5364 static struct mlxsw_sp_nexthop_group * 5365 mlxsw_sp_nexthop4_group_create(struct mlxsw_sp *mlxsw_sp, struct fib_info *fi) 5366 { 5367 struct mlxsw_sp_nexthop_group *nh_grp; 5368 int err; 5369 5370 nh_grp = kzalloc(sizeof(*nh_grp), GFP_KERNEL); 5371 if (!nh_grp) 5372 return ERR_PTR(-ENOMEM); 5373 INIT_LIST_HEAD(&nh_grp->vr_list); 5374 err = rhashtable_init(&nh_grp->vr_ht, 5375 &mlxsw_sp_nexthop_group_vr_ht_params); 5376 if (err) 5377 goto err_nexthop_group_vr_ht_init; 5378 INIT_LIST_HEAD(&nh_grp->fib_list); 5379 nh_grp->type = MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV4; 5380 nh_grp->ipv4.fi = fi; 5381 fib_info_hold(fi); 5382 5383 err = mlxsw_sp_nexthop4_group_info_init(mlxsw_sp, nh_grp); 5384 if (err) 5385 goto err_nexthop_group_info_init; 5386 5387 err = mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp); 5388 if (err) 5389 goto err_nexthop_group_insert; 5390 5391 nh_grp->can_destroy = true; 5392 5393 return nh_grp; 5394 5395 err_nexthop_group_insert: 5396 mlxsw_sp_nexthop4_group_info_fini(mlxsw_sp, nh_grp); 5397 err_nexthop_group_info_init: 5398 fib_info_put(fi); 5399 rhashtable_destroy(&nh_grp->vr_ht); 5400 err_nexthop_group_vr_ht_init: 5401 kfree(nh_grp); 5402 return ERR_PTR(err); 5403 } 5404 5405 static void 5406 mlxsw_sp_nexthop4_group_destroy(struct mlxsw_sp *mlxsw_sp, 5407 struct mlxsw_sp_nexthop_group *nh_grp) 5408 { 5409 if (!nh_grp->can_destroy) 
5410 return; 5411 mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp); 5412 mlxsw_sp_nexthop4_group_info_fini(mlxsw_sp, nh_grp); 5413 fib_info_put(nh_grp->ipv4.fi); 5414 WARN_ON_ONCE(!list_empty(&nh_grp->vr_list)); 5415 rhashtable_destroy(&nh_grp->vr_ht); 5416 kfree(nh_grp); 5417 } 5418 5419 static int mlxsw_sp_nexthop4_group_get(struct mlxsw_sp *mlxsw_sp, 5420 struct mlxsw_sp_fib_entry *fib_entry, 5421 struct fib_info *fi) 5422 { 5423 struct mlxsw_sp_nexthop_group *nh_grp; 5424 5425 if (fi->nh) { 5426 nh_grp = mlxsw_sp_nexthop_obj_group_lookup(mlxsw_sp, 5427 fi->nh->id); 5428 if (WARN_ON_ONCE(!nh_grp)) 5429 return -EINVAL; 5430 goto out; 5431 } 5432 5433 nh_grp = mlxsw_sp_nexthop4_group_lookup(mlxsw_sp, fi); 5434 if (!nh_grp) { 5435 nh_grp = mlxsw_sp_nexthop4_group_create(mlxsw_sp, fi); 5436 if (IS_ERR(nh_grp)) 5437 return PTR_ERR(nh_grp); 5438 } 5439 out: 5440 list_add_tail(&fib_entry->nexthop_group_node, &nh_grp->fib_list); 5441 fib_entry->nh_group = nh_grp; 5442 return 0; 5443 } 5444 5445 static void mlxsw_sp_nexthop4_group_put(struct mlxsw_sp *mlxsw_sp, 5446 struct mlxsw_sp_fib_entry *fib_entry) 5447 { 5448 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group; 5449 5450 list_del(&fib_entry->nexthop_group_node); 5451 if (!list_empty(&nh_grp->fib_list)) 5452 return; 5453 5454 if (nh_grp->type == MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ) { 5455 mlxsw_sp_nexthop_obj_group_destroy(mlxsw_sp, nh_grp); 5456 return; 5457 } 5458 5459 mlxsw_sp_nexthop4_group_destroy(mlxsw_sp, nh_grp); 5460 } 5461 5462 static bool 5463 mlxsw_sp_fib4_entry_should_offload(const struct mlxsw_sp_fib_entry *fib_entry) 5464 { 5465 struct mlxsw_sp_fib4_entry *fib4_entry; 5466 5467 fib4_entry = container_of(fib_entry, struct mlxsw_sp_fib4_entry, 5468 common); 5469 return !fib4_entry->dscp; 5470 } 5471 5472 static bool 5473 mlxsw_sp_fib_entry_should_offload(const struct mlxsw_sp_fib_entry *fib_entry) 5474 { 5475 struct mlxsw_sp_nexthop_group *nh_group = fib_entry->nh_group; 5476 5477 switch (fib_entry->fib_node->fib->proto) { 5478 case MLXSW_SP_L3_PROTO_IPV4: 5479 if (!mlxsw_sp_fib4_entry_should_offload(fib_entry)) 5480 return false; 5481 break; 5482 case MLXSW_SP_L3_PROTO_IPV6: 5483 break; 5484 } 5485 5486 switch (fib_entry->type) { 5487 case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE: 5488 return !!nh_group->nhgi->adj_index_valid; 5489 case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL: 5490 return !!nh_group->nhgi->nh_rif; 5491 case MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE: 5492 case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP: 5493 case MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP: 5494 return true; 5495 default: 5496 return false; 5497 } 5498 } 5499 5500 static struct mlxsw_sp_nexthop * 5501 mlxsw_sp_rt6_nexthop(struct mlxsw_sp_nexthop_group *nh_grp, 5502 const struct mlxsw_sp_rt6 *mlxsw_sp_rt6) 5503 { 5504 int i; 5505 5506 for (i = 0; i < nh_grp->nhgi->count; i++) { 5507 struct mlxsw_sp_nexthop *nh = &nh_grp->nhgi->nexthops[i]; 5508 struct fib6_info *rt = mlxsw_sp_rt6->rt; 5509 5510 if (nh->rif && nh->rif->dev == rt->fib6_nh->fib_nh_dev && 5511 ipv6_addr_equal((const struct in6_addr *) &nh->gw_addr, 5512 &rt->fib6_nh->fib_nh_gw6)) 5513 return nh; 5514 } 5515 5516 return NULL; 5517 } 5518 5519 static void 5520 mlxsw_sp_fib4_offload_failed_flag_set(struct mlxsw_sp *mlxsw_sp, 5521 struct fib_entry_notifier_info *fen_info) 5522 { 5523 u32 *p_dst = (u32 *) &fen_info->dst; 5524 struct fib_rt_info fri; 5525 5526 fri.fi = fen_info->fi; 5527 fri.tb_id = fen_info->tb_id; 5528 fri.dst = cpu_to_be32(*p_dst); 5529 fri.dst_len = fen_info->dst_len; 5530 fri.dscp = fen_info->dscp; 5531 
fri.type = fen_info->type; 5532 fri.offload = false; 5533 fri.trap = false; 5534 fri.offload_failed = true; 5535 fib_alias_hw_flags_set(mlxsw_sp_net(mlxsw_sp), &fri); 5536 } 5537 5538 static void 5539 mlxsw_sp_fib4_entry_hw_flags_set(struct mlxsw_sp *mlxsw_sp, 5540 struct mlxsw_sp_fib_entry *fib_entry) 5541 { 5542 u32 *p_dst = (u32 *) fib_entry->fib_node->key.addr; 5543 int dst_len = fib_entry->fib_node->key.prefix_len; 5544 struct mlxsw_sp_fib4_entry *fib4_entry; 5545 struct fib_rt_info fri; 5546 bool should_offload; 5547 5548 should_offload = mlxsw_sp_fib_entry_should_offload(fib_entry); 5549 fib4_entry = container_of(fib_entry, struct mlxsw_sp_fib4_entry, 5550 common); 5551 fri.fi = fib4_entry->fi; 5552 fri.tb_id = fib4_entry->tb_id; 5553 fri.dst = cpu_to_be32(*p_dst); 5554 fri.dst_len = dst_len; 5555 fri.dscp = fib4_entry->dscp; 5556 fri.type = fib4_entry->type; 5557 fri.offload = should_offload; 5558 fri.trap = !should_offload; 5559 fri.offload_failed = false; 5560 fib_alias_hw_flags_set(mlxsw_sp_net(mlxsw_sp), &fri); 5561 } 5562 5563 static void 5564 mlxsw_sp_fib4_entry_hw_flags_clear(struct mlxsw_sp *mlxsw_sp, 5565 struct mlxsw_sp_fib_entry *fib_entry) 5566 { 5567 u32 *p_dst = (u32 *) fib_entry->fib_node->key.addr; 5568 int dst_len = fib_entry->fib_node->key.prefix_len; 5569 struct mlxsw_sp_fib4_entry *fib4_entry; 5570 struct fib_rt_info fri; 5571 5572 fib4_entry = container_of(fib_entry, struct mlxsw_sp_fib4_entry, 5573 common); 5574 fri.fi = fib4_entry->fi; 5575 fri.tb_id = fib4_entry->tb_id; 5576 fri.dst = cpu_to_be32(*p_dst); 5577 fri.dst_len = dst_len; 5578 fri.dscp = fib4_entry->dscp; 5579 fri.type = fib4_entry->type; 5580 fri.offload = false; 5581 fri.trap = false; 5582 fri.offload_failed = false; 5583 fib_alias_hw_flags_set(mlxsw_sp_net(mlxsw_sp), &fri); 5584 } 5585 5586 #if IS_ENABLED(CONFIG_IPV6) 5587 static void 5588 mlxsw_sp_fib6_offload_failed_flag_set(struct mlxsw_sp *mlxsw_sp, 5589 struct fib6_info **rt_arr, 5590 unsigned int nrt6) 5591 { 5592 int i; 5593 5594 /* In IPv6 a multipath route is represented using multiple routes, so 5595 * we need to set the flags on all of them. 5596 */ 5597 for (i = 0; i < nrt6; i++) 5598 fib6_info_hw_flags_set(mlxsw_sp_net(mlxsw_sp), rt_arr[i], 5599 false, false, true); 5600 } 5601 #else 5602 static void 5603 mlxsw_sp_fib6_offload_failed_flag_set(struct mlxsw_sp *mlxsw_sp, 5604 struct fib6_info **rt_arr, 5605 unsigned int nrt6) 5606 { 5607 } 5608 #endif 5609 5610 #if IS_ENABLED(CONFIG_IPV6) 5611 static void 5612 mlxsw_sp_fib6_entry_hw_flags_set(struct mlxsw_sp *mlxsw_sp, 5613 struct mlxsw_sp_fib_entry *fib_entry) 5614 { 5615 struct mlxsw_sp_fib6_entry *fib6_entry; 5616 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 5617 bool should_offload; 5618 5619 should_offload = mlxsw_sp_fib_entry_should_offload(fib_entry); 5620 5621 /* In IPv6 a multipath route is represented using multiple routes, so 5622 * we need to set the flags on all of them. 
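* The offload and trap indications are therefore identical for all the sibling routes of the entry.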
5623 */ 5624 fib6_entry = container_of(fib_entry, struct mlxsw_sp_fib6_entry, 5625 common); 5626 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) 5627 fib6_info_hw_flags_set(mlxsw_sp_net(mlxsw_sp), mlxsw_sp_rt6->rt, 5628 should_offload, !should_offload, false); 5629 } 5630 #else 5631 static void 5632 mlxsw_sp_fib6_entry_hw_flags_set(struct mlxsw_sp *mlxsw_sp, 5633 struct mlxsw_sp_fib_entry *fib_entry) 5634 { 5635 } 5636 #endif 5637 5638 #if IS_ENABLED(CONFIG_IPV6) 5639 static void 5640 mlxsw_sp_fib6_entry_hw_flags_clear(struct mlxsw_sp *mlxsw_sp, 5641 struct mlxsw_sp_fib_entry *fib_entry) 5642 { 5643 struct mlxsw_sp_fib6_entry *fib6_entry; 5644 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 5645 5646 fib6_entry = container_of(fib_entry, struct mlxsw_sp_fib6_entry, 5647 common); 5648 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) 5649 fib6_info_hw_flags_set(mlxsw_sp_net(mlxsw_sp), mlxsw_sp_rt6->rt, 5650 false, false, false); 5651 } 5652 #else 5653 static void 5654 mlxsw_sp_fib6_entry_hw_flags_clear(struct mlxsw_sp *mlxsw_sp, 5655 struct mlxsw_sp_fib_entry *fib_entry) 5656 { 5657 } 5658 #endif 5659 5660 static void 5661 mlxsw_sp_fib_entry_hw_flags_set(struct mlxsw_sp *mlxsw_sp, 5662 struct mlxsw_sp_fib_entry *fib_entry) 5663 { 5664 switch (fib_entry->fib_node->fib->proto) { 5665 case MLXSW_SP_L3_PROTO_IPV4: 5666 mlxsw_sp_fib4_entry_hw_flags_set(mlxsw_sp, fib_entry); 5667 break; 5668 case MLXSW_SP_L3_PROTO_IPV6: 5669 mlxsw_sp_fib6_entry_hw_flags_set(mlxsw_sp, fib_entry); 5670 break; 5671 } 5672 } 5673 5674 static void 5675 mlxsw_sp_fib_entry_hw_flags_clear(struct mlxsw_sp *mlxsw_sp, 5676 struct mlxsw_sp_fib_entry *fib_entry) 5677 { 5678 switch (fib_entry->fib_node->fib->proto) { 5679 case MLXSW_SP_L3_PROTO_IPV4: 5680 mlxsw_sp_fib4_entry_hw_flags_clear(mlxsw_sp, fib_entry); 5681 break; 5682 case MLXSW_SP_L3_PROTO_IPV6: 5683 mlxsw_sp_fib6_entry_hw_flags_clear(mlxsw_sp, fib_entry); 5684 break; 5685 } 5686 } 5687 5688 static void 5689 mlxsw_sp_fib_entry_hw_flags_refresh(struct mlxsw_sp *mlxsw_sp, 5690 struct mlxsw_sp_fib_entry *fib_entry, 5691 enum mlxsw_reg_ralue_op op) 5692 { 5693 switch (op) { 5694 case MLXSW_REG_RALUE_OP_WRITE_WRITE: 5695 mlxsw_sp_fib_entry_hw_flags_set(mlxsw_sp, fib_entry); 5696 break; 5697 case MLXSW_REG_RALUE_OP_WRITE_DELETE: 5698 mlxsw_sp_fib_entry_hw_flags_clear(mlxsw_sp, fib_entry); 5699 break; 5700 default: 5701 break; 5702 } 5703 } 5704 5705 static void 5706 mlxsw_sp_fib_entry_ralue_pack(char *ralue_pl, 5707 const struct mlxsw_sp_fib_entry *fib_entry, 5708 enum mlxsw_reg_ralue_op op) 5709 { 5710 struct mlxsw_sp_fib *fib = fib_entry->fib_node->fib; 5711 enum mlxsw_reg_ralxx_protocol proto; 5712 u32 *p_dip; 5713 5714 proto = (enum mlxsw_reg_ralxx_protocol) fib->proto; 5715 5716 switch (fib->proto) { 5717 case MLXSW_SP_L3_PROTO_IPV4: 5718 p_dip = (u32 *) fib_entry->fib_node->key.addr; 5719 mlxsw_reg_ralue_pack4(ralue_pl, proto, op, fib->vr->id, 5720 fib_entry->fib_node->key.prefix_len, 5721 *p_dip); 5722 break; 5723 case MLXSW_SP_L3_PROTO_IPV6: 5724 mlxsw_reg_ralue_pack6(ralue_pl, proto, op, fib->vr->id, 5725 fib_entry->fib_node->key.prefix_len, 5726 fib_entry->fib_node->key.addr); 5727 break; 5728 } 5729 } 5730 5731 static int mlxsw_sp_fib_entry_op_remote(struct mlxsw_sp *mlxsw_sp, 5732 struct mlxsw_sp_fib_entry *fib_entry, 5733 enum mlxsw_reg_ralue_op op) 5734 { 5735 struct mlxsw_sp_nexthop_group *nh_group = fib_entry->nh_group; 5736 struct mlxsw_sp_nexthop_group_info *nhgi = nh_group->nhgi; 5737 char ralue_pl[MLXSW_REG_RALUE_LEN]; 5738 enum 
mlxsw_reg_ralue_trap_action trap_action; 5739 u16 trap_id = 0; 5740 u32 adjacency_index = 0; 5741 u16 ecmp_size = 0; 5742 5743 /* In case the nexthop group adjacency index is valid, use it 5744 * with provided ECMP size. Otherwise, setup trap and pass 5745 * traffic to kernel. 5746 */ 5747 if (mlxsw_sp_fib_entry_should_offload(fib_entry)) { 5748 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP; 5749 adjacency_index = nhgi->adj_index; 5750 ecmp_size = nhgi->ecmp_size; 5751 } else if (!nhgi->adj_index_valid && nhgi->count && nhgi->nh_rif) { 5752 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP; 5753 adjacency_index = mlxsw_sp->router->adj_trap_index; 5754 ecmp_size = 1; 5755 } else { 5756 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP; 5757 trap_id = MLXSW_TRAP_ID_RTR_INGRESS0; 5758 } 5759 5760 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op); 5761 mlxsw_reg_ralue_act_remote_pack(ralue_pl, trap_action, trap_id, 5762 adjacency_index, ecmp_size); 5763 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); 5764 } 5765 5766 static int mlxsw_sp_fib_entry_op_local(struct mlxsw_sp *mlxsw_sp, 5767 struct mlxsw_sp_fib_entry *fib_entry, 5768 enum mlxsw_reg_ralue_op op) 5769 { 5770 struct mlxsw_sp_rif *rif = fib_entry->nh_group->nhgi->nh_rif; 5771 enum mlxsw_reg_ralue_trap_action trap_action; 5772 char ralue_pl[MLXSW_REG_RALUE_LEN]; 5773 u16 trap_id = 0; 5774 u16 rif_index = 0; 5775 5776 if (mlxsw_sp_fib_entry_should_offload(fib_entry)) { 5777 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP; 5778 rif_index = rif->rif_index; 5779 } else { 5780 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP; 5781 trap_id = MLXSW_TRAP_ID_RTR_INGRESS0; 5782 } 5783 5784 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op); 5785 mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, trap_id, 5786 rif_index); 5787 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); 5788 } 5789 5790 static int mlxsw_sp_fib_entry_op_trap(struct mlxsw_sp *mlxsw_sp, 5791 struct mlxsw_sp_fib_entry *fib_entry, 5792 enum mlxsw_reg_ralue_op op) 5793 { 5794 char ralue_pl[MLXSW_REG_RALUE_LEN]; 5795 5796 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op); 5797 mlxsw_reg_ralue_act_ip2me_pack(ralue_pl); 5798 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); 5799 } 5800 5801 static int mlxsw_sp_fib_entry_op_blackhole(struct mlxsw_sp *mlxsw_sp, 5802 struct mlxsw_sp_fib_entry *fib_entry, 5803 enum mlxsw_reg_ralue_op op) 5804 { 5805 enum mlxsw_reg_ralue_trap_action trap_action; 5806 char ralue_pl[MLXSW_REG_RALUE_LEN]; 5807 5808 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_DISCARD_ERROR; 5809 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op); 5810 mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, 0, 0); 5811 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); 5812 } 5813 5814 static int 5815 mlxsw_sp_fib_entry_op_unreachable(struct mlxsw_sp *mlxsw_sp, 5816 struct mlxsw_sp_fib_entry *fib_entry, 5817 enum mlxsw_reg_ralue_op op) 5818 { 5819 enum mlxsw_reg_ralue_trap_action trap_action; 5820 char ralue_pl[MLXSW_REG_RALUE_LEN]; 5821 u16 trap_id; 5822 5823 trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP; 5824 trap_id = MLXSW_TRAP_ID_RTR_INGRESS1; 5825 5826 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op); 5827 mlxsw_reg_ralue_act_local_pack(ralue_pl, trap_action, trap_id, 0); 5828 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); 5829 } 5830 5831 static int 5832 mlxsw_sp_fib_entry_op_ipip_decap(struct mlxsw_sp *mlxsw_sp, 5833 struct mlxsw_sp_fib_entry *fib_entry, 5834 enum 
mlxsw_reg_ralue_op op) 5835 { 5836 struct mlxsw_sp_ipip_entry *ipip_entry = fib_entry->decap.ipip_entry; 5837 const struct mlxsw_sp_ipip_ops *ipip_ops; 5838 char ralue_pl[MLXSW_REG_RALUE_LEN]; 5839 int err; 5840 5841 if (WARN_ON(!ipip_entry)) 5842 return -EINVAL; 5843 5844 ipip_ops = mlxsw_sp->router->ipip_ops_arr[ipip_entry->ipipt]; 5845 err = ipip_ops->decap_config(mlxsw_sp, ipip_entry, 5846 fib_entry->decap.tunnel_index); 5847 if (err) 5848 return err; 5849 5850 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op); 5851 mlxsw_reg_ralue_act_ip2me_tun_pack(ralue_pl, 5852 fib_entry->decap.tunnel_index); 5853 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); 5854 } 5855 5856 static int mlxsw_sp_fib_entry_op_nve_decap(struct mlxsw_sp *mlxsw_sp, 5857 struct mlxsw_sp_fib_entry *fib_entry, 5858 enum mlxsw_reg_ralue_op op) 5859 { 5860 char ralue_pl[MLXSW_REG_RALUE_LEN]; 5861 5862 mlxsw_sp_fib_entry_ralue_pack(ralue_pl, fib_entry, op); 5863 mlxsw_reg_ralue_act_ip2me_tun_pack(ralue_pl, 5864 fib_entry->decap.tunnel_index); 5865 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); 5866 } 5867 5868 static int __mlxsw_sp_fib_entry_op(struct mlxsw_sp *mlxsw_sp, 5869 struct mlxsw_sp_fib_entry *fib_entry, 5870 enum mlxsw_reg_ralue_op op) 5871 { 5872 switch (fib_entry->type) { 5873 case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE: 5874 return mlxsw_sp_fib_entry_op_remote(mlxsw_sp, fib_entry, op); 5875 case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL: 5876 return mlxsw_sp_fib_entry_op_local(mlxsw_sp, fib_entry, op); 5877 case MLXSW_SP_FIB_ENTRY_TYPE_TRAP: 5878 return mlxsw_sp_fib_entry_op_trap(mlxsw_sp, fib_entry, op); 5879 case MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE: 5880 return mlxsw_sp_fib_entry_op_blackhole(mlxsw_sp, fib_entry, op); 5881 case MLXSW_SP_FIB_ENTRY_TYPE_UNREACHABLE: 5882 return mlxsw_sp_fib_entry_op_unreachable(mlxsw_sp, fib_entry, 5883 op); 5884 case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP: 5885 return mlxsw_sp_fib_entry_op_ipip_decap(mlxsw_sp, 5886 fib_entry, op); 5887 case MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP: 5888 return mlxsw_sp_fib_entry_op_nve_decap(mlxsw_sp, fib_entry, op); 5889 } 5890 return -EINVAL; 5891 } 5892 5893 static int mlxsw_sp_fib_entry_op(struct mlxsw_sp *mlxsw_sp, 5894 struct mlxsw_sp_fib_entry *fib_entry, 5895 enum mlxsw_reg_ralue_op op) 5896 { 5897 int err = __mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry, op); 5898 5899 if (err) 5900 return err; 5901 5902 mlxsw_sp_fib_entry_hw_flags_refresh(mlxsw_sp, fib_entry, op); 5903 5904 return err; 5905 } 5906 5907 static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp, 5908 struct mlxsw_sp_fib_entry *fib_entry) 5909 { 5910 return mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry, 5911 MLXSW_REG_RALUE_OP_WRITE_WRITE); 5912 } 5913 5914 static int mlxsw_sp_fib_entry_del(struct mlxsw_sp *mlxsw_sp, 5915 struct mlxsw_sp_fib_entry *fib_entry) 5916 { 5917 return mlxsw_sp_fib_entry_op(mlxsw_sp, fib_entry, 5918 MLXSW_REG_RALUE_OP_WRITE_DELETE); 5919 } 5920 5921 static int 5922 mlxsw_sp_fib4_entry_type_set(struct mlxsw_sp *mlxsw_sp, 5923 const struct fib_entry_notifier_info *fen_info, 5924 struct mlxsw_sp_fib_entry *fib_entry) 5925 { 5926 struct mlxsw_sp_nexthop_group_info *nhgi = fib_entry->nh_group->nhgi; 5927 union mlxsw_sp_l3addr dip = { .addr4 = htonl(fen_info->dst) }; 5928 struct mlxsw_sp_router *router = mlxsw_sp->router; 5929 u32 tb_id = mlxsw_sp_fix_tb_id(fen_info->tb_id); 5930 int ifindex = nhgi->nexthops[0].ifindex; 5931 struct mlxsw_sp_ipip_entry *ipip_entry; 5932 5933 switch (fen_info->type) { 5934 case RTN_LOCAL: 5935 ipip_entry = 
mlxsw_sp_ipip_entry_find_by_decap(mlxsw_sp, ifindex, 5936 MLXSW_SP_L3_PROTO_IPV4, dip); 5937 if (ipip_entry && ipip_entry->ol_dev->flags & IFF_UP) { 5938 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP; 5939 return mlxsw_sp_fib_entry_decap_init(mlxsw_sp, 5940 fib_entry, 5941 ipip_entry); 5942 } 5943 if (mlxsw_sp_router_nve_is_decap(mlxsw_sp, tb_id, 5944 MLXSW_SP_L3_PROTO_IPV4, 5945 &dip)) { 5946 u32 tunnel_index; 5947 5948 tunnel_index = router->nve_decap_config.tunnel_index; 5949 fib_entry->decap.tunnel_index = tunnel_index; 5950 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP; 5951 return 0; 5952 } 5953 fallthrough; 5954 case RTN_BROADCAST: 5955 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP; 5956 return 0; 5957 case RTN_BLACKHOLE: 5958 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE; 5959 return 0; 5960 case RTN_UNREACHABLE: 5961 case RTN_PROHIBIT: 5962 /* Packets hitting these routes need to be trapped, but 5963 * can do so with a lower priority than packets directed 5964 * at the host, so use action type local instead of trap. 5965 */ 5966 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_UNREACHABLE; 5967 return 0; 5968 case RTN_UNICAST: 5969 if (nhgi->gateway) 5970 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE; 5971 else 5972 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL; 5973 return 0; 5974 default: 5975 return -EINVAL; 5976 } 5977 } 5978 5979 static void 5980 mlxsw_sp_fib_entry_type_unset(struct mlxsw_sp *mlxsw_sp, 5981 struct mlxsw_sp_fib_entry *fib_entry) 5982 { 5983 switch (fib_entry->type) { 5984 case MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP: 5985 mlxsw_sp_fib_entry_decap_fini(mlxsw_sp, fib_entry); 5986 break; 5987 default: 5988 break; 5989 } 5990 } 5991 5992 static void 5993 mlxsw_sp_fib4_entry_type_unset(struct mlxsw_sp *mlxsw_sp, 5994 struct mlxsw_sp_fib4_entry *fib4_entry) 5995 { 5996 mlxsw_sp_fib_entry_type_unset(mlxsw_sp, &fib4_entry->common); 5997 } 5998 5999 static struct mlxsw_sp_fib4_entry * 6000 mlxsw_sp_fib4_entry_create(struct mlxsw_sp *mlxsw_sp, 6001 struct mlxsw_sp_fib_node *fib_node, 6002 const struct fib_entry_notifier_info *fen_info) 6003 { 6004 struct mlxsw_sp_fib4_entry *fib4_entry; 6005 struct mlxsw_sp_fib_entry *fib_entry; 6006 int err; 6007 6008 fib4_entry = kzalloc(sizeof(*fib4_entry), GFP_KERNEL); 6009 if (!fib4_entry) 6010 return ERR_PTR(-ENOMEM); 6011 fib_entry = &fib4_entry->common; 6012 6013 err = mlxsw_sp_nexthop4_group_get(mlxsw_sp, fib_entry, fen_info->fi); 6014 if (err) 6015 goto err_nexthop4_group_get; 6016 6017 err = mlxsw_sp_nexthop_group_vr_link(fib_entry->nh_group, 6018 fib_node->fib); 6019 if (err) 6020 goto err_nexthop_group_vr_link; 6021 6022 err = mlxsw_sp_fib4_entry_type_set(mlxsw_sp, fen_info, fib_entry); 6023 if (err) 6024 goto err_fib4_entry_type_set; 6025 6026 fib4_entry->fi = fen_info->fi; 6027 fib_info_hold(fib4_entry->fi); 6028 fib4_entry->tb_id = fen_info->tb_id; 6029 fib4_entry->type = fen_info->type; 6030 fib4_entry->dscp = fen_info->dscp; 6031 6032 fib_entry->fib_node = fib_node; 6033 6034 return fib4_entry; 6035 6036 err_fib4_entry_type_set: 6037 mlxsw_sp_nexthop_group_vr_unlink(fib_entry->nh_group, fib_node->fib); 6038 err_nexthop_group_vr_link: 6039 mlxsw_sp_nexthop4_group_put(mlxsw_sp, &fib4_entry->common); 6040 err_nexthop4_group_get: 6041 kfree(fib4_entry); 6042 return ERR_PTR(err); 6043 } 6044 6045 static void mlxsw_sp_fib4_entry_destroy(struct mlxsw_sp *mlxsw_sp, 6046 struct mlxsw_sp_fib4_entry *fib4_entry) 6047 { 6048 struct mlxsw_sp_fib_node *fib_node = fib4_entry->common.fib_node; 6049 6050 
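	/* Destruction mirrors mlxsw_sp_fib4_entry_create() in reverse: drop
	 * the fib_info reference, undo the entry type and then release the
	 * nexthop group linkage before freeing the entry.
	 */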
fib_info_put(fib4_entry->fi); 6051 mlxsw_sp_fib4_entry_type_unset(mlxsw_sp, fib4_entry); 6052 mlxsw_sp_nexthop_group_vr_unlink(fib4_entry->common.nh_group, 6053 fib_node->fib); 6054 mlxsw_sp_nexthop4_group_put(mlxsw_sp, &fib4_entry->common); 6055 kfree(fib4_entry); 6056 } 6057 6058 static struct mlxsw_sp_fib4_entry * 6059 mlxsw_sp_fib4_entry_lookup(struct mlxsw_sp *mlxsw_sp, 6060 const struct fib_entry_notifier_info *fen_info) 6061 { 6062 struct mlxsw_sp_fib4_entry *fib4_entry; 6063 struct mlxsw_sp_fib_node *fib_node; 6064 struct mlxsw_sp_fib *fib; 6065 struct mlxsw_sp_vr *vr; 6066 6067 vr = mlxsw_sp_vr_find(mlxsw_sp, fen_info->tb_id); 6068 if (!vr) 6069 return NULL; 6070 fib = mlxsw_sp_vr_fib(vr, MLXSW_SP_L3_PROTO_IPV4); 6071 6072 fib_node = mlxsw_sp_fib_node_lookup(fib, &fen_info->dst, 6073 sizeof(fen_info->dst), 6074 fen_info->dst_len); 6075 if (!fib_node) 6076 return NULL; 6077 6078 fib4_entry = container_of(fib_node->fib_entry, 6079 struct mlxsw_sp_fib4_entry, common); 6080 if (fib4_entry->tb_id == fen_info->tb_id && 6081 fib4_entry->dscp == fen_info->dscp && 6082 fib4_entry->type == fen_info->type && 6083 fib4_entry->fi == fen_info->fi) 6084 return fib4_entry; 6085 6086 return NULL; 6087 } 6088 6089 static const struct rhashtable_params mlxsw_sp_fib_ht_params = { 6090 .key_offset = offsetof(struct mlxsw_sp_fib_node, key), 6091 .head_offset = offsetof(struct mlxsw_sp_fib_node, ht_node), 6092 .key_len = sizeof(struct mlxsw_sp_fib_key), 6093 .automatic_shrinking = true, 6094 }; 6095 6096 static int mlxsw_sp_fib_node_insert(struct mlxsw_sp_fib *fib, 6097 struct mlxsw_sp_fib_node *fib_node) 6098 { 6099 return rhashtable_insert_fast(&fib->ht, &fib_node->ht_node, 6100 mlxsw_sp_fib_ht_params); 6101 } 6102 6103 static void mlxsw_sp_fib_node_remove(struct mlxsw_sp_fib *fib, 6104 struct mlxsw_sp_fib_node *fib_node) 6105 { 6106 rhashtable_remove_fast(&fib->ht, &fib_node->ht_node, 6107 mlxsw_sp_fib_ht_params); 6108 } 6109 6110 static struct mlxsw_sp_fib_node * 6111 mlxsw_sp_fib_node_lookup(struct mlxsw_sp_fib *fib, const void *addr, 6112 size_t addr_len, unsigned char prefix_len) 6113 { 6114 struct mlxsw_sp_fib_key key; 6115 6116 memset(&key, 0, sizeof(key)); 6117 memcpy(key.addr, addr, addr_len); 6118 key.prefix_len = prefix_len; 6119 return rhashtable_lookup_fast(&fib->ht, &key, mlxsw_sp_fib_ht_params); 6120 } 6121 6122 static struct mlxsw_sp_fib_node * 6123 mlxsw_sp_fib_node_create(struct mlxsw_sp_fib *fib, const void *addr, 6124 size_t addr_len, unsigned char prefix_len) 6125 { 6126 struct mlxsw_sp_fib_node *fib_node; 6127 6128 fib_node = kzalloc(sizeof(*fib_node), GFP_KERNEL); 6129 if (!fib_node) 6130 return NULL; 6131 6132 list_add(&fib_node->list, &fib->node_list); 6133 memcpy(fib_node->key.addr, addr, addr_len); 6134 fib_node->key.prefix_len = prefix_len; 6135 6136 return fib_node; 6137 } 6138 6139 static void mlxsw_sp_fib_node_destroy(struct mlxsw_sp_fib_node *fib_node) 6140 { 6141 list_del(&fib_node->list); 6142 kfree(fib_node); 6143 } 6144 6145 static int mlxsw_sp_fib_lpm_tree_link(struct mlxsw_sp *mlxsw_sp, 6146 struct mlxsw_sp_fib_node *fib_node) 6147 { 6148 struct mlxsw_sp_prefix_usage req_prefix_usage; 6149 struct mlxsw_sp_fib *fib = fib_node->fib; 6150 struct mlxsw_sp_lpm_tree *lpm_tree; 6151 int err; 6152 6153 lpm_tree = mlxsw_sp->router->lpm.proto_trees[fib->proto]; 6154 if (lpm_tree->prefix_ref_count[fib_node->key.prefix_len] != 0) 6155 goto out; 6156 6157 mlxsw_sp_prefix_usage_cpy(&req_prefix_usage, &lpm_tree->prefix_usage); 6158 mlxsw_sp_prefix_usage_set(&req_prefix_usage, 
fib_node->key.prefix_len); 6159 lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage, 6160 fib->proto); 6161 if (IS_ERR(lpm_tree)) 6162 return PTR_ERR(lpm_tree); 6163 6164 err = mlxsw_sp_vrs_lpm_tree_replace(mlxsw_sp, fib, lpm_tree); 6165 if (err) 6166 goto err_lpm_tree_replace; 6167 6168 out: 6169 lpm_tree->prefix_ref_count[fib_node->key.prefix_len]++; 6170 return 0; 6171 6172 err_lpm_tree_replace: 6173 mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree); 6174 return err; 6175 } 6176 6177 static void mlxsw_sp_fib_lpm_tree_unlink(struct mlxsw_sp *mlxsw_sp, 6178 struct mlxsw_sp_fib_node *fib_node) 6179 { 6180 struct mlxsw_sp_lpm_tree *lpm_tree = fib_node->fib->lpm_tree; 6181 struct mlxsw_sp_prefix_usage req_prefix_usage; 6182 struct mlxsw_sp_fib *fib = fib_node->fib; 6183 int err; 6184 6185 if (--lpm_tree->prefix_ref_count[fib_node->key.prefix_len] != 0) 6186 return; 6187 /* Try to construct a new LPM tree from the current prefix usage 6188 * minus the unused one. If we fail, continue using the old one. 6189 */ 6190 mlxsw_sp_prefix_usage_cpy(&req_prefix_usage, &lpm_tree->prefix_usage); 6191 mlxsw_sp_prefix_usage_clear(&req_prefix_usage, 6192 fib_node->key.prefix_len); 6193 lpm_tree = mlxsw_sp_lpm_tree_get(mlxsw_sp, &req_prefix_usage, 6194 fib->proto); 6195 if (IS_ERR(lpm_tree)) 6196 return; 6197 6198 err = mlxsw_sp_vrs_lpm_tree_replace(mlxsw_sp, fib, lpm_tree); 6199 if (err) 6200 goto err_lpm_tree_replace; 6201 6202 return; 6203 6204 err_lpm_tree_replace: 6205 mlxsw_sp_lpm_tree_put(mlxsw_sp, lpm_tree); 6206 } 6207 6208 static int mlxsw_sp_fib_node_init(struct mlxsw_sp *mlxsw_sp, 6209 struct mlxsw_sp_fib_node *fib_node, 6210 struct mlxsw_sp_fib *fib) 6211 { 6212 int err; 6213 6214 err = mlxsw_sp_fib_node_insert(fib, fib_node); 6215 if (err) 6216 return err; 6217 fib_node->fib = fib; 6218 6219 err = mlxsw_sp_fib_lpm_tree_link(mlxsw_sp, fib_node); 6220 if (err) 6221 goto err_fib_lpm_tree_link; 6222 6223 return 0; 6224 6225 err_fib_lpm_tree_link: 6226 fib_node->fib = NULL; 6227 mlxsw_sp_fib_node_remove(fib, fib_node); 6228 return err; 6229 } 6230 6231 static void mlxsw_sp_fib_node_fini(struct mlxsw_sp *mlxsw_sp, 6232 struct mlxsw_sp_fib_node *fib_node) 6233 { 6234 struct mlxsw_sp_fib *fib = fib_node->fib; 6235 6236 mlxsw_sp_fib_lpm_tree_unlink(mlxsw_sp, fib_node); 6237 fib_node->fib = NULL; 6238 mlxsw_sp_fib_node_remove(fib, fib_node); 6239 } 6240 6241 static struct mlxsw_sp_fib_node * 6242 mlxsw_sp_fib_node_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id, const void *addr, 6243 size_t addr_len, unsigned char prefix_len, 6244 enum mlxsw_sp_l3proto proto) 6245 { 6246 struct mlxsw_sp_fib_node *fib_node; 6247 struct mlxsw_sp_fib *fib; 6248 struct mlxsw_sp_vr *vr; 6249 int err; 6250 6251 vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id, NULL); 6252 if (IS_ERR(vr)) 6253 return ERR_CAST(vr); 6254 fib = mlxsw_sp_vr_fib(vr, proto); 6255 6256 fib_node = mlxsw_sp_fib_node_lookup(fib, addr, addr_len, prefix_len); 6257 if (fib_node) 6258 return fib_node; 6259 6260 fib_node = mlxsw_sp_fib_node_create(fib, addr, addr_len, prefix_len); 6261 if (!fib_node) { 6262 err = -ENOMEM; 6263 goto err_fib_node_create; 6264 } 6265 6266 err = mlxsw_sp_fib_node_init(mlxsw_sp, fib_node, fib); 6267 if (err) 6268 goto err_fib_node_init; 6269 6270 return fib_node; 6271 6272 err_fib_node_init: 6273 mlxsw_sp_fib_node_destroy(fib_node); 6274 err_fib_node_create: 6275 mlxsw_sp_vr_put(mlxsw_sp, vr); 6276 return ERR_PTR(err); 6277 } 6278 6279 static void mlxsw_sp_fib_node_put(struct mlxsw_sp *mlxsw_sp, 6280 struct mlxsw_sp_fib_node *fib_node) 6281 { 
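	/* A node is kept alive by the fib_entry attached to it; it is only
	 * torn down, and the VR reference taken in mlxsw_sp_fib_node_get()
	 * released, once that entry is gone. Callers pair get/put around the
	 * entry's lifetime, e.g. (illustrative sketch of the existing
	 * pattern):
	 *
	 *	fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, tb_id, addr,
	 *					 addr_len, prefix_len, proto);
	 *	...
	 *	mlxsw_sp_fib_node_put(mlxsw_sp, fib_node);
	 */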
6282 struct mlxsw_sp_vr *vr = fib_node->fib->vr; 6283 6284 if (fib_node->fib_entry) 6285 return; 6286 mlxsw_sp_fib_node_fini(mlxsw_sp, fib_node); 6287 mlxsw_sp_fib_node_destroy(fib_node); 6288 mlxsw_sp_vr_put(mlxsw_sp, vr); 6289 } 6290 6291 static int mlxsw_sp_fib_node_entry_link(struct mlxsw_sp *mlxsw_sp, 6292 struct mlxsw_sp_fib_entry *fib_entry) 6293 { 6294 struct mlxsw_sp_fib_node *fib_node = fib_entry->fib_node; 6295 int err; 6296 6297 fib_node->fib_entry = fib_entry; 6298 6299 err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry); 6300 if (err) 6301 goto err_fib_entry_update; 6302 6303 return 0; 6304 6305 err_fib_entry_update: 6306 fib_node->fib_entry = NULL; 6307 return err; 6308 } 6309 6310 static void 6311 mlxsw_sp_fib_node_entry_unlink(struct mlxsw_sp *mlxsw_sp, 6312 struct mlxsw_sp_fib_entry *fib_entry) 6313 { 6314 struct mlxsw_sp_fib_node *fib_node = fib_entry->fib_node; 6315 6316 mlxsw_sp_fib_entry_del(mlxsw_sp, fib_entry); 6317 fib_node->fib_entry = NULL; 6318 } 6319 6320 static bool mlxsw_sp_fib4_allow_replace(struct mlxsw_sp_fib4_entry *fib4_entry) 6321 { 6322 struct mlxsw_sp_fib_node *fib_node = fib4_entry->common.fib_node; 6323 struct mlxsw_sp_fib4_entry *fib4_replaced; 6324 6325 if (!fib_node->fib_entry) 6326 return true; 6327 6328 fib4_replaced = container_of(fib_node->fib_entry, 6329 struct mlxsw_sp_fib4_entry, common); 6330 if (fib4_entry->tb_id == RT_TABLE_MAIN && 6331 fib4_replaced->tb_id == RT_TABLE_LOCAL) 6332 return false; 6333 6334 return true; 6335 } 6336 6337 static int 6338 mlxsw_sp_router_fib4_replace(struct mlxsw_sp *mlxsw_sp, 6339 const struct fib_entry_notifier_info *fen_info) 6340 { 6341 struct mlxsw_sp_fib4_entry *fib4_entry, *fib4_replaced; 6342 struct mlxsw_sp_fib_entry *replaced; 6343 struct mlxsw_sp_fib_node *fib_node; 6344 int err; 6345 6346 if (fen_info->fi->nh && 6347 !mlxsw_sp_nexthop_obj_group_lookup(mlxsw_sp, fen_info->fi->nh->id)) 6348 return 0; 6349 6350 fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, fen_info->tb_id, 6351 &fen_info->dst, sizeof(fen_info->dst), 6352 fen_info->dst_len, 6353 MLXSW_SP_L3_PROTO_IPV4); 6354 if (IS_ERR(fib_node)) { 6355 dev_warn(mlxsw_sp->bus_info->dev, "Failed to get FIB node\n"); 6356 return PTR_ERR(fib_node); 6357 } 6358 6359 fib4_entry = mlxsw_sp_fib4_entry_create(mlxsw_sp, fib_node, fen_info); 6360 if (IS_ERR(fib4_entry)) { 6361 dev_warn(mlxsw_sp->bus_info->dev, "Failed to create FIB entry\n"); 6362 err = PTR_ERR(fib4_entry); 6363 goto err_fib4_entry_create; 6364 } 6365 6366 if (!mlxsw_sp_fib4_allow_replace(fib4_entry)) { 6367 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry); 6368 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 6369 return 0; 6370 } 6371 6372 replaced = fib_node->fib_entry; 6373 err = mlxsw_sp_fib_node_entry_link(mlxsw_sp, &fib4_entry->common); 6374 if (err) { 6375 dev_warn(mlxsw_sp->bus_info->dev, "Failed to link FIB entry to node\n"); 6376 goto err_fib_node_entry_link; 6377 } 6378 6379 /* Nothing to replace */ 6380 if (!replaced) 6381 return 0; 6382 6383 mlxsw_sp_fib_entry_hw_flags_clear(mlxsw_sp, replaced); 6384 fib4_replaced = container_of(replaced, struct mlxsw_sp_fib4_entry, 6385 common); 6386 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_replaced); 6387 6388 return 0; 6389 6390 err_fib_node_entry_link: 6391 fib_node->fib_entry = replaced; 6392 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry); 6393 err_fib4_entry_create: 6394 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 6395 return err; 6396 } 6397 6398 static void mlxsw_sp_router_fib4_del(struct mlxsw_sp *mlxsw_sp, 6399 struct 
fib_entry_notifier_info *fen_info) 6400 { 6401 struct mlxsw_sp_fib4_entry *fib4_entry; 6402 struct mlxsw_sp_fib_node *fib_node; 6403 6404 fib4_entry = mlxsw_sp_fib4_entry_lookup(mlxsw_sp, fen_info); 6405 if (!fib4_entry) 6406 return; 6407 fib_node = fib4_entry->common.fib_node; 6408 6409 mlxsw_sp_fib_node_entry_unlink(mlxsw_sp, &fib4_entry->common); 6410 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry); 6411 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 6412 } 6413 6414 static bool mlxsw_sp_fib6_rt_should_ignore(const struct fib6_info *rt) 6415 { 6416 /* Multicast routes aren't supported, so ignore them. Neighbour 6417 * Discovery packets are specifically trapped. 6418 */ 6419 if (ipv6_addr_type(&rt->fib6_dst.addr) & IPV6_ADDR_MULTICAST) 6420 return true; 6421 6422 /* Cloned routes are irrelevant in the forwarding path. */ 6423 if (rt->fib6_flags & RTF_CACHE) 6424 return true; 6425 6426 return false; 6427 } 6428 6429 static struct mlxsw_sp_rt6 *mlxsw_sp_rt6_create(struct fib6_info *rt) 6430 { 6431 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 6432 6433 mlxsw_sp_rt6 = kzalloc(sizeof(*mlxsw_sp_rt6), GFP_KERNEL); 6434 if (!mlxsw_sp_rt6) 6435 return ERR_PTR(-ENOMEM); 6436 6437 /* In case of route replace, replaced route is deleted with 6438 * no notification. Take reference to prevent accessing freed 6439 * memory. 6440 */ 6441 mlxsw_sp_rt6->rt = rt; 6442 fib6_info_hold(rt); 6443 6444 return mlxsw_sp_rt6; 6445 } 6446 6447 #if IS_ENABLED(CONFIG_IPV6) 6448 static void mlxsw_sp_rt6_release(struct fib6_info *rt) 6449 { 6450 fib6_info_release(rt); 6451 } 6452 #else 6453 static void mlxsw_sp_rt6_release(struct fib6_info *rt) 6454 { 6455 } 6456 #endif 6457 6458 static void mlxsw_sp_rt6_destroy(struct mlxsw_sp_rt6 *mlxsw_sp_rt6) 6459 { 6460 struct fib6_nh *fib6_nh = mlxsw_sp_rt6->rt->fib6_nh; 6461 6462 if (!mlxsw_sp_rt6->rt->nh) 6463 fib6_nh->fib_nh_flags &= ~RTNH_F_OFFLOAD; 6464 mlxsw_sp_rt6_release(mlxsw_sp_rt6->rt); 6465 kfree(mlxsw_sp_rt6); 6466 } 6467 6468 static struct fib6_info * 6469 mlxsw_sp_fib6_entry_rt(const struct mlxsw_sp_fib6_entry *fib6_entry) 6470 { 6471 return list_first_entry(&fib6_entry->rt6_list, struct mlxsw_sp_rt6, 6472 list)->rt; 6473 } 6474 6475 static struct mlxsw_sp_rt6 * 6476 mlxsw_sp_fib6_entry_rt_find(const struct mlxsw_sp_fib6_entry *fib6_entry, 6477 const struct fib6_info *rt) 6478 { 6479 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 6480 6481 list_for_each_entry(mlxsw_sp_rt6, &fib6_entry->rt6_list, list) { 6482 if (mlxsw_sp_rt6->rt == rt) 6483 return mlxsw_sp_rt6; 6484 } 6485 6486 return NULL; 6487 } 6488 6489 static bool mlxsw_sp_nexthop6_ipip_type(const struct mlxsw_sp *mlxsw_sp, 6490 const struct fib6_info *rt, 6491 enum mlxsw_sp_ipip_type *ret) 6492 { 6493 return rt->fib6_nh->fib_nh_dev && 6494 mlxsw_sp_netdev_ipip_type(mlxsw_sp, rt->fib6_nh->fib_nh_dev, ret); 6495 } 6496 6497 static int mlxsw_sp_nexthop6_init(struct mlxsw_sp *mlxsw_sp, 6498 struct mlxsw_sp_nexthop_group *nh_grp, 6499 struct mlxsw_sp_nexthop *nh, 6500 const struct fib6_info *rt) 6501 { 6502 struct net_device *dev = rt->fib6_nh->fib_nh_dev; 6503 int err; 6504 6505 nh->nhgi = nh_grp->nhgi; 6506 nh->nh_weight = rt->fib6_nh->fib_nh_weight; 6507 memcpy(&nh->gw_addr, &rt->fib6_nh->fib_nh_gw6, sizeof(nh->gw_addr)); 6508 #if IS_ENABLED(CONFIG_IPV6) 6509 nh->neigh_tbl = &nd_tbl; 6510 #endif 6511 mlxsw_sp_nexthop_counter_alloc(mlxsw_sp, nh); 6512 6513 list_add_tail(&nh->router_list_node, &mlxsw_sp->router->nexthop_list); 6514 6515 if (!dev) 6516 return 0; 6517 nh->ifindex = dev->ifindex; 6518 6519 err = 
mlxsw_sp_nexthop_type_init(mlxsw_sp, nh, dev); 6520 if (err) 6521 goto err_nexthop_type_init; 6522 6523 return 0; 6524 6525 err_nexthop_type_init: 6526 list_del(&nh->router_list_node); 6527 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh); 6528 return err; 6529 } 6530 6531 static void mlxsw_sp_nexthop6_fini(struct mlxsw_sp *mlxsw_sp, 6532 struct mlxsw_sp_nexthop *nh) 6533 { 6534 mlxsw_sp_nexthop_type_fini(mlxsw_sp, nh); 6535 list_del(&nh->router_list_node); 6536 mlxsw_sp_nexthop_counter_free(mlxsw_sp, nh); 6537 } 6538 6539 static bool mlxsw_sp_rt6_is_gateway(const struct mlxsw_sp *mlxsw_sp, 6540 const struct fib6_info *rt) 6541 { 6542 return rt->fib6_nh->fib_nh_gw_family || 6543 mlxsw_sp_nexthop6_ipip_type(mlxsw_sp, rt, NULL); 6544 } 6545 6546 static int 6547 mlxsw_sp_nexthop6_group_info_init(struct mlxsw_sp *mlxsw_sp, 6548 struct mlxsw_sp_nexthop_group *nh_grp, 6549 struct mlxsw_sp_fib6_entry *fib6_entry) 6550 { 6551 struct mlxsw_sp_nexthop_group_info *nhgi; 6552 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 6553 struct mlxsw_sp_nexthop *nh; 6554 int err, i; 6555 6556 nhgi = kzalloc(struct_size(nhgi, nexthops, fib6_entry->nrt6), 6557 GFP_KERNEL); 6558 if (!nhgi) 6559 return -ENOMEM; 6560 nh_grp->nhgi = nhgi; 6561 nhgi->nh_grp = nh_grp; 6562 mlxsw_sp_rt6 = list_first_entry(&fib6_entry->rt6_list, 6563 struct mlxsw_sp_rt6, list); 6564 nhgi->gateway = mlxsw_sp_rt6_is_gateway(mlxsw_sp, mlxsw_sp_rt6->rt); 6565 nhgi->count = fib6_entry->nrt6; 6566 for (i = 0; i < nhgi->count; i++) { 6567 struct fib6_info *rt = mlxsw_sp_rt6->rt; 6568 6569 nh = &nhgi->nexthops[i]; 6570 err = mlxsw_sp_nexthop6_init(mlxsw_sp, nh_grp, nh, rt); 6571 if (err) 6572 goto err_nexthop6_init; 6573 mlxsw_sp_rt6 = list_next_entry(mlxsw_sp_rt6, list); 6574 } 6575 nh_grp->nhgi = nhgi; 6576 err = mlxsw_sp_nexthop_group_inc(mlxsw_sp); 6577 if (err) 6578 goto err_group_inc; 6579 err = mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp); 6580 if (err) 6581 goto err_group_refresh; 6582 6583 return 0; 6584 6585 err_group_refresh: 6586 mlxsw_sp_nexthop_group_dec(mlxsw_sp); 6587 err_group_inc: 6588 i = nhgi->count; 6589 err_nexthop6_init: 6590 for (i--; i >= 0; i--) { 6591 nh = &nhgi->nexthops[i]; 6592 mlxsw_sp_nexthop6_fini(mlxsw_sp, nh); 6593 } 6594 kfree(nhgi); 6595 return err; 6596 } 6597 6598 static void 6599 mlxsw_sp_nexthop6_group_info_fini(struct mlxsw_sp *mlxsw_sp, 6600 struct mlxsw_sp_nexthop_group *nh_grp) 6601 { 6602 struct mlxsw_sp_nexthop_group_info *nhgi = nh_grp->nhgi; 6603 int i; 6604 6605 mlxsw_sp_nexthop_group_dec(mlxsw_sp); 6606 for (i = nhgi->count - 1; i >= 0; i--) { 6607 struct mlxsw_sp_nexthop *nh = &nhgi->nexthops[i]; 6608 6609 mlxsw_sp_nexthop6_fini(mlxsw_sp, nh); 6610 } 6611 mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp); 6612 WARN_ON_ONCE(nhgi->adj_index_valid); 6613 kfree(nhgi); 6614 } 6615 6616 static struct mlxsw_sp_nexthop_group * 6617 mlxsw_sp_nexthop6_group_create(struct mlxsw_sp *mlxsw_sp, 6618 struct mlxsw_sp_fib6_entry *fib6_entry) 6619 { 6620 struct mlxsw_sp_nexthop_group *nh_grp; 6621 int err; 6622 6623 nh_grp = kzalloc(sizeof(*nh_grp), GFP_KERNEL); 6624 if (!nh_grp) 6625 return ERR_PTR(-ENOMEM); 6626 INIT_LIST_HEAD(&nh_grp->vr_list); 6627 err = rhashtable_init(&nh_grp->vr_ht, 6628 &mlxsw_sp_nexthop_group_vr_ht_params); 6629 if (err) 6630 goto err_nexthop_group_vr_ht_init; 6631 INIT_LIST_HEAD(&nh_grp->fib_list); 6632 nh_grp->type = MLXSW_SP_NEXTHOP_GROUP_TYPE_IPV6; 6633 6634 err = mlxsw_sp_nexthop6_group_info_init(mlxsw_sp, nh_grp, fib6_entry); 6635 if (err) 6636 goto err_nexthop_group_info_init; 6637 6638 err = 
mlxsw_sp_nexthop_group_insert(mlxsw_sp, nh_grp); 6639 if (err) 6640 goto err_nexthop_group_insert; 6641 6642 nh_grp->can_destroy = true; 6643 6644 return nh_grp; 6645 6646 err_nexthop_group_insert: 6647 mlxsw_sp_nexthop6_group_info_fini(mlxsw_sp, nh_grp); 6648 err_nexthop_group_info_init: 6649 rhashtable_destroy(&nh_grp->vr_ht); 6650 err_nexthop_group_vr_ht_init: 6651 kfree(nh_grp); 6652 return ERR_PTR(err); 6653 } 6654 6655 static void 6656 mlxsw_sp_nexthop6_group_destroy(struct mlxsw_sp *mlxsw_sp, 6657 struct mlxsw_sp_nexthop_group *nh_grp) 6658 { 6659 if (!nh_grp->can_destroy) 6660 return; 6661 mlxsw_sp_nexthop_group_remove(mlxsw_sp, nh_grp); 6662 mlxsw_sp_nexthop6_group_info_fini(mlxsw_sp, nh_grp); 6663 WARN_ON_ONCE(!list_empty(&nh_grp->vr_list)); 6664 rhashtable_destroy(&nh_grp->vr_ht); 6665 kfree(nh_grp); 6666 } 6667 6668 static int mlxsw_sp_nexthop6_group_get(struct mlxsw_sp *mlxsw_sp, 6669 struct mlxsw_sp_fib6_entry *fib6_entry) 6670 { 6671 struct fib6_info *rt = mlxsw_sp_fib6_entry_rt(fib6_entry); 6672 struct mlxsw_sp_nexthop_group *nh_grp; 6673 6674 if (rt->nh) { 6675 nh_grp = mlxsw_sp_nexthop_obj_group_lookup(mlxsw_sp, 6676 rt->nh->id); 6677 if (WARN_ON_ONCE(!nh_grp)) 6678 return -EINVAL; 6679 goto out; 6680 } 6681 6682 nh_grp = mlxsw_sp_nexthop6_group_lookup(mlxsw_sp, fib6_entry); 6683 if (!nh_grp) { 6684 nh_grp = mlxsw_sp_nexthop6_group_create(mlxsw_sp, fib6_entry); 6685 if (IS_ERR(nh_grp)) 6686 return PTR_ERR(nh_grp); 6687 } 6688 6689 /* The route and the nexthop are described by the same struct, so we 6690 * need to update the nexthop offload indication for the new route. 6691 */ 6692 __mlxsw_sp_nexthop6_group_offload_refresh(nh_grp, fib6_entry); 6693 6694 out: 6695 list_add_tail(&fib6_entry->common.nexthop_group_node, 6696 &nh_grp->fib_list); 6697 fib6_entry->common.nh_group = nh_grp; 6698 6699 return 0; 6700 } 6701 6702 static void mlxsw_sp_nexthop6_group_put(struct mlxsw_sp *mlxsw_sp, 6703 struct mlxsw_sp_fib_entry *fib_entry) 6704 { 6705 struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group; 6706 6707 list_del(&fib_entry->nexthop_group_node); 6708 if (!list_empty(&nh_grp->fib_list)) 6709 return; 6710 6711 if (nh_grp->type == MLXSW_SP_NEXTHOP_GROUP_TYPE_OBJ) { 6712 mlxsw_sp_nexthop_obj_group_destroy(mlxsw_sp, nh_grp); 6713 return; 6714 } 6715 6716 mlxsw_sp_nexthop6_group_destroy(mlxsw_sp, nh_grp); 6717 } 6718 6719 static int 6720 mlxsw_sp_nexthop6_group_update(struct mlxsw_sp *mlxsw_sp, 6721 struct mlxsw_sp_fib6_entry *fib6_entry) 6722 { 6723 struct mlxsw_sp_nexthop_group *old_nh_grp = fib6_entry->common.nh_group; 6724 struct mlxsw_sp_fib_node *fib_node = fib6_entry->common.fib_node; 6725 int err; 6726 6727 mlxsw_sp_nexthop_group_vr_unlink(old_nh_grp, fib_node->fib); 6728 fib6_entry->common.nh_group = NULL; 6729 list_del(&fib6_entry->common.nexthop_group_node); 6730 6731 err = mlxsw_sp_nexthop6_group_get(mlxsw_sp, fib6_entry); 6732 if (err) 6733 goto err_nexthop6_group_get; 6734 6735 err = mlxsw_sp_nexthop_group_vr_link(fib6_entry->common.nh_group, 6736 fib_node->fib); 6737 if (err) 6738 goto err_nexthop_group_vr_link; 6739 6740 /* In case this entry is offloaded, then the adjacency index 6741 * currently associated with it in the device's table is that 6742 * of the old group. Start using the new one instead.
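	 * The mlxsw_sp_fib_entry_update() call below re-writes the RALUE
	 * entry with the new group's adjacency index; once it is in place,
	 * the old group is destroyed if this entry was its last user.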
6743 */ 6744 err = mlxsw_sp_fib_entry_update(mlxsw_sp, &fib6_entry->common); 6745 if (err) 6746 goto err_fib_entry_update; 6747 6748 if (list_empty(&old_nh_grp->fib_list)) 6749 mlxsw_sp_nexthop6_group_destroy(mlxsw_sp, old_nh_grp); 6750 6751 return 0; 6752 6753 err_fib_entry_update: 6754 mlxsw_sp_nexthop_group_vr_unlink(fib6_entry->common.nh_group, 6755 fib_node->fib); 6756 err_nexthop_group_vr_link: 6757 mlxsw_sp_nexthop6_group_put(mlxsw_sp, &fib6_entry->common); 6758 err_nexthop6_group_get: 6759 list_add_tail(&fib6_entry->common.nexthop_group_node, 6760 &old_nh_grp->fib_list); 6761 fib6_entry->common.nh_group = old_nh_grp; 6762 mlxsw_sp_nexthop_group_vr_link(old_nh_grp, fib_node->fib); 6763 return err; 6764 } 6765 6766 static int 6767 mlxsw_sp_fib6_entry_nexthop_add(struct mlxsw_sp *mlxsw_sp, 6768 struct mlxsw_sp_fib6_entry *fib6_entry, 6769 struct fib6_info **rt_arr, unsigned int nrt6) 6770 { 6771 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 6772 int err, i; 6773 6774 for (i = 0; i < nrt6; i++) { 6775 mlxsw_sp_rt6 = mlxsw_sp_rt6_create(rt_arr[i]); 6776 if (IS_ERR(mlxsw_sp_rt6)) { 6777 err = PTR_ERR(mlxsw_sp_rt6); 6778 goto err_rt6_unwind; 6779 } 6780 6781 list_add_tail(&mlxsw_sp_rt6->list, &fib6_entry->rt6_list); 6782 fib6_entry->nrt6++; 6783 } 6784 6785 err = mlxsw_sp_nexthop6_group_update(mlxsw_sp, fib6_entry); 6786 if (err) 6787 goto err_rt6_unwind; 6788 6789 return 0; 6790 6791 err_rt6_unwind: 6792 for (; i > 0; i--) { 6793 fib6_entry->nrt6--; 6794 mlxsw_sp_rt6 = list_last_entry(&fib6_entry->rt6_list, 6795 struct mlxsw_sp_rt6, list); 6796 list_del(&mlxsw_sp_rt6->list); 6797 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6); 6798 } 6799 return err; 6800 } 6801 6802 static void 6803 mlxsw_sp_fib6_entry_nexthop_del(struct mlxsw_sp *mlxsw_sp, 6804 struct mlxsw_sp_fib6_entry *fib6_entry, 6805 struct fib6_info **rt_arr, unsigned int nrt6) 6806 { 6807 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 6808 int i; 6809 6810 for (i = 0; i < nrt6; i++) { 6811 mlxsw_sp_rt6 = mlxsw_sp_fib6_entry_rt_find(fib6_entry, 6812 rt_arr[i]); 6813 if (WARN_ON_ONCE(!mlxsw_sp_rt6)) 6814 continue; 6815 6816 fib6_entry->nrt6--; 6817 list_del(&mlxsw_sp_rt6->list); 6818 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6); 6819 } 6820 6821 mlxsw_sp_nexthop6_group_update(mlxsw_sp, fib6_entry); 6822 } 6823 6824 static int 6825 mlxsw_sp_fib6_entry_type_set_local(struct mlxsw_sp *mlxsw_sp, 6826 struct mlxsw_sp_fib_entry *fib_entry, 6827 const struct fib6_info *rt) 6828 { 6829 struct mlxsw_sp_nexthop_group_info *nhgi = fib_entry->nh_group->nhgi; 6830 union mlxsw_sp_l3addr dip = { .addr6 = rt->fib6_dst.addr }; 6831 u32 tb_id = mlxsw_sp_fix_tb_id(rt->fib6_table->tb6_id); 6832 struct mlxsw_sp_router *router = mlxsw_sp->router; 6833 int ifindex = nhgi->nexthops[0].ifindex; 6834 struct mlxsw_sp_ipip_entry *ipip_entry; 6835 6836 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP; 6837 ipip_entry = mlxsw_sp_ipip_entry_find_by_decap(mlxsw_sp, ifindex, 6838 MLXSW_SP_L3_PROTO_IPV6, 6839 dip); 6840 6841 if (ipip_entry && ipip_entry->ol_dev->flags & IFF_UP) { 6842 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_IPIP_DECAP; 6843 return mlxsw_sp_fib_entry_decap_init(mlxsw_sp, fib_entry, 6844 ipip_entry); 6845 } 6846 if (mlxsw_sp_router_nve_is_decap(mlxsw_sp, tb_id, 6847 MLXSW_SP_L3_PROTO_IPV6, &dip)) { 6848 u32 tunnel_index; 6849 6850 tunnel_index = router->nve_decap_config.tunnel_index; 6851 fib_entry->decap.tunnel_index = tunnel_index; 6852 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_NVE_DECAP; 6853 } 6854 6855 return 0; 6856 } 6857 6858 static int mlxsw_sp_fib6_entry_type_set(struct mlxsw_sp 
*mlxsw_sp, 6859 struct mlxsw_sp_fib_entry *fib_entry, 6860 const struct fib6_info *rt) 6861 { 6862 if (rt->fib6_flags & RTF_LOCAL) 6863 return mlxsw_sp_fib6_entry_type_set_local(mlxsw_sp, fib_entry, 6864 rt); 6865 if (rt->fib6_flags & RTF_ANYCAST) 6866 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_TRAP; 6867 else if (rt->fib6_type == RTN_BLACKHOLE) 6868 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_BLACKHOLE; 6869 else if (rt->fib6_flags & RTF_REJECT) 6870 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_UNREACHABLE; 6871 else if (fib_entry->nh_group->nhgi->gateway) 6872 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE; 6873 else 6874 fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_LOCAL; 6875 6876 return 0; 6877 } 6878 6879 static void 6880 mlxsw_sp_fib6_entry_rt_destroy_all(struct mlxsw_sp_fib6_entry *fib6_entry) 6881 { 6882 struct mlxsw_sp_rt6 *mlxsw_sp_rt6, *tmp; 6883 6884 list_for_each_entry_safe(mlxsw_sp_rt6, tmp, &fib6_entry->rt6_list, 6885 list) { 6886 fib6_entry->nrt6--; 6887 list_del(&mlxsw_sp_rt6->list); 6888 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6); 6889 } 6890 } 6891 6892 static struct mlxsw_sp_fib6_entry * 6893 mlxsw_sp_fib6_entry_create(struct mlxsw_sp *mlxsw_sp, 6894 struct mlxsw_sp_fib_node *fib_node, 6895 struct fib6_info **rt_arr, unsigned int nrt6) 6896 { 6897 struct mlxsw_sp_fib6_entry *fib6_entry; 6898 struct mlxsw_sp_fib_entry *fib_entry; 6899 struct mlxsw_sp_rt6 *mlxsw_sp_rt6; 6900 int err, i; 6901 6902 fib6_entry = kzalloc(sizeof(*fib6_entry), GFP_KERNEL); 6903 if (!fib6_entry) 6904 return ERR_PTR(-ENOMEM); 6905 fib_entry = &fib6_entry->common; 6906 6907 INIT_LIST_HEAD(&fib6_entry->rt6_list); 6908 6909 for (i = 0; i < nrt6; i++) { 6910 mlxsw_sp_rt6 = mlxsw_sp_rt6_create(rt_arr[i]); 6911 if (IS_ERR(mlxsw_sp_rt6)) { 6912 err = PTR_ERR(mlxsw_sp_rt6); 6913 goto err_rt6_unwind; 6914 } 6915 list_add_tail(&mlxsw_sp_rt6->list, &fib6_entry->rt6_list); 6916 fib6_entry->nrt6++; 6917 } 6918 6919 err = mlxsw_sp_nexthop6_group_get(mlxsw_sp, fib6_entry); 6920 if (err) 6921 goto err_rt6_unwind; 6922 6923 err = mlxsw_sp_nexthop_group_vr_link(fib_entry->nh_group, 6924 fib_node->fib); 6925 if (err) 6926 goto err_nexthop_group_vr_link; 6927 6928 err = mlxsw_sp_fib6_entry_type_set(mlxsw_sp, fib_entry, rt_arr[0]); 6929 if (err) 6930 goto err_fib6_entry_type_set; 6931 6932 fib_entry->fib_node = fib_node; 6933 6934 return fib6_entry; 6935 6936 err_fib6_entry_type_set: 6937 mlxsw_sp_nexthop_group_vr_unlink(fib_entry->nh_group, fib_node->fib); 6938 err_nexthop_group_vr_link: 6939 mlxsw_sp_nexthop6_group_put(mlxsw_sp, fib_entry); 6940 err_rt6_unwind: 6941 for (; i > 0; i--) { 6942 fib6_entry->nrt6--; 6943 mlxsw_sp_rt6 = list_last_entry(&fib6_entry->rt6_list, 6944 struct mlxsw_sp_rt6, list); 6945 list_del(&mlxsw_sp_rt6->list); 6946 mlxsw_sp_rt6_destroy(mlxsw_sp_rt6); 6947 } 6948 kfree(fib6_entry); 6949 return ERR_PTR(err); 6950 } 6951 6952 static void 6953 mlxsw_sp_fib6_entry_type_unset(struct mlxsw_sp *mlxsw_sp, 6954 struct mlxsw_sp_fib6_entry *fib6_entry) 6955 { 6956 mlxsw_sp_fib_entry_type_unset(mlxsw_sp, &fib6_entry->common); 6957 } 6958 6959 static void mlxsw_sp_fib6_entry_destroy(struct mlxsw_sp *mlxsw_sp, 6960 struct mlxsw_sp_fib6_entry *fib6_entry) 6961 { 6962 struct mlxsw_sp_fib_node *fib_node = fib6_entry->common.fib_node; 6963 6964 mlxsw_sp_fib6_entry_type_unset(mlxsw_sp, fib6_entry); 6965 mlxsw_sp_nexthop_group_vr_unlink(fib6_entry->common.nh_group, 6966 fib_node->fib); 6967 mlxsw_sp_nexthop6_group_put(mlxsw_sp, &fib6_entry->common); 6968 mlxsw_sp_fib6_entry_rt_destroy_all(fib6_entry); 6969 
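	/* mlxsw_sp_fib6_entry_rt_destroy_all() released every rt6 on the
	 * list, so the count is expected to be zero by now.
	 */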
WARN_ON(fib6_entry->nrt6); 6970 kfree(fib6_entry); 6971 } 6972 6973 static struct mlxsw_sp_fib6_entry * 6974 mlxsw_sp_fib6_entry_lookup(struct mlxsw_sp *mlxsw_sp, 6975 const struct fib6_info *rt) 6976 { 6977 struct mlxsw_sp_fib6_entry *fib6_entry; 6978 struct mlxsw_sp_fib_node *fib_node; 6979 struct mlxsw_sp_fib *fib; 6980 struct fib6_info *cmp_rt; 6981 struct mlxsw_sp_vr *vr; 6982 6983 vr = mlxsw_sp_vr_find(mlxsw_sp, rt->fib6_table->tb6_id); 6984 if (!vr) 6985 return NULL; 6986 fib = mlxsw_sp_vr_fib(vr, MLXSW_SP_L3_PROTO_IPV6); 6987 6988 fib_node = mlxsw_sp_fib_node_lookup(fib, &rt->fib6_dst.addr, 6989 sizeof(rt->fib6_dst.addr), 6990 rt->fib6_dst.plen); 6991 if (!fib_node) 6992 return NULL; 6993 6994 fib6_entry = container_of(fib_node->fib_entry, 6995 struct mlxsw_sp_fib6_entry, common); 6996 cmp_rt = mlxsw_sp_fib6_entry_rt(fib6_entry); 6997 if (rt->fib6_table->tb6_id == cmp_rt->fib6_table->tb6_id && 6998 rt->fib6_metric == cmp_rt->fib6_metric && 6999 mlxsw_sp_fib6_entry_rt_find(fib6_entry, rt)) 7000 return fib6_entry; 7001 7002 return NULL; 7003 } 7004 7005 static bool mlxsw_sp_fib6_allow_replace(struct mlxsw_sp_fib6_entry *fib6_entry) 7006 { 7007 struct mlxsw_sp_fib_node *fib_node = fib6_entry->common.fib_node; 7008 struct mlxsw_sp_fib6_entry *fib6_replaced; 7009 struct fib6_info *rt, *rt_replaced; 7010 7011 if (!fib_node->fib_entry) 7012 return true; 7013 7014 fib6_replaced = container_of(fib_node->fib_entry, 7015 struct mlxsw_sp_fib6_entry, 7016 common); 7017 rt = mlxsw_sp_fib6_entry_rt(fib6_entry); 7018 rt_replaced = mlxsw_sp_fib6_entry_rt(fib6_replaced); 7019 if (rt->fib6_table->tb6_id == RT_TABLE_MAIN && 7020 rt_replaced->fib6_table->tb6_id == RT_TABLE_LOCAL) 7021 return false; 7022 7023 return true; 7024 } 7025 7026 static int mlxsw_sp_router_fib6_replace(struct mlxsw_sp *mlxsw_sp, 7027 struct fib6_info **rt_arr, 7028 unsigned int nrt6) 7029 { 7030 struct mlxsw_sp_fib6_entry *fib6_entry, *fib6_replaced; 7031 struct mlxsw_sp_fib_entry *replaced; 7032 struct mlxsw_sp_fib_node *fib_node; 7033 struct fib6_info *rt = rt_arr[0]; 7034 int err; 7035 7036 if (rt->fib6_src.plen) 7037 return -EINVAL; 7038 7039 if (mlxsw_sp_fib6_rt_should_ignore(rt)) 7040 return 0; 7041 7042 if (rt->nh && !mlxsw_sp_nexthop_obj_group_lookup(mlxsw_sp, rt->nh->id)) 7043 return 0; 7044 7045 fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, rt->fib6_table->tb6_id, 7046 &rt->fib6_dst.addr, 7047 sizeof(rt->fib6_dst.addr), 7048 rt->fib6_dst.plen, 7049 MLXSW_SP_L3_PROTO_IPV6); 7050 if (IS_ERR(fib_node)) 7051 return PTR_ERR(fib_node); 7052 7053 fib6_entry = mlxsw_sp_fib6_entry_create(mlxsw_sp, fib_node, rt_arr, 7054 nrt6); 7055 if (IS_ERR(fib6_entry)) { 7056 err = PTR_ERR(fib6_entry); 7057 goto err_fib6_entry_create; 7058 } 7059 7060 if (!mlxsw_sp_fib6_allow_replace(fib6_entry)) { 7061 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry); 7062 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 7063 return 0; 7064 } 7065 7066 replaced = fib_node->fib_entry; 7067 err = mlxsw_sp_fib_node_entry_link(mlxsw_sp, &fib6_entry->common); 7068 if (err) 7069 goto err_fib_node_entry_link; 7070 7071 /* Nothing to replace */ 7072 if (!replaced) 7073 return 0; 7074 7075 mlxsw_sp_fib_entry_hw_flags_clear(mlxsw_sp, replaced); 7076 fib6_replaced = container_of(replaced, struct mlxsw_sp_fib6_entry, 7077 common); 7078 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_replaced); 7079 7080 return 0; 7081 7082 err_fib_node_entry_link: 7083 fib_node->fib_entry = replaced; 7084 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry); 7085 err_fib6_entry_create: 7086 
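	/* Drop the node reference taken by mlxsw_sp_fib_node_get() above. */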
mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 7087 return err; 7088 } 7089 7090 static int mlxsw_sp_router_fib6_append(struct mlxsw_sp *mlxsw_sp, 7091 struct fib6_info **rt_arr, 7092 unsigned int nrt6) 7093 { 7094 struct mlxsw_sp_fib6_entry *fib6_entry; 7095 struct mlxsw_sp_fib_node *fib_node; 7096 struct fib6_info *rt = rt_arr[0]; 7097 int err; 7098 7099 if (rt->fib6_src.plen) 7100 return -EINVAL; 7101 7102 if (mlxsw_sp_fib6_rt_should_ignore(rt)) 7103 return 0; 7104 7105 fib_node = mlxsw_sp_fib_node_get(mlxsw_sp, rt->fib6_table->tb6_id, 7106 &rt->fib6_dst.addr, 7107 sizeof(rt->fib6_dst.addr), 7108 rt->fib6_dst.plen, 7109 MLXSW_SP_L3_PROTO_IPV6); 7110 if (IS_ERR(fib_node)) 7111 return PTR_ERR(fib_node); 7112 7113 if (WARN_ON_ONCE(!fib_node->fib_entry)) { 7114 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 7115 return -EINVAL; 7116 } 7117 7118 fib6_entry = container_of(fib_node->fib_entry, 7119 struct mlxsw_sp_fib6_entry, common); 7120 err = mlxsw_sp_fib6_entry_nexthop_add(mlxsw_sp, fib6_entry, rt_arr, 7121 nrt6); 7122 if (err) 7123 goto err_fib6_entry_nexthop_add; 7124 7125 return 0; 7126 7127 err_fib6_entry_nexthop_add: 7128 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 7129 return err; 7130 } 7131 7132 static void mlxsw_sp_router_fib6_del(struct mlxsw_sp *mlxsw_sp, 7133 struct fib6_info **rt_arr, 7134 unsigned int nrt6) 7135 { 7136 struct mlxsw_sp_fib6_entry *fib6_entry; 7137 struct mlxsw_sp_fib_node *fib_node; 7138 struct fib6_info *rt = rt_arr[0]; 7139 7140 if (mlxsw_sp_fib6_rt_should_ignore(rt)) 7141 return; 7142 7143 /* Multipath routes are first added to the FIB trie and only then 7144 * notified. If we vetoed the addition, we will get a delete 7145 * notification for a route we do not have. Therefore, do not warn if 7146 * route was not found. 7147 */ 7148 fib6_entry = mlxsw_sp_fib6_entry_lookup(mlxsw_sp, rt); 7149 if (!fib6_entry) 7150 return; 7151 7152 /* If not all the nexthops are deleted, then only reduce the nexthop 7153 * group. 
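	 * A delete notification may name only some of the siblings of a
	 * multipath route; the remaining nexthops keep the entry alive.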
7154 */ 7155 if (nrt6 != fib6_entry->nrt6) { 7156 mlxsw_sp_fib6_entry_nexthop_del(mlxsw_sp, fib6_entry, rt_arr, 7157 nrt6); 7158 return; 7159 } 7160 7161 fib_node = fib6_entry->common.fib_node; 7162 7163 mlxsw_sp_fib_node_entry_unlink(mlxsw_sp, &fib6_entry->common); 7164 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry); 7165 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 7166 } 7167 7168 static struct mlxsw_sp_mr_table * 7169 mlxsw_sp_router_fibmr_family_to_table(struct mlxsw_sp_vr *vr, int family) 7170 { 7171 if (family == RTNL_FAMILY_IPMR) 7172 return vr->mr_table[MLXSW_SP_L3_PROTO_IPV4]; 7173 else 7174 return vr->mr_table[MLXSW_SP_L3_PROTO_IPV6]; 7175 } 7176 7177 static int mlxsw_sp_router_fibmr_add(struct mlxsw_sp *mlxsw_sp, 7178 struct mfc_entry_notifier_info *men_info, 7179 bool replace) 7180 { 7181 struct mlxsw_sp_mr_table *mrt; 7182 struct mlxsw_sp_vr *vr; 7183 7184 vr = mlxsw_sp_vr_get(mlxsw_sp, men_info->tb_id, NULL); 7185 if (IS_ERR(vr)) 7186 return PTR_ERR(vr); 7187 7188 mrt = mlxsw_sp_router_fibmr_family_to_table(vr, men_info->info.family); 7189 return mlxsw_sp_mr_route_add(mrt, men_info->mfc, replace); 7190 } 7191 7192 static void mlxsw_sp_router_fibmr_del(struct mlxsw_sp *mlxsw_sp, 7193 struct mfc_entry_notifier_info *men_info) 7194 { 7195 struct mlxsw_sp_mr_table *mrt; 7196 struct mlxsw_sp_vr *vr; 7197 7198 vr = mlxsw_sp_vr_find(mlxsw_sp, men_info->tb_id); 7199 if (WARN_ON(!vr)) 7200 return; 7201 7202 mrt = mlxsw_sp_router_fibmr_family_to_table(vr, men_info->info.family); 7203 mlxsw_sp_mr_route_del(mrt, men_info->mfc); 7204 mlxsw_sp_vr_put(mlxsw_sp, vr); 7205 } 7206 7207 static int 7208 mlxsw_sp_router_fibmr_vif_add(struct mlxsw_sp *mlxsw_sp, 7209 struct vif_entry_notifier_info *ven_info) 7210 { 7211 struct mlxsw_sp_mr_table *mrt; 7212 struct mlxsw_sp_rif *rif; 7213 struct mlxsw_sp_vr *vr; 7214 7215 vr = mlxsw_sp_vr_get(mlxsw_sp, ven_info->tb_id, NULL); 7216 if (IS_ERR(vr)) 7217 return PTR_ERR(vr); 7218 7219 mrt = mlxsw_sp_router_fibmr_family_to_table(vr, ven_info->info.family); 7220 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, ven_info->dev); 7221 return mlxsw_sp_mr_vif_add(mrt, ven_info->dev, 7222 ven_info->vif_index, 7223 ven_info->vif_flags, rif); 7224 } 7225 7226 static void 7227 mlxsw_sp_router_fibmr_vif_del(struct mlxsw_sp *mlxsw_sp, 7228 struct vif_entry_notifier_info *ven_info) 7229 { 7230 struct mlxsw_sp_mr_table *mrt; 7231 struct mlxsw_sp_vr *vr; 7232 7233 vr = mlxsw_sp_vr_find(mlxsw_sp, ven_info->tb_id); 7234 if (WARN_ON(!vr)) 7235 return; 7236 7237 mrt = mlxsw_sp_router_fibmr_family_to_table(vr, ven_info->info.family); 7238 mlxsw_sp_mr_vif_del(mrt, ven_info->vif_index); 7239 mlxsw_sp_vr_put(mlxsw_sp, vr); 7240 } 7241 7242 static void mlxsw_sp_fib4_node_flush(struct mlxsw_sp *mlxsw_sp, 7243 struct mlxsw_sp_fib_node *fib_node) 7244 { 7245 struct mlxsw_sp_fib4_entry *fib4_entry; 7246 7247 fib4_entry = container_of(fib_node->fib_entry, 7248 struct mlxsw_sp_fib4_entry, common); 7249 mlxsw_sp_fib_node_entry_unlink(mlxsw_sp, fib_node->fib_entry); 7250 mlxsw_sp_fib4_entry_destroy(mlxsw_sp, fib4_entry); 7251 mlxsw_sp_fib_node_put(mlxsw_sp, fib_node); 7252 } 7253 7254 static void mlxsw_sp_fib6_node_flush(struct mlxsw_sp *mlxsw_sp, 7255 struct mlxsw_sp_fib_node *fib_node) 7256 { 7257 struct mlxsw_sp_fib6_entry *fib6_entry; 7258 7259 fib6_entry = container_of(fib_node->fib_entry, 7260 struct mlxsw_sp_fib6_entry, common); 7261 mlxsw_sp_fib_node_entry_unlink(mlxsw_sp, fib_node->fib_entry); 7262 mlxsw_sp_fib6_entry_destroy(mlxsw_sp, fib6_entry); 7263 mlxsw_sp_fib_node_put(mlxsw_sp, 
fib_node); 7264 } 7265 7266 static void mlxsw_sp_fib_node_flush(struct mlxsw_sp *mlxsw_sp, 7267 struct mlxsw_sp_fib_node *fib_node) 7268 { 7269 switch (fib_node->fib->proto) { 7270 case MLXSW_SP_L3_PROTO_IPV4: 7271 mlxsw_sp_fib4_node_flush(mlxsw_sp, fib_node); 7272 break; 7273 case MLXSW_SP_L3_PROTO_IPV6: 7274 mlxsw_sp_fib6_node_flush(mlxsw_sp, fib_node); 7275 break; 7276 } 7277 } 7278 7279 static void mlxsw_sp_vr_fib_flush(struct mlxsw_sp *mlxsw_sp, 7280 struct mlxsw_sp_vr *vr, 7281 enum mlxsw_sp_l3proto proto) 7282 { 7283 struct mlxsw_sp_fib *fib = mlxsw_sp_vr_fib(vr, proto); 7284 struct mlxsw_sp_fib_node *fib_node, *tmp; 7285 7286 list_for_each_entry_safe(fib_node, tmp, &fib->node_list, list) { 7287 bool do_break = &tmp->list == &fib->node_list; 7288 7289 mlxsw_sp_fib_node_flush(mlxsw_sp, fib_node); 7290 if (do_break) 7291 break; 7292 } 7293 } 7294 7295 static void mlxsw_sp_router_fib_flush(struct mlxsw_sp *mlxsw_sp) 7296 { 7297 int i, j; 7298 7299 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_VRS); i++) { 7300 struct mlxsw_sp_vr *vr = &mlxsw_sp->router->vrs[i]; 7301 7302 if (!mlxsw_sp_vr_is_used(vr)) 7303 continue; 7304 7305 for (j = 0; j < MLXSW_SP_L3_PROTO_MAX; j++) 7306 mlxsw_sp_mr_table_flush(vr->mr_table[j]); 7307 mlxsw_sp_vr_fib_flush(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV4); 7308 7309 /* If virtual router was only used for IPv4, then it's no 7310 * longer used. 7311 */ 7312 if (!mlxsw_sp_vr_is_used(vr)) 7313 continue; 7314 mlxsw_sp_vr_fib_flush(mlxsw_sp, vr, MLXSW_SP_L3_PROTO_IPV6); 7315 } 7316 } 7317 7318 struct mlxsw_sp_fib6_event_work { 7319 struct fib6_info **rt_arr; 7320 unsigned int nrt6; 7321 }; 7322 7323 struct mlxsw_sp_fib_event_work { 7324 struct work_struct work; 7325 union { 7326 struct mlxsw_sp_fib6_event_work fib6_work; 7327 struct fib_entry_notifier_info fen_info; 7328 struct fib_rule_notifier_info fr_info; 7329 struct fib_nh_notifier_info fnh_info; 7330 struct mfc_entry_notifier_info men_info; 7331 struct vif_entry_notifier_info ven_info; 7332 }; 7333 struct mlxsw_sp *mlxsw_sp; 7334 unsigned long event; 7335 }; 7336 7337 static int 7338 mlxsw_sp_router_fib6_work_init(struct mlxsw_sp_fib6_event_work *fib6_work, 7339 struct fib6_entry_notifier_info *fen6_info) 7340 { 7341 struct fib6_info *rt = fen6_info->rt; 7342 struct fib6_info **rt_arr; 7343 struct fib6_info *iter; 7344 unsigned int nrt6; 7345 int i = 0; 7346 7347 nrt6 = fen6_info->nsiblings + 1; 7348 7349 rt_arr = kcalloc(nrt6, sizeof(struct fib6_info *), GFP_ATOMIC); 7350 if (!rt_arr) 7351 return -ENOMEM; 7352 7353 fib6_work->rt_arr = rt_arr; 7354 fib6_work->nrt6 = nrt6; 7355 7356 rt_arr[0] = rt; 7357 fib6_info_hold(rt); 7358 7359 if (!fen6_info->nsiblings) 7360 return 0; 7361 7362 list_for_each_entry(iter, &rt->fib6_siblings, fib6_siblings) { 7363 if (i == fen6_info->nsiblings) 7364 break; 7365 7366 rt_arr[i + 1] = iter; 7367 fib6_info_hold(iter); 7368 i++; 7369 } 7370 WARN_ON_ONCE(i != fen6_info->nsiblings); 7371 7372 return 0; 7373 } 7374 7375 static void 7376 mlxsw_sp_router_fib6_work_fini(struct mlxsw_sp_fib6_event_work *fib6_work) 7377 { 7378 int i; 7379 7380 for (i = 0; i < fib6_work->nrt6; i++) 7381 mlxsw_sp_rt6_release(fib6_work->rt_arr[i]); 7382 kfree(fib6_work->rt_arr); 7383 } 7384 7385 static void mlxsw_sp_router_fib4_event_work(struct work_struct *work) 7386 { 7387 struct mlxsw_sp_fib_event_work *fib_work = 7388 container_of(work, struct mlxsw_sp_fib_event_work, work); 7389 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp; 7390 int err; 7391 7392 mutex_lock(&mlxsw_sp->router->lock); 7393 
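	/* Routing changes can invalidate the egress port that active SPAN
	 * (mirroring) sessions resolved to, so re-resolve them before
	 * processing the event.
	 */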
mlxsw_sp_span_respin(mlxsw_sp); 7394 7395 switch (fib_work->event) { 7396 case FIB_EVENT_ENTRY_REPLACE: 7397 err = mlxsw_sp_router_fib4_replace(mlxsw_sp, 7398 &fib_work->fen_info); 7399 if (err) { 7400 dev_warn(mlxsw_sp->bus_info->dev, "FIB replace failed.\n"); 7401 mlxsw_sp_fib4_offload_failed_flag_set(mlxsw_sp, 7402 &fib_work->fen_info); 7403 } 7404 fib_info_put(fib_work->fen_info.fi); 7405 break; 7406 case FIB_EVENT_ENTRY_DEL: 7407 mlxsw_sp_router_fib4_del(mlxsw_sp, &fib_work->fen_info); 7408 fib_info_put(fib_work->fen_info.fi); 7409 break; 7410 case FIB_EVENT_NH_ADD: 7411 case FIB_EVENT_NH_DEL: 7412 mlxsw_sp_nexthop4_event(mlxsw_sp, fib_work->event, 7413 fib_work->fnh_info.fib_nh); 7414 fib_info_put(fib_work->fnh_info.fib_nh->nh_parent); 7415 break; 7416 } 7417 mutex_unlock(&mlxsw_sp->router->lock); 7418 kfree(fib_work); 7419 } 7420 7421 static void mlxsw_sp_router_fib6_event_work(struct work_struct *work) 7422 { 7423 struct mlxsw_sp_fib_event_work *fib_work = 7424 container_of(work, struct mlxsw_sp_fib_event_work, work); 7425 struct mlxsw_sp_fib6_event_work *fib6_work = &fib_work->fib6_work; 7426 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp; 7427 int err; 7428 7429 mutex_lock(&mlxsw_sp->router->lock); 7430 mlxsw_sp_span_respin(mlxsw_sp); 7431 7432 switch (fib_work->event) { 7433 case FIB_EVENT_ENTRY_REPLACE: 7434 err = mlxsw_sp_router_fib6_replace(mlxsw_sp, 7435 fib6_work->rt_arr, 7436 fib6_work->nrt6); 7437 if (err) { 7438 dev_warn(mlxsw_sp->bus_info->dev, "FIB replace failed.\n"); 7439 mlxsw_sp_fib6_offload_failed_flag_set(mlxsw_sp, 7440 fib6_work->rt_arr, 7441 fib6_work->nrt6); 7442 } 7443 mlxsw_sp_router_fib6_work_fini(fib6_work); 7444 break; 7445 case FIB_EVENT_ENTRY_APPEND: 7446 err = mlxsw_sp_router_fib6_append(mlxsw_sp, 7447 fib6_work->rt_arr, 7448 fib6_work->nrt6); 7449 if (err) { 7450 dev_warn(mlxsw_sp->bus_info->dev, "FIB append failed.\n"); 7451 mlxsw_sp_fib6_offload_failed_flag_set(mlxsw_sp, 7452 fib6_work->rt_arr, 7453 fib6_work->nrt6); 7454 } 7455 mlxsw_sp_router_fib6_work_fini(fib6_work); 7456 break; 7457 case FIB_EVENT_ENTRY_DEL: 7458 mlxsw_sp_router_fib6_del(mlxsw_sp, 7459 fib6_work->rt_arr, 7460 fib6_work->nrt6); 7461 mlxsw_sp_router_fib6_work_fini(fib6_work); 7462 break; 7463 } 7464 mutex_unlock(&mlxsw_sp->router->lock); 7465 kfree(fib_work); 7466 } 7467 7468 static void mlxsw_sp_router_fibmr_event_work(struct work_struct *work) 7469 { 7470 struct mlxsw_sp_fib_event_work *fib_work = 7471 container_of(work, struct mlxsw_sp_fib_event_work, work); 7472 struct mlxsw_sp *mlxsw_sp = fib_work->mlxsw_sp; 7473 bool replace; 7474 int err; 7475 7476 rtnl_lock(); 7477 mutex_lock(&mlxsw_sp->router->lock); 7478 switch (fib_work->event) { 7479 case FIB_EVENT_ENTRY_REPLACE: 7480 case FIB_EVENT_ENTRY_ADD: 7481 replace = fib_work->event == FIB_EVENT_ENTRY_REPLACE; 7482 7483 err = mlxsw_sp_router_fibmr_add(mlxsw_sp, &fib_work->men_info, 7484 replace); 7485 if (err) 7486 dev_warn(mlxsw_sp->bus_info->dev, "MR entry add failed.\n"); 7487 mr_cache_put(fib_work->men_info.mfc); 7488 break; 7489 case FIB_EVENT_ENTRY_DEL: 7490 mlxsw_sp_router_fibmr_del(mlxsw_sp, &fib_work->men_info); 7491 mr_cache_put(fib_work->men_info.mfc); 7492 break; 7493 case FIB_EVENT_VIF_ADD: 7494 err = mlxsw_sp_router_fibmr_vif_add(mlxsw_sp, 7495 &fib_work->ven_info); 7496 if (err) 7497 dev_warn(mlxsw_sp->bus_info->dev, "MR VIF add failed.\n"); 7498 dev_put(fib_work->ven_info.dev); 7499 break; 7500 case FIB_EVENT_VIF_DEL: 7501 mlxsw_sp_router_fibmr_vif_del(mlxsw_sp, 7502 &fib_work->ven_info); 7503 
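		/* Matches the dev_hold() taken when the event was queued. */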
dev_put(fib_work->ven_info.dev); 7504 break; 7505 } 7506 mutex_unlock(&mlxsw_sp->router->lock); 7507 rtnl_unlock(); 7508 kfree(fib_work); 7509 } 7510 7511 static void mlxsw_sp_router_fib4_event(struct mlxsw_sp_fib_event_work *fib_work, 7512 struct fib_notifier_info *info) 7513 { 7514 struct fib_entry_notifier_info *fen_info; 7515 struct fib_nh_notifier_info *fnh_info; 7516 7517 switch (fib_work->event) { 7518 case FIB_EVENT_ENTRY_REPLACE: 7519 case FIB_EVENT_ENTRY_DEL: 7520 fen_info = container_of(info, struct fib_entry_notifier_info, 7521 info); 7522 fib_work->fen_info = *fen_info; 7523 /* Take reference on fib_info to prevent it from being 7524 * freed while work is queued. Release it afterwards. 7525 */ 7526 fib_info_hold(fib_work->fen_info.fi); 7527 break; 7528 case FIB_EVENT_NH_ADD: 7529 case FIB_EVENT_NH_DEL: 7530 fnh_info = container_of(info, struct fib_nh_notifier_info, 7531 info); 7532 fib_work->fnh_info = *fnh_info; 7533 fib_info_hold(fib_work->fnh_info.fib_nh->nh_parent); 7534 break; 7535 } 7536 } 7537 7538 static int mlxsw_sp_router_fib6_event(struct mlxsw_sp_fib_event_work *fib_work, 7539 struct fib_notifier_info *info) 7540 { 7541 struct fib6_entry_notifier_info *fen6_info; 7542 int err; 7543 7544 switch (fib_work->event) { 7545 case FIB_EVENT_ENTRY_REPLACE: 7546 case FIB_EVENT_ENTRY_APPEND: 7547 case FIB_EVENT_ENTRY_DEL: 7548 fen6_info = container_of(info, struct fib6_entry_notifier_info, 7549 info); 7550 err = mlxsw_sp_router_fib6_work_init(&fib_work->fib6_work, 7551 fen6_info); 7552 if (err) 7553 return err; 7554 break; 7555 } 7556 7557 return 0; 7558 } 7559 7560 static void 7561 mlxsw_sp_router_fibmr_event(struct mlxsw_sp_fib_event_work *fib_work, 7562 struct fib_notifier_info *info) 7563 { 7564 switch (fib_work->event) { 7565 case FIB_EVENT_ENTRY_REPLACE: 7566 case FIB_EVENT_ENTRY_ADD: 7567 case FIB_EVENT_ENTRY_DEL: 7568 memcpy(&fib_work->men_info, info, sizeof(fib_work->men_info)); 7569 mr_cache_hold(fib_work->men_info.mfc); 7570 break; 7571 case FIB_EVENT_VIF_ADD: 7572 case FIB_EVENT_VIF_DEL: 7573 memcpy(&fib_work->ven_info, info, sizeof(fib_work->ven_info)); 7574 dev_hold(fib_work->ven_info.dev); 7575 break; 7576 } 7577 } 7578 7579 static int mlxsw_sp_router_fib_rule_event(unsigned long event, 7580 struct fib_notifier_info *info, 7581 struct mlxsw_sp *mlxsw_sp) 7582 { 7583 struct netlink_ext_ack *extack = info->extack; 7584 struct fib_rule_notifier_info *fr_info; 7585 struct fib_rule *rule; 7586 int err = 0; 7587 7588 /* nothing to do at the moment */ 7589 if (event == FIB_EVENT_RULE_DEL) 7590 return 0; 7591 7592 fr_info = container_of(info, struct fib_rule_notifier_info, info); 7593 rule = fr_info->rule; 7594 7595 /* Rule only affects locally generated traffic */ 7596 if (rule->iifindex == mlxsw_sp_net(mlxsw_sp)->loopback_dev->ifindex) 7597 return 0; 7598 7599 switch (info->family) { 7600 case AF_INET: 7601 if (!fib4_rule_default(rule) && !rule->l3mdev) 7602 err = -EOPNOTSUPP; 7603 break; 7604 case AF_INET6: 7605 if (!fib6_rule_default(rule) && !rule->l3mdev) 7606 err = -EOPNOTSUPP; 7607 break; 7608 case RTNL_FAMILY_IPMR: 7609 if (!ipmr_rule_default(rule) && !rule->l3mdev) 7610 err = -EOPNOTSUPP; 7611 break; 7612 case RTNL_FAMILY_IP6MR: 7613 if (!ip6mr_rule_default(rule) && !rule->l3mdev) 7614 err = -EOPNOTSUPP; 7615 break; 7616 } 7617 7618 if (err < 0) 7619 NL_SET_ERR_MSG_MOD(extack, "FIB rules not supported"); 7620 7621 return err; 7622 } 7623 7624 /* Called with rcu_read_lock() */ 7625 static int mlxsw_sp_router_fib_event(struct notifier_block *nb, 7626 unsigned 
long event, void *ptr) 7627 { 7628 struct mlxsw_sp_fib_event_work *fib_work; 7629 struct fib_notifier_info *info = ptr; 7630 struct mlxsw_sp_router *router; 7631 int err; 7632 7633 if ((info->family != AF_INET && info->family != AF_INET6 && 7634 info->family != RTNL_FAMILY_IPMR && 7635 info->family != RTNL_FAMILY_IP6MR)) 7636 return NOTIFY_DONE; 7637 7638 router = container_of(nb, struct mlxsw_sp_router, fib_nb); 7639 7640 switch (event) { 7641 case FIB_EVENT_RULE_ADD: 7642 case FIB_EVENT_RULE_DEL: 7643 err = mlxsw_sp_router_fib_rule_event(event, info, 7644 router->mlxsw_sp); 7645 return notifier_from_errno(err); 7646 case FIB_EVENT_ENTRY_ADD: 7647 case FIB_EVENT_ENTRY_REPLACE: 7648 case FIB_EVENT_ENTRY_APPEND: 7649 if (info->family == AF_INET) { 7650 struct fib_entry_notifier_info *fen_info = ptr; 7651 7652 if (fen_info->fi->fib_nh_is_v6) { 7653 NL_SET_ERR_MSG_MOD(info->extack, "IPv6 gateway with IPv4 route is not supported"); 7654 return notifier_from_errno(-EINVAL); 7655 } 7656 } 7657 break; 7658 } 7659 7660 fib_work = kzalloc(sizeof(*fib_work), GFP_ATOMIC); 7661 if (!fib_work) 7662 return NOTIFY_BAD; 7663 7664 fib_work->mlxsw_sp = router->mlxsw_sp; 7665 fib_work->event = event; 7666 7667 switch (info->family) { 7668 case AF_INET: 7669 INIT_WORK(&fib_work->work, mlxsw_sp_router_fib4_event_work); 7670 mlxsw_sp_router_fib4_event(fib_work, info); 7671 break; 7672 case AF_INET6: 7673 INIT_WORK(&fib_work->work, mlxsw_sp_router_fib6_event_work); 7674 err = mlxsw_sp_router_fib6_event(fib_work, info); 7675 if (err) 7676 goto err_fib_event; 7677 break; 7678 case RTNL_FAMILY_IP6MR: 7679 case RTNL_FAMILY_IPMR: 7680 INIT_WORK(&fib_work->work, mlxsw_sp_router_fibmr_event_work); 7681 mlxsw_sp_router_fibmr_event(fib_work, info); 7682 break; 7683 } 7684 7685 mlxsw_core_schedule_work(&fib_work->work); 7686 7687 return NOTIFY_DONE; 7688 7689 err_fib_event: 7690 kfree(fib_work); 7691 return NOTIFY_BAD; 7692 } 7693 7694 static struct mlxsw_sp_rif * 7695 mlxsw_sp_rif_find_by_dev(const struct mlxsw_sp *mlxsw_sp, 7696 const struct net_device *dev) 7697 { 7698 int i; 7699 7700 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++) 7701 if (mlxsw_sp->router->rifs[i] && 7702 mlxsw_sp->router->rifs[i]->dev == dev) 7703 return mlxsw_sp->router->rifs[i]; 7704 7705 return NULL; 7706 } 7707 7708 bool mlxsw_sp_rif_exists(struct mlxsw_sp *mlxsw_sp, 7709 const struct net_device *dev) 7710 { 7711 struct mlxsw_sp_rif *rif; 7712 7713 mutex_lock(&mlxsw_sp->router->lock); 7714 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 7715 mutex_unlock(&mlxsw_sp->router->lock); 7716 7717 return rif; 7718 } 7719 7720 u16 mlxsw_sp_rif_vid(struct mlxsw_sp *mlxsw_sp, const struct net_device *dev) 7721 { 7722 struct mlxsw_sp_rif *rif; 7723 u16 vid = 0; 7724 7725 mutex_lock(&mlxsw_sp->router->lock); 7726 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 7727 if (!rif) 7728 goto out; 7729 7730 /* We only return the VID for VLAN RIFs. Otherwise we return an 7731 * invalid value (0). 
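 * Zero is a safe sentinel here, since valid 802.1Q VIDs are in the
 * 1-4094 range.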
7732 */ 7733 if (rif->ops->type != MLXSW_SP_RIF_TYPE_VLAN) 7734 goto out; 7735 7736 vid = mlxsw_sp_fid_8021q_vid(rif->fid); 7737 7738 out: 7739 mutex_unlock(&mlxsw_sp->router->lock); 7740 return vid; 7741 } 7742 7743 static int mlxsw_sp_router_rif_disable(struct mlxsw_sp *mlxsw_sp, u16 rif) 7744 { 7745 char ritr_pl[MLXSW_REG_RITR_LEN]; 7746 int err; 7747 7748 mlxsw_reg_ritr_rif_pack(ritr_pl, rif); 7749 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 7750 if (err) 7751 return err; 7752 7753 mlxsw_reg_ritr_enable_set(ritr_pl, false); 7754 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 7755 } 7756 7757 static void mlxsw_sp_router_rif_gone_sync(struct mlxsw_sp *mlxsw_sp, 7758 struct mlxsw_sp_rif *rif) 7759 { 7760 mlxsw_sp_router_rif_disable(mlxsw_sp, rif->rif_index); 7761 mlxsw_sp_nexthop_rif_gone_sync(mlxsw_sp, rif); 7762 mlxsw_sp_neigh_rif_gone_sync(mlxsw_sp, rif); 7763 } 7764 7765 static bool 7766 mlxsw_sp_rif_should_config(struct mlxsw_sp_rif *rif, struct net_device *dev, 7767 unsigned long event) 7768 { 7769 struct inet6_dev *inet6_dev; 7770 bool addr_list_empty = true; 7771 struct in_device *idev; 7772 7773 switch (event) { 7774 case NETDEV_UP: 7775 return rif == NULL; 7776 case NETDEV_DOWN: 7777 rcu_read_lock(); 7778 idev = __in_dev_get_rcu(dev); 7779 if (idev && idev->ifa_list) 7780 addr_list_empty = false; 7781 7782 inet6_dev = __in6_dev_get(dev); 7783 if (addr_list_empty && inet6_dev && 7784 !list_empty(&inet6_dev->addr_list)) 7785 addr_list_empty = false; 7786 rcu_read_unlock(); 7787 7788 /* macvlans do not have a RIF, but rather piggy back on the 7789 * RIF of their lower device. 7790 */ 7791 if (netif_is_macvlan(dev) && addr_list_empty) 7792 return true; 7793 7794 if (rif && addr_list_empty && 7795 !netif_is_l3_slave(rif->dev)) 7796 return true; 7797 /* It is possible we already removed the RIF ourselves 7798 * if it was assigned to a netdev that is now a bridge 7799 * or LAG slave. 7800 */ 7801 return false; 7802 } 7803 7804 return false; 7805 } 7806 7807 static enum mlxsw_sp_rif_type 7808 mlxsw_sp_dev_rif_type(const struct mlxsw_sp *mlxsw_sp, 7809 const struct net_device *dev) 7810 { 7811 enum mlxsw_sp_fid_type type; 7812 7813 if (mlxsw_sp_netdev_ipip_type(mlxsw_sp, dev, NULL)) 7814 return MLXSW_SP_RIF_TYPE_IPIP_LB; 7815 7816 /* Otherwise RIF type is derived from the type of the underlying FID. 
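 * VLAN uppers of bridges and VLAN-aware bridges themselves use an
 * 802.1Q FID, VLAN-unaware bridges use an 802.1D FID and all other
 * netdevs (ports, LAGs and their VLAN uppers) use an rFID.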
*/ 7817 if (is_vlan_dev(dev) && netif_is_bridge_master(vlan_dev_real_dev(dev))) 7818 type = MLXSW_SP_FID_TYPE_8021Q; 7819 else if (netif_is_bridge_master(dev) && br_vlan_enabled(dev)) 7820 type = MLXSW_SP_FID_TYPE_8021Q; 7821 else if (netif_is_bridge_master(dev)) 7822 type = MLXSW_SP_FID_TYPE_8021D; 7823 else 7824 type = MLXSW_SP_FID_TYPE_RFID; 7825 7826 return mlxsw_sp_fid_type_rif_type(mlxsw_sp, type); 7827 } 7828 7829 static int mlxsw_sp_rif_index_alloc(struct mlxsw_sp *mlxsw_sp, u16 *p_rif_index) 7830 { 7831 int i; 7832 7833 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++) { 7834 if (!mlxsw_sp->router->rifs[i]) { 7835 *p_rif_index = i; 7836 return 0; 7837 } 7838 } 7839 7840 return -ENOBUFS; 7841 } 7842 7843 static struct mlxsw_sp_rif *mlxsw_sp_rif_alloc(size_t rif_size, u16 rif_index, 7844 u16 vr_id, 7845 struct net_device *l3_dev) 7846 { 7847 struct mlxsw_sp_rif *rif; 7848 7849 rif = kzalloc(rif_size, GFP_KERNEL); 7850 if (!rif) 7851 return NULL; 7852 7853 INIT_LIST_HEAD(&rif->nexthop_list); 7854 INIT_LIST_HEAD(&rif->neigh_list); 7855 if (l3_dev) { 7856 ether_addr_copy(rif->addr, l3_dev->dev_addr); 7857 rif->mtu = l3_dev->mtu; 7858 rif->dev = l3_dev; 7859 } 7860 rif->vr_id = vr_id; 7861 rif->rif_index = rif_index; 7862 7863 return rif; 7864 } 7865 7866 struct mlxsw_sp_rif *mlxsw_sp_rif_by_index(const struct mlxsw_sp *mlxsw_sp, 7867 u16 rif_index) 7868 { 7869 return mlxsw_sp->router->rifs[rif_index]; 7870 } 7871 7872 u16 mlxsw_sp_rif_index(const struct mlxsw_sp_rif *rif) 7873 { 7874 return rif->rif_index; 7875 } 7876 7877 u16 mlxsw_sp_ipip_lb_rif_index(const struct mlxsw_sp_rif_ipip_lb *lb_rif) 7878 { 7879 return lb_rif->common.rif_index; 7880 } 7881 7882 u16 mlxsw_sp_ipip_lb_ul_vr_id(const struct mlxsw_sp_rif_ipip_lb *lb_rif) 7883 { 7884 u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(lb_rif->common.dev); 7885 struct mlxsw_sp_vr *ul_vr; 7886 7887 ul_vr = mlxsw_sp_vr_get(lb_rif->common.mlxsw_sp, ul_tb_id, NULL); 7888 if (WARN_ON(IS_ERR(ul_vr))) 7889 return 0; 7890 7891 return ul_vr->id; 7892 } 7893 7894 u16 mlxsw_sp_ipip_lb_ul_rif_id(const struct mlxsw_sp_rif_ipip_lb *lb_rif) 7895 { 7896 return lb_rif->ul_rif_id; 7897 } 7898 7899 static bool 7900 mlxsw_sp_router_port_l3_stats_enabled(struct mlxsw_sp_rif *rif) 7901 { 7902 return mlxsw_sp_rif_counter_valid_get(rif, 7903 MLXSW_SP_RIF_COUNTER_EGRESS) && 7904 mlxsw_sp_rif_counter_valid_get(rif, 7905 MLXSW_SP_RIF_COUNTER_INGRESS); 7906 } 7907 7908 static int 7909 mlxsw_sp_router_port_l3_stats_enable(struct mlxsw_sp_rif *rif) 7910 { 7911 int err; 7912 7913 err = mlxsw_sp_rif_counter_alloc(rif, MLXSW_SP_RIF_COUNTER_INGRESS); 7914 if (err) 7915 return err; 7916 7917 /* Clear stale data. */ 7918 err = mlxsw_sp_rif_counter_fetch_clear(rif, 7919 MLXSW_SP_RIF_COUNTER_INGRESS, 7920 NULL); 7921 if (err) 7922 goto err_clear_ingress; 7923 7924 err = mlxsw_sp_rif_counter_alloc(rif, MLXSW_SP_RIF_COUNTER_EGRESS); 7925 if (err) 7926 goto err_alloc_egress; 7927 7928 /* Clear stale data. 
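 * The newly allocated egress counter may still hold values from a
 * previous user, so fetch it once and discard the result.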
*/ 7929 err = mlxsw_sp_rif_counter_fetch_clear(rif, 7930 MLXSW_SP_RIF_COUNTER_EGRESS, 7931 NULL); 7932 if (err) 7933 goto err_clear_egress; 7934 7935 return 0; 7936 7937 err_clear_egress: 7938 mlxsw_sp_rif_counter_free(rif, MLXSW_SP_RIF_COUNTER_EGRESS); 7939 err_alloc_egress: 7940 err_clear_ingress: 7941 mlxsw_sp_rif_counter_free(rif, MLXSW_SP_RIF_COUNTER_INGRESS); 7942 return err; 7943 } 7944 7945 static void 7946 mlxsw_sp_router_port_l3_stats_disable(struct mlxsw_sp_rif *rif) 7947 { 7948 mlxsw_sp_rif_counter_free(rif, MLXSW_SP_RIF_COUNTER_EGRESS); 7949 mlxsw_sp_rif_counter_free(rif, MLXSW_SP_RIF_COUNTER_INGRESS); 7950 } 7951 7952 static void 7953 mlxsw_sp_router_port_l3_stats_report_used(struct mlxsw_sp_rif *rif, 7954 struct netdev_notifier_offload_xstats_info *info) 7955 { 7956 if (!mlxsw_sp_router_port_l3_stats_enabled(rif)) 7957 return; 7958 netdev_offload_xstats_report_used(info->report_used); 7959 } 7960 7961 static int 7962 mlxsw_sp_router_port_l3_stats_fetch(struct mlxsw_sp_rif *rif, 7963 struct rtnl_hw_stats64 *p_stats) 7964 { 7965 struct mlxsw_sp_rif_counter_set_basic ingress; 7966 struct mlxsw_sp_rif_counter_set_basic egress; 7967 int err; 7968 7969 err = mlxsw_sp_rif_counter_fetch_clear(rif, 7970 MLXSW_SP_RIF_COUNTER_INGRESS, 7971 &ingress); 7972 if (err) 7973 return err; 7974 7975 err = mlxsw_sp_rif_counter_fetch_clear(rif, 7976 MLXSW_SP_RIF_COUNTER_EGRESS, 7977 &egress); 7978 if (err) 7979 return err; 7980 7981 #define MLXSW_SP_ROUTER_ALL_GOOD(SET, SFX) \ 7982 ((SET.good_unicast_ ## SFX) + \ 7983 (SET.good_multicast_ ## SFX) + \ 7984 (SET.good_broadcast_ ## SFX)) 7985 7986 p_stats->rx_packets = MLXSW_SP_ROUTER_ALL_GOOD(ingress, packets); 7987 p_stats->tx_packets = MLXSW_SP_ROUTER_ALL_GOOD(egress, packets); 7988 p_stats->rx_bytes = MLXSW_SP_ROUTER_ALL_GOOD(ingress, bytes); 7989 p_stats->tx_bytes = MLXSW_SP_ROUTER_ALL_GOOD(egress, bytes); 7990 p_stats->rx_errors = ingress.error_packets; 7991 p_stats->tx_errors = egress.error_packets; 7992 p_stats->rx_dropped = ingress.discard_packets; 7993 p_stats->tx_dropped = egress.discard_packets; 7994 p_stats->multicast = ingress.good_multicast_packets + 7995 ingress.good_broadcast_packets; 7996 7997 #undef MLXSW_SP_ROUTER_ALL_GOOD 7998 7999 return 0; 8000 } 8001 8002 static int 8003 mlxsw_sp_router_port_l3_stats_report_delta(struct mlxsw_sp_rif *rif, 8004 struct netdev_notifier_offload_xstats_info *info) 8005 { 8006 struct rtnl_hw_stats64 stats = {}; 8007 int err; 8008 8009 if (!mlxsw_sp_router_port_l3_stats_enabled(rif)) 8010 return 0; 8011 8012 err = mlxsw_sp_router_port_l3_stats_fetch(rif, &stats); 8013 if (err) 8014 return err; 8015 8016 netdev_offload_xstats_report_delta(info->report_delta, &stats); 8017 return 0; 8018 } 8019 8020 struct mlxsw_sp_router_hwstats_notify_work { 8021 struct work_struct work; 8022 struct net_device *dev; 8023 }; 8024 8025 static void mlxsw_sp_router_hwstats_notify_work(struct work_struct *work) 8026 { 8027 struct mlxsw_sp_router_hwstats_notify_work *hws_work = 8028 container_of(work, struct mlxsw_sp_router_hwstats_notify_work, 8029 work); 8030 8031 rtnl_lock(); 8032 rtnl_offload_xstats_notify(hws_work->dev); 8033 rtnl_unlock(); 8034 dev_put(hws_work->dev); 8035 kfree(hws_work); 8036 } 8037 8038 static void 8039 mlxsw_sp_router_hwstats_notify_schedule(struct net_device *dev) 8040 { 8041 struct mlxsw_sp_router_hwstats_notify_work *hws_work; 8042 8043 /* To collect notification payload, the core ends up sending another 8044 * notifier block message, which would deadlock on the attempt to 8045 * acquire the 
router lock again. Just postpone the notification until 8046 * later. 8047 */ 8048 8049 hws_work = kzalloc(sizeof(*hws_work), GFP_KERNEL); 8050 if (!hws_work) 8051 return; 8052 8053 INIT_WORK(&hws_work->work, mlxsw_sp_router_hwstats_notify_work); 8054 dev_hold(dev); 8055 hws_work->dev = dev; 8056 mlxsw_core_schedule_work(&hws_work->work); 8057 } 8058 8059 int mlxsw_sp_rif_dev_ifindex(const struct mlxsw_sp_rif *rif) 8060 { 8061 return rif->dev->ifindex; 8062 } 8063 8064 const struct net_device *mlxsw_sp_rif_dev(const struct mlxsw_sp_rif *rif) 8065 { 8066 return rif->dev; 8067 } 8068 8069 static void mlxsw_sp_rif_push_l3_stats(struct mlxsw_sp_rif *rif) 8070 { 8071 struct rtnl_hw_stats64 stats = {}; 8072 8073 if (!mlxsw_sp_router_port_l3_stats_fetch(rif, &stats)) 8074 netdev_offload_xstats_push_delta(rif->dev, 8075 NETDEV_OFFLOAD_XSTATS_TYPE_L3, 8076 &stats); 8077 } 8078 8079 static struct mlxsw_sp_rif * 8080 mlxsw_sp_rif_create(struct mlxsw_sp *mlxsw_sp, 8081 const struct mlxsw_sp_rif_params *params, 8082 struct netlink_ext_ack *extack) 8083 { 8084 u32 tb_id = l3mdev_fib_table(params->dev); 8085 const struct mlxsw_sp_rif_ops *ops; 8086 struct mlxsw_sp_fid *fid = NULL; 8087 enum mlxsw_sp_rif_type type; 8088 struct mlxsw_sp_rif *rif; 8089 struct mlxsw_sp_vr *vr; 8090 u16 rif_index; 8091 int i, err; 8092 8093 type = mlxsw_sp_dev_rif_type(mlxsw_sp, params->dev); 8094 ops = mlxsw_sp->router->rif_ops_arr[type]; 8095 8096 vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id ? : RT_TABLE_MAIN, extack); 8097 if (IS_ERR(vr)) 8098 return ERR_CAST(vr); 8099 vr->rif_count++; 8100 8101 err = mlxsw_sp_rif_index_alloc(mlxsw_sp, &rif_index); 8102 if (err) { 8103 NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported router interfaces"); 8104 goto err_rif_index_alloc; 8105 } 8106 8107 rif = mlxsw_sp_rif_alloc(ops->rif_size, rif_index, vr->id, params->dev); 8108 if (!rif) { 8109 err = -ENOMEM; 8110 goto err_rif_alloc; 8111 } 8112 dev_hold(rif->dev); 8113 mlxsw_sp->router->rifs[rif_index] = rif; 8114 rif->mlxsw_sp = mlxsw_sp; 8115 rif->ops = ops; 8116 8117 if (ops->fid_get) { 8118 fid = ops->fid_get(rif, extack); 8119 if (IS_ERR(fid)) { 8120 err = PTR_ERR(fid); 8121 goto err_fid_get; 8122 } 8123 rif->fid = fid; 8124 } 8125 8126 if (ops->setup) 8127 ops->setup(rif, params); 8128 8129 err = ops->configure(rif, extack); 8130 if (err) 8131 goto err_configure; 8132 8133 for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++) { 8134 err = mlxsw_sp_mr_rif_add(vr->mr_table[i], rif); 8135 if (err) 8136 goto err_mr_rif_add; 8137 } 8138 8139 if (netdev_offload_xstats_enabled(rif->dev, 8140 NETDEV_OFFLOAD_XSTATS_TYPE_L3)) { 8141 err = mlxsw_sp_router_port_l3_stats_enable(rif); 8142 if (err) 8143 goto err_stats_enable; 8144 mlxsw_sp_router_hwstats_notify_schedule(rif->dev); 8145 } else { 8146 mlxsw_sp_rif_counters_alloc(rif); 8147 } 8148 8149 atomic_inc(&mlxsw_sp->router->rifs_count); 8150 return rif; 8151 8152 err_stats_enable: 8153 err_mr_rif_add: 8154 for (i--; i >= 0; i--) 8155 mlxsw_sp_mr_rif_del(vr->mr_table[i], rif); 8156 ops->deconfigure(rif); 8157 err_configure: 8158 if (fid) 8159 mlxsw_sp_fid_put(fid); 8160 err_fid_get: 8161 mlxsw_sp->router->rifs[rif_index] = NULL; 8162 dev_put(rif->dev); 8163 kfree(rif); 8164 err_rif_alloc: 8165 err_rif_index_alloc: 8166 vr->rif_count--; 8167 mlxsw_sp_vr_put(mlxsw_sp, vr); 8168 return ERR_PTR(err); 8169 } 8170 8171 static void mlxsw_sp_rif_destroy(struct mlxsw_sp_rif *rif) 8172 { 8173 const struct mlxsw_sp_rif_ops *ops = rif->ops; 8174 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 8175 struct mlxsw_sp_fid 
*fid = rif->fid; 8176 struct mlxsw_sp_vr *vr; 8177 int i; 8178 8179 atomic_dec(&mlxsw_sp->router->rifs_count); 8180 mlxsw_sp_router_rif_gone_sync(mlxsw_sp, rif); 8181 vr = &mlxsw_sp->router->vrs[rif->vr_id]; 8182 8183 if (netdev_offload_xstats_enabled(rif->dev, 8184 NETDEV_OFFLOAD_XSTATS_TYPE_L3)) { 8185 mlxsw_sp_rif_push_l3_stats(rif); 8186 mlxsw_sp_router_port_l3_stats_disable(rif); 8187 mlxsw_sp_router_hwstats_notify_schedule(rif->dev); 8188 } else { 8189 mlxsw_sp_rif_counters_free(rif); 8190 } 8191 8192 for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++) 8193 mlxsw_sp_mr_rif_del(vr->mr_table[i], rif); 8194 ops->deconfigure(rif); 8195 if (fid) 8196 /* Loopback RIFs are not associated with a FID. */ 8197 mlxsw_sp_fid_put(fid); 8198 mlxsw_sp->router->rifs[rif->rif_index] = NULL; 8199 dev_put(rif->dev); 8200 kfree(rif); 8201 vr->rif_count--; 8202 mlxsw_sp_vr_put(mlxsw_sp, vr); 8203 } 8204 8205 void mlxsw_sp_rif_destroy_by_dev(struct mlxsw_sp *mlxsw_sp, 8206 struct net_device *dev) 8207 { 8208 struct mlxsw_sp_rif *rif; 8209 8210 mutex_lock(&mlxsw_sp->router->lock); 8211 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 8212 if (!rif) 8213 goto out; 8214 mlxsw_sp_rif_destroy(rif); 8215 out: 8216 mutex_unlock(&mlxsw_sp->router->lock); 8217 } 8218 8219 static void 8220 mlxsw_sp_rif_subport_params_init(struct mlxsw_sp_rif_params *params, 8221 struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan) 8222 { 8223 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port; 8224 8225 params->vid = mlxsw_sp_port_vlan->vid; 8226 params->lag = mlxsw_sp_port->lagged; 8227 if (params->lag) 8228 params->lag_id = mlxsw_sp_port->lag_id; 8229 else 8230 params->system_port = mlxsw_sp_port->local_port; 8231 } 8232 8233 static struct mlxsw_sp_rif_subport * 8234 mlxsw_sp_rif_subport_rif(const struct mlxsw_sp_rif *rif) 8235 { 8236 return container_of(rif, struct mlxsw_sp_rif_subport, common); 8237 } 8238 8239 static struct mlxsw_sp_rif * 8240 mlxsw_sp_rif_subport_get(struct mlxsw_sp *mlxsw_sp, 8241 const struct mlxsw_sp_rif_params *params, 8242 struct netlink_ext_ack *extack) 8243 { 8244 struct mlxsw_sp_rif_subport *rif_subport; 8245 struct mlxsw_sp_rif *rif; 8246 8247 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, params->dev); 8248 if (!rif) 8249 return mlxsw_sp_rif_create(mlxsw_sp, params, extack); 8250 8251 rif_subport = mlxsw_sp_rif_subport_rif(rif); 8252 refcount_inc(&rif_subport->ref_count); 8253 return rif; 8254 } 8255 8256 static void mlxsw_sp_rif_subport_put(struct mlxsw_sp_rif *rif) 8257 { 8258 struct mlxsw_sp_rif_subport *rif_subport; 8259 8260 rif_subport = mlxsw_sp_rif_subport_rif(rif); 8261 if (!refcount_dec_and_test(&rif_subport->ref_count)) 8262 return; 8263 8264 mlxsw_sp_rif_destroy(rif); 8265 } 8266 8267 static int mlxsw_sp_rif_mac_profile_index_alloc(struct mlxsw_sp *mlxsw_sp, 8268 struct mlxsw_sp_rif_mac_profile *profile, 8269 struct netlink_ext_ack *extack) 8270 { 8271 u8 max_rif_mac_profiles = mlxsw_sp->router->max_rif_mac_profile; 8272 struct mlxsw_sp_router *router = mlxsw_sp->router; 8273 int id; 8274 8275 id = idr_alloc(&router->rif_mac_profiles_idr, profile, 0, 8276 max_rif_mac_profiles, GFP_KERNEL); 8277 8278 if (id >= 0) { 8279 profile->id = id; 8280 return 0; 8281 } 8282 8283 if (id == -ENOSPC) 8284 NL_SET_ERR_MSG_MOD(extack, 8285 "Exceeded number of supported router interface MAC profiles"); 8286 8287 return id; 8288 } 8289 8290 static struct mlxsw_sp_rif_mac_profile * 8291 mlxsw_sp_rif_mac_profile_index_free(struct mlxsw_sp *mlxsw_sp, u8 mac_profile) 8292 { 8293 struct mlxsw_sp_rif_mac_profile 
*profile; 8294 8295 profile = idr_remove(&mlxsw_sp->router->rif_mac_profiles_idr, 8296 mac_profile); 8297 WARN_ON(!profile); 8298 return profile; 8299 } 8300 8301 static struct mlxsw_sp_rif_mac_profile * 8302 mlxsw_sp_rif_mac_profile_alloc(const char *mac) 8303 { 8304 struct mlxsw_sp_rif_mac_profile *profile; 8305 8306 profile = kzalloc(sizeof(*profile), GFP_KERNEL); 8307 if (!profile) 8308 return NULL; 8309 8310 ether_addr_copy(profile->mac_prefix, mac); 8311 refcount_set(&profile->ref_count, 1); 8312 return profile; 8313 } 8314 8315 static struct mlxsw_sp_rif_mac_profile * 8316 mlxsw_sp_rif_mac_profile_find(const struct mlxsw_sp *mlxsw_sp, const char *mac) 8317 { 8318 struct mlxsw_sp_router *router = mlxsw_sp->router; 8319 struct mlxsw_sp_rif_mac_profile *profile; 8320 int id; 8321 8322 idr_for_each_entry(&router->rif_mac_profiles_idr, profile, id) { 8323 if (ether_addr_equal_masked(profile->mac_prefix, mac, 8324 mlxsw_sp->mac_mask)) 8325 return profile; 8326 } 8327 8328 return NULL; 8329 } 8330 8331 static u64 mlxsw_sp_rif_mac_profiles_occ_get(void *priv) 8332 { 8333 const struct mlxsw_sp *mlxsw_sp = priv; 8334 8335 return atomic_read(&mlxsw_sp->router->rif_mac_profiles_count); 8336 } 8337 8338 static u64 mlxsw_sp_rifs_occ_get(void *priv) 8339 { 8340 const struct mlxsw_sp *mlxsw_sp = priv; 8341 8342 return atomic_read(&mlxsw_sp->router->rifs_count); 8343 } 8344 8345 static struct mlxsw_sp_rif_mac_profile * 8346 mlxsw_sp_rif_mac_profile_create(struct mlxsw_sp *mlxsw_sp, const char *mac, 8347 struct netlink_ext_ack *extack) 8348 { 8349 struct mlxsw_sp_rif_mac_profile *profile; 8350 int err; 8351 8352 profile = mlxsw_sp_rif_mac_profile_alloc(mac); 8353 if (!profile) 8354 return ERR_PTR(-ENOMEM); 8355 8356 err = mlxsw_sp_rif_mac_profile_index_alloc(mlxsw_sp, profile, extack); 8357 if (err) 8358 goto profile_index_alloc_err; 8359 8360 atomic_inc(&mlxsw_sp->router->rif_mac_profiles_count); 8361 return profile; 8362 8363 profile_index_alloc_err: 8364 kfree(profile); 8365 return ERR_PTR(err); 8366 } 8367 8368 static void mlxsw_sp_rif_mac_profile_destroy(struct mlxsw_sp *mlxsw_sp, 8369 u8 mac_profile) 8370 { 8371 struct mlxsw_sp_rif_mac_profile *profile; 8372 8373 atomic_dec(&mlxsw_sp->router->rif_mac_profiles_count); 8374 profile = mlxsw_sp_rif_mac_profile_index_free(mlxsw_sp, mac_profile); 8375 kfree(profile); 8376 } 8377 8378 static int mlxsw_sp_rif_mac_profile_get(struct mlxsw_sp *mlxsw_sp, 8379 const char *mac, u8 *p_mac_profile, 8380 struct netlink_ext_ack *extack) 8381 { 8382 struct mlxsw_sp_rif_mac_profile *profile; 8383 8384 profile = mlxsw_sp_rif_mac_profile_find(mlxsw_sp, mac); 8385 if (profile) { 8386 refcount_inc(&profile->ref_count); 8387 goto out; 8388 } 8389 8390 profile = mlxsw_sp_rif_mac_profile_create(mlxsw_sp, mac, extack); 8391 if (IS_ERR(profile)) 8392 return PTR_ERR(profile); 8393 8394 out: 8395 *p_mac_profile = profile->id; 8396 return 0; 8397 } 8398 8399 static void mlxsw_sp_rif_mac_profile_put(struct mlxsw_sp *mlxsw_sp, 8400 u8 mac_profile) 8401 { 8402 struct mlxsw_sp_rif_mac_profile *profile; 8403 8404 profile = idr_find(&mlxsw_sp->router->rif_mac_profiles_idr, 8405 mac_profile); 8406 if (WARN_ON(!profile)) 8407 return; 8408 8409 if (!refcount_dec_and_test(&profile->ref_count)) 8410 return; 8411 8412 mlxsw_sp_rif_mac_profile_destroy(mlxsw_sp, mac_profile); 8413 } 8414 8415 static bool mlxsw_sp_rif_mac_profile_is_shared(const struct mlxsw_sp_rif *rif) 8416 { 8417 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 8418 struct mlxsw_sp_rif_mac_profile *profile; 8419 8420 profile 
= idr_find(&mlxsw_sp->router->rif_mac_profiles_idr, 8421 rif->mac_profile_id); 8422 if (WARN_ON(!profile)) 8423 return false; 8424 8425 return refcount_read(&profile->ref_count) > 1; 8426 } 8427 8428 static int mlxsw_sp_rif_mac_profile_edit(struct mlxsw_sp_rif *rif, 8429 const char *new_mac) 8430 { 8431 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 8432 struct mlxsw_sp_rif_mac_profile *profile; 8433 8434 profile = idr_find(&mlxsw_sp->router->rif_mac_profiles_idr, 8435 rif->mac_profile_id); 8436 if (WARN_ON(!profile)) 8437 return -EINVAL; 8438 8439 ether_addr_copy(profile->mac_prefix, new_mac); 8440 return 0; 8441 } 8442 8443 static int 8444 mlxsw_sp_rif_mac_profile_replace(struct mlxsw_sp *mlxsw_sp, 8445 struct mlxsw_sp_rif *rif, 8446 const char *new_mac, 8447 struct netlink_ext_ack *extack) 8448 { 8449 u8 mac_profile; 8450 int err; 8451 8452 if (!mlxsw_sp_rif_mac_profile_is_shared(rif) && 8453 !mlxsw_sp_rif_mac_profile_find(mlxsw_sp, new_mac)) 8454 return mlxsw_sp_rif_mac_profile_edit(rif, new_mac); 8455 8456 err = mlxsw_sp_rif_mac_profile_get(mlxsw_sp, new_mac, 8457 &mac_profile, extack); 8458 if (err) 8459 return err; 8460 8461 mlxsw_sp_rif_mac_profile_put(mlxsw_sp, rif->mac_profile_id); 8462 rif->mac_profile_id = mac_profile; 8463 return 0; 8464 } 8465 8466 static int 8467 __mlxsw_sp_port_vlan_router_join(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan, 8468 struct net_device *l3_dev, 8469 struct netlink_ext_ack *extack) 8470 { 8471 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port; 8472 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp; 8473 struct mlxsw_sp_rif_params params = { 8474 .dev = l3_dev, 8475 }; 8476 u16 vid = mlxsw_sp_port_vlan->vid; 8477 struct mlxsw_sp_rif *rif; 8478 struct mlxsw_sp_fid *fid; 8479 int err; 8480 8481 mlxsw_sp_rif_subport_params_init(¶ms, mlxsw_sp_port_vlan); 8482 rif = mlxsw_sp_rif_subport_get(mlxsw_sp, ¶ms, extack); 8483 if (IS_ERR(rif)) 8484 return PTR_ERR(rif); 8485 8486 /* FID was already created, just take a reference */ 8487 fid = rif->ops->fid_get(rif, extack); 8488 err = mlxsw_sp_fid_port_vid_map(fid, mlxsw_sp_port, vid); 8489 if (err) 8490 goto err_fid_port_vid_map; 8491 8492 err = mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, false); 8493 if (err) 8494 goto err_port_vid_learning_set; 8495 8496 err = mlxsw_sp_port_vid_stp_set(mlxsw_sp_port, vid, 8497 BR_STATE_FORWARDING); 8498 if (err) 8499 goto err_port_vid_stp_set; 8500 8501 mlxsw_sp_port_vlan->fid = fid; 8502 8503 return 0; 8504 8505 err_port_vid_stp_set: 8506 mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, true); 8507 err_port_vid_learning_set: 8508 mlxsw_sp_fid_port_vid_unmap(fid, mlxsw_sp_port, vid); 8509 err_fid_port_vid_map: 8510 mlxsw_sp_fid_put(fid); 8511 mlxsw_sp_rif_subport_put(rif); 8512 return err; 8513 } 8514 8515 static void 8516 __mlxsw_sp_port_vlan_router_leave(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan) 8517 { 8518 struct mlxsw_sp_port *mlxsw_sp_port = mlxsw_sp_port_vlan->mlxsw_sp_port; 8519 struct mlxsw_sp_fid *fid = mlxsw_sp_port_vlan->fid; 8520 struct mlxsw_sp_rif *rif = mlxsw_sp_fid_rif(fid); 8521 u16 vid = mlxsw_sp_port_vlan->vid; 8522 8523 if (WARN_ON(mlxsw_sp_fid_type(fid) != MLXSW_SP_FID_TYPE_RFID)) 8524 return; 8525 8526 mlxsw_sp_port_vlan->fid = NULL; 8527 mlxsw_sp_port_vid_stp_set(mlxsw_sp_port, vid, BR_STATE_BLOCKING); 8528 mlxsw_sp_port_vid_learning_set(mlxsw_sp_port, vid, true); 8529 mlxsw_sp_fid_port_vid_unmap(fid, mlxsw_sp_port, vid); 8530 mlxsw_sp_fid_put(fid); 8531 mlxsw_sp_rif_subport_put(rif); 8532 } 8533 8534 int 8535 
mlxsw_sp_port_vlan_router_join(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan, 8536 struct net_device *l3_dev, 8537 struct netlink_ext_ack *extack) 8538 { 8539 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port_vlan->mlxsw_sp_port->mlxsw_sp; 8540 struct mlxsw_sp_rif *rif; 8541 int err = 0; 8542 8543 mutex_lock(&mlxsw_sp->router->lock); 8544 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev); 8545 if (!rif) 8546 goto out; 8547 8548 err = __mlxsw_sp_port_vlan_router_join(mlxsw_sp_port_vlan, l3_dev, 8549 extack); 8550 out: 8551 mutex_unlock(&mlxsw_sp->router->lock); 8552 return err; 8553 } 8554 8555 void 8556 mlxsw_sp_port_vlan_router_leave(struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan) 8557 { 8558 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port_vlan->mlxsw_sp_port->mlxsw_sp; 8559 8560 mutex_lock(&mlxsw_sp->router->lock); 8561 __mlxsw_sp_port_vlan_router_leave(mlxsw_sp_port_vlan); 8562 mutex_unlock(&mlxsw_sp->router->lock); 8563 } 8564 8565 static int mlxsw_sp_inetaddr_port_vlan_event(struct net_device *l3_dev, 8566 struct net_device *port_dev, 8567 unsigned long event, u16 vid, 8568 struct netlink_ext_ack *extack) 8569 { 8570 struct mlxsw_sp_port *mlxsw_sp_port = netdev_priv(port_dev); 8571 struct mlxsw_sp_port_vlan *mlxsw_sp_port_vlan; 8572 8573 mlxsw_sp_port_vlan = mlxsw_sp_port_vlan_find_by_vid(mlxsw_sp_port, vid); 8574 if (WARN_ON(!mlxsw_sp_port_vlan)) 8575 return -EINVAL; 8576 8577 switch (event) { 8578 case NETDEV_UP: 8579 return __mlxsw_sp_port_vlan_router_join(mlxsw_sp_port_vlan, 8580 l3_dev, extack); 8581 case NETDEV_DOWN: 8582 __mlxsw_sp_port_vlan_router_leave(mlxsw_sp_port_vlan); 8583 break; 8584 } 8585 8586 return 0; 8587 } 8588 8589 static int mlxsw_sp_inetaddr_port_event(struct net_device *port_dev, 8590 unsigned long event, 8591 struct netlink_ext_ack *extack) 8592 { 8593 if (netif_is_any_bridge_port(port_dev) || netif_is_lag_port(port_dev)) 8594 return 0; 8595 8596 return mlxsw_sp_inetaddr_port_vlan_event(port_dev, port_dev, event, 8597 MLXSW_SP_DEFAULT_VID, extack); 8598 } 8599 8600 static int __mlxsw_sp_inetaddr_lag_event(struct net_device *l3_dev, 8601 struct net_device *lag_dev, 8602 unsigned long event, u16 vid, 8603 struct netlink_ext_ack *extack) 8604 { 8605 struct net_device *port_dev; 8606 struct list_head *iter; 8607 int err; 8608 8609 netdev_for_each_lower_dev(lag_dev, port_dev, iter) { 8610 if (mlxsw_sp_port_dev_check(port_dev)) { 8611 err = mlxsw_sp_inetaddr_port_vlan_event(l3_dev, 8612 port_dev, 8613 event, vid, 8614 extack); 8615 if (err) 8616 return err; 8617 } 8618 } 8619 8620 return 0; 8621 } 8622 8623 static int mlxsw_sp_inetaddr_lag_event(struct net_device *lag_dev, 8624 unsigned long event, 8625 struct netlink_ext_ack *extack) 8626 { 8627 if (netif_is_bridge_port(lag_dev)) 8628 return 0; 8629 8630 return __mlxsw_sp_inetaddr_lag_event(lag_dev, lag_dev, event, 8631 MLXSW_SP_DEFAULT_VID, extack); 8632 } 8633 8634 static int mlxsw_sp_inetaddr_bridge_event(struct mlxsw_sp *mlxsw_sp, 8635 struct net_device *l3_dev, 8636 unsigned long event, 8637 struct netlink_ext_ack *extack) 8638 { 8639 struct mlxsw_sp_rif_params params = { 8640 .dev = l3_dev, 8641 }; 8642 struct mlxsw_sp_rif *rif; 8643 8644 switch (event) { 8645 case NETDEV_UP: 8646 if (netif_is_bridge_master(l3_dev) && br_vlan_enabled(l3_dev)) { 8647 u16 proto; 8648 8649 br_vlan_get_proto(l3_dev, &proto); 8650 if (proto == ETH_P_8021AD) { 8651 NL_SET_ERR_MSG_MOD(extack, "Adding an IP address to 802.1ad bridge is not supported"); 8652 return -EOPNOTSUPP; 8653 } 8654 } 8655 rif = mlxsw_sp_rif_create(mlxsw_sp, ¶ms, extack); 
8656 if (IS_ERR(rif)) 8657 return PTR_ERR(rif); 8658 break; 8659 case NETDEV_DOWN: 8660 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev); 8661 mlxsw_sp_rif_destroy(rif); 8662 break; 8663 } 8664 8665 return 0; 8666 } 8667 8668 static int mlxsw_sp_inetaddr_vlan_event(struct mlxsw_sp *mlxsw_sp, 8669 struct net_device *vlan_dev, 8670 unsigned long event, 8671 struct netlink_ext_ack *extack) 8672 { 8673 struct net_device *real_dev = vlan_dev_real_dev(vlan_dev); 8674 u16 vid = vlan_dev_vlan_id(vlan_dev); 8675 8676 if (netif_is_bridge_port(vlan_dev)) 8677 return 0; 8678 8679 if (mlxsw_sp_port_dev_check(real_dev)) 8680 return mlxsw_sp_inetaddr_port_vlan_event(vlan_dev, real_dev, 8681 event, vid, extack); 8682 else if (netif_is_lag_master(real_dev)) 8683 return __mlxsw_sp_inetaddr_lag_event(vlan_dev, real_dev, event, 8684 vid, extack); 8685 else if (netif_is_bridge_master(real_dev) && br_vlan_enabled(real_dev)) 8686 return mlxsw_sp_inetaddr_bridge_event(mlxsw_sp, vlan_dev, event, 8687 extack); 8688 8689 return 0; 8690 } 8691 8692 static bool mlxsw_sp_rif_macvlan_is_vrrp4(const u8 *mac) 8693 { 8694 u8 vrrp4[ETH_ALEN] = { 0x00, 0x00, 0x5e, 0x00, 0x01, 0x00 }; 8695 u8 mask[ETH_ALEN] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0x00 }; 8696 8697 return ether_addr_equal_masked(mac, vrrp4, mask); 8698 } 8699 8700 static bool mlxsw_sp_rif_macvlan_is_vrrp6(const u8 *mac) 8701 { 8702 u8 vrrp6[ETH_ALEN] = { 0x00, 0x00, 0x5e, 0x00, 0x02, 0x00 }; 8703 u8 mask[ETH_ALEN] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0x00 }; 8704 8705 return ether_addr_equal_masked(mac, vrrp6, mask); 8706 } 8707 8708 static int mlxsw_sp_rif_vrrp_op(struct mlxsw_sp *mlxsw_sp, u16 rif_index, 8709 const u8 *mac, bool adding) 8710 { 8711 char ritr_pl[MLXSW_REG_RITR_LEN]; 8712 u8 vrrp_id = adding ? mac[5] : 0; 8713 int err; 8714 8715 if (!mlxsw_sp_rif_macvlan_is_vrrp4(mac) && 8716 !mlxsw_sp_rif_macvlan_is_vrrp6(mac)) 8717 return 0; 8718 8719 mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index); 8720 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 8721 if (err) 8722 return err; 8723 8724 if (mlxsw_sp_rif_macvlan_is_vrrp4(mac)) 8725 mlxsw_reg_ritr_if_vrrp_id_ipv4_set(ritr_pl, vrrp_id); 8726 else 8727 mlxsw_reg_ritr_if_vrrp_id_ipv6_set(ritr_pl, vrrp_id); 8728 8729 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 8730 } 8731 8732 static int mlxsw_sp_rif_macvlan_add(struct mlxsw_sp *mlxsw_sp, 8733 const struct net_device *macvlan_dev, 8734 struct netlink_ext_ack *extack) 8735 { 8736 struct macvlan_dev *vlan = netdev_priv(macvlan_dev); 8737 struct mlxsw_sp_rif *rif; 8738 int err; 8739 8740 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, vlan->lowerdev); 8741 if (!rif) { 8742 NL_SET_ERR_MSG_MOD(extack, "macvlan is only supported on top of router interfaces"); 8743 return -EOPNOTSUPP; 8744 } 8745 8746 err = mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr, 8747 mlxsw_sp_fid_index(rif->fid), true); 8748 if (err) 8749 return err; 8750 8751 err = mlxsw_sp_rif_vrrp_op(mlxsw_sp, rif->rif_index, 8752 macvlan_dev->dev_addr, true); 8753 if (err) 8754 goto err_rif_vrrp_add; 8755 8756 /* Make sure the bridge driver does not have this MAC pointing at 8757 * some other port. 
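 * Otherwise the bridge would keep forwarding packets destined to the
 * macvlan to that port instead of letting them be routed.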
8758 */ 8759 if (rif->ops->fdb_del) 8760 rif->ops->fdb_del(rif, macvlan_dev->dev_addr); 8761 8762 return 0; 8763 8764 err_rif_vrrp_add: 8765 mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr, 8766 mlxsw_sp_fid_index(rif->fid), false); 8767 return err; 8768 } 8769 8770 static void __mlxsw_sp_rif_macvlan_del(struct mlxsw_sp *mlxsw_sp, 8771 const struct net_device *macvlan_dev) 8772 { 8773 struct macvlan_dev *vlan = netdev_priv(macvlan_dev); 8774 struct mlxsw_sp_rif *rif; 8775 8776 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, vlan->lowerdev); 8777 /* If we do not have a RIF, then we already took care of 8778 * removing the macvlan's MAC during RIF deletion. 8779 */ 8780 if (!rif) 8781 return; 8782 mlxsw_sp_rif_vrrp_op(mlxsw_sp, rif->rif_index, macvlan_dev->dev_addr, 8783 false); 8784 mlxsw_sp_rif_fdb_op(mlxsw_sp, macvlan_dev->dev_addr, 8785 mlxsw_sp_fid_index(rif->fid), false); 8786 } 8787 8788 void mlxsw_sp_rif_macvlan_del(struct mlxsw_sp *mlxsw_sp, 8789 const struct net_device *macvlan_dev) 8790 { 8791 mutex_lock(&mlxsw_sp->router->lock); 8792 __mlxsw_sp_rif_macvlan_del(mlxsw_sp, macvlan_dev); 8793 mutex_unlock(&mlxsw_sp->router->lock); 8794 } 8795 8796 static int mlxsw_sp_inetaddr_macvlan_event(struct mlxsw_sp *mlxsw_sp, 8797 struct net_device *macvlan_dev, 8798 unsigned long event, 8799 struct netlink_ext_ack *extack) 8800 { 8801 switch (event) { 8802 case NETDEV_UP: 8803 return mlxsw_sp_rif_macvlan_add(mlxsw_sp, macvlan_dev, extack); 8804 case NETDEV_DOWN: 8805 __mlxsw_sp_rif_macvlan_del(mlxsw_sp, macvlan_dev); 8806 break; 8807 } 8808 8809 return 0; 8810 } 8811 8812 static int __mlxsw_sp_inetaddr_event(struct mlxsw_sp *mlxsw_sp, 8813 struct net_device *dev, 8814 unsigned long event, 8815 struct netlink_ext_ack *extack) 8816 { 8817 if (mlxsw_sp_port_dev_check(dev)) 8818 return mlxsw_sp_inetaddr_port_event(dev, event, extack); 8819 else if (netif_is_lag_master(dev)) 8820 return mlxsw_sp_inetaddr_lag_event(dev, event, extack); 8821 else if (netif_is_bridge_master(dev)) 8822 return mlxsw_sp_inetaddr_bridge_event(mlxsw_sp, dev, event, 8823 extack); 8824 else if (is_vlan_dev(dev)) 8825 return mlxsw_sp_inetaddr_vlan_event(mlxsw_sp, dev, event, 8826 extack); 8827 else if (netif_is_macvlan(dev)) 8828 return mlxsw_sp_inetaddr_macvlan_event(mlxsw_sp, dev, event, 8829 extack); 8830 else 8831 return 0; 8832 } 8833 8834 static int mlxsw_sp_inetaddr_event(struct notifier_block *nb, 8835 unsigned long event, void *ptr) 8836 { 8837 struct in_ifaddr *ifa = (struct in_ifaddr *) ptr; 8838 struct net_device *dev = ifa->ifa_dev->dev; 8839 struct mlxsw_sp_router *router; 8840 struct mlxsw_sp_rif *rif; 8841 int err = 0; 8842 8843 /* NETDEV_UP event is handled by mlxsw_sp_inetaddr_valid_event */ 8844 if (event == NETDEV_UP) 8845 return NOTIFY_DONE; 8846 8847 router = container_of(nb, struct mlxsw_sp_router, inetaddr_nb); 8848 mutex_lock(&router->lock); 8849 rif = mlxsw_sp_rif_find_by_dev(router->mlxsw_sp, dev); 8850 if (!mlxsw_sp_rif_should_config(rif, dev, event)) 8851 goto out; 8852 8853 err = __mlxsw_sp_inetaddr_event(router->mlxsw_sp, dev, event, NULL); 8854 out: 8855 mutex_unlock(&router->lock); 8856 return notifier_from_errno(err); 8857 } 8858 8859 int mlxsw_sp_inetaddr_valid_event(struct notifier_block *unused, 8860 unsigned long event, void *ptr) 8861 { 8862 struct in_validator_info *ivi = (struct in_validator_info *) ptr; 8863 struct net_device *dev = ivi->ivi_dev->dev; 8864 struct mlxsw_sp *mlxsw_sp; 8865 struct mlxsw_sp_rif *rif; 8866 int err = 0; 8867 8868 mlxsw_sp = mlxsw_sp_lower_get(dev); 8869 if 
(!mlxsw_sp) 8870 return NOTIFY_DONE; 8871 8872 mutex_lock(&mlxsw_sp->router->lock); 8873 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 8874 if (!mlxsw_sp_rif_should_config(rif, dev, event)) 8875 goto out; 8876 8877 err = __mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, ivi->extack); 8878 out: 8879 mutex_unlock(&mlxsw_sp->router->lock); 8880 return notifier_from_errno(err); 8881 } 8882 8883 struct mlxsw_sp_inet6addr_event_work { 8884 struct work_struct work; 8885 struct mlxsw_sp *mlxsw_sp; 8886 struct net_device *dev; 8887 unsigned long event; 8888 }; 8889 8890 static void mlxsw_sp_inet6addr_event_work(struct work_struct *work) 8891 { 8892 struct mlxsw_sp_inet6addr_event_work *inet6addr_work = 8893 container_of(work, struct mlxsw_sp_inet6addr_event_work, work); 8894 struct mlxsw_sp *mlxsw_sp = inet6addr_work->mlxsw_sp; 8895 struct net_device *dev = inet6addr_work->dev; 8896 unsigned long event = inet6addr_work->event; 8897 struct mlxsw_sp_rif *rif; 8898 8899 rtnl_lock(); 8900 mutex_lock(&mlxsw_sp->router->lock); 8901 8902 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 8903 if (!mlxsw_sp_rif_should_config(rif, dev, event)) 8904 goto out; 8905 8906 __mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, NULL); 8907 out: 8908 mutex_unlock(&mlxsw_sp->router->lock); 8909 rtnl_unlock(); 8910 dev_put(dev); 8911 kfree(inet6addr_work); 8912 } 8913 8914 /* Called with rcu_read_lock() */ 8915 static int mlxsw_sp_inet6addr_event(struct notifier_block *nb, 8916 unsigned long event, void *ptr) 8917 { 8918 struct inet6_ifaddr *if6 = (struct inet6_ifaddr *) ptr; 8919 struct mlxsw_sp_inet6addr_event_work *inet6addr_work; 8920 struct net_device *dev = if6->idev->dev; 8921 struct mlxsw_sp_router *router; 8922 8923 /* NETDEV_UP event is handled by mlxsw_sp_inet6addr_valid_event */ 8924 if (event == NETDEV_UP) 8925 return NOTIFY_DONE; 8926 8927 inet6addr_work = kzalloc(sizeof(*inet6addr_work), GFP_ATOMIC); 8928 if (!inet6addr_work) 8929 return NOTIFY_BAD; 8930 8931 router = container_of(nb, struct mlxsw_sp_router, inet6addr_nb); 8932 INIT_WORK(&inet6addr_work->work, mlxsw_sp_inet6addr_event_work); 8933 inet6addr_work->mlxsw_sp = router->mlxsw_sp; 8934 inet6addr_work->dev = dev; 8935 inet6addr_work->event = event; 8936 dev_hold(dev); 8937 mlxsw_core_schedule_work(&inet6addr_work->work); 8938 8939 return NOTIFY_DONE; 8940 } 8941 8942 int mlxsw_sp_inet6addr_valid_event(struct notifier_block *unused, 8943 unsigned long event, void *ptr) 8944 { 8945 struct in6_validator_info *i6vi = (struct in6_validator_info *) ptr; 8946 struct net_device *dev = i6vi->i6vi_dev->dev; 8947 struct mlxsw_sp *mlxsw_sp; 8948 struct mlxsw_sp_rif *rif; 8949 int err = 0; 8950 8951 mlxsw_sp = mlxsw_sp_lower_get(dev); 8952 if (!mlxsw_sp) 8953 return NOTIFY_DONE; 8954 8955 mutex_lock(&mlxsw_sp->router->lock); 8956 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 8957 if (!mlxsw_sp_rif_should_config(rif, dev, event)) 8958 goto out; 8959 8960 err = __mlxsw_sp_inetaddr_event(mlxsw_sp, dev, event, i6vi->extack); 8961 out: 8962 mutex_unlock(&mlxsw_sp->router->lock); 8963 return notifier_from_errno(err); 8964 } 8965 8966 static int mlxsw_sp_rif_edit(struct mlxsw_sp *mlxsw_sp, u16 rif_index, 8967 const char *mac, int mtu, u8 mac_profile) 8968 { 8969 char ritr_pl[MLXSW_REG_RITR_LEN]; 8970 int err; 8971 8972 mlxsw_reg_ritr_rif_pack(ritr_pl, rif_index); 8973 err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 8974 if (err) 8975 return err; 8976 8977 mlxsw_reg_ritr_mtu_set(ritr_pl, mtu); 8978 mlxsw_reg_ritr_if_mac_memcpy_to(ritr_pl, mac); 8979 
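/* Write the entry queried above back with the updated MTU, MAC and
 * MAC profile; the create operation on a RIF index that is already
 * in use edits the existing entry in place.
 */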
mlxsw_reg_ritr_if_mac_profile_id_set(ritr_pl, mac_profile); 8980 mlxsw_reg_ritr_op_set(ritr_pl, MLXSW_REG_RITR_RIF_CREATE); 8981 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 8982 } 8983 8984 static int 8985 mlxsw_sp_router_port_change_event(struct mlxsw_sp *mlxsw_sp, 8986 struct mlxsw_sp_rif *rif, 8987 struct netlink_ext_ack *extack) 8988 { 8989 struct net_device *dev = rif->dev; 8990 u8 old_mac_profile; 8991 u16 fid_index; 8992 int err; 8993 8994 fid_index = mlxsw_sp_fid_index(rif->fid); 8995 8996 err = mlxsw_sp_rif_fdb_op(mlxsw_sp, rif->addr, fid_index, false); 8997 if (err) 8998 return err; 8999 9000 old_mac_profile = rif->mac_profile_id; 9001 err = mlxsw_sp_rif_mac_profile_replace(mlxsw_sp, rif, dev->dev_addr, 9002 extack); 9003 if (err) 9004 goto err_rif_mac_profile_replace; 9005 9006 err = mlxsw_sp_rif_edit(mlxsw_sp, rif->rif_index, dev->dev_addr, 9007 dev->mtu, rif->mac_profile_id); 9008 if (err) 9009 goto err_rif_edit; 9010 9011 err = mlxsw_sp_rif_fdb_op(mlxsw_sp, dev->dev_addr, fid_index, true); 9012 if (err) 9013 goto err_rif_fdb_op; 9014 9015 if (rif->mtu != dev->mtu) { 9016 struct mlxsw_sp_vr *vr; 9017 int i; 9018 9019 /* The RIF is relevant only to its mr_table instance, as unlike 9020 * unicast routing, in multicast routing a RIF cannot be shared 9021 * between several multicast routing tables. 9022 */ 9023 vr = &mlxsw_sp->router->vrs[rif->vr_id]; 9024 for (i = 0; i < MLXSW_SP_L3_PROTO_MAX; i++) 9025 mlxsw_sp_mr_rif_mtu_update(vr->mr_table[i], 9026 rif, dev->mtu); 9027 } 9028 9029 ether_addr_copy(rif->addr, dev->dev_addr); 9030 rif->mtu = dev->mtu; 9031 9032 netdev_dbg(dev, "Updated RIF=%d\n", rif->rif_index); 9033 9034 return 0; 9035 9036 err_rif_fdb_op: 9037 mlxsw_sp_rif_edit(mlxsw_sp, rif->rif_index, rif->addr, rif->mtu, 9038 old_mac_profile); 9039 err_rif_edit: 9040 mlxsw_sp_rif_mac_profile_replace(mlxsw_sp, rif, rif->addr, extack); 9041 err_rif_mac_profile_replace: 9042 mlxsw_sp_rif_fdb_op(mlxsw_sp, rif->addr, fid_index, true); 9043 return err; 9044 } 9045 9046 static int mlxsw_sp_router_port_pre_changeaddr_event(struct mlxsw_sp_rif *rif, 9047 struct netdev_notifier_pre_changeaddr_info *info) 9048 { 9049 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9050 struct mlxsw_sp_rif_mac_profile *profile; 9051 struct netlink_ext_ack *extack; 9052 u8 max_rif_mac_profiles; 9053 u64 occ; 9054 9055 extack = netdev_notifier_info_to_extack(&info->info); 9056 9057 profile = mlxsw_sp_rif_mac_profile_find(mlxsw_sp, info->dev_addr); 9058 if (profile) 9059 return 0; 9060 9061 max_rif_mac_profiles = mlxsw_sp->router->max_rif_mac_profile; 9062 occ = mlxsw_sp_rif_mac_profiles_occ_get(mlxsw_sp); 9063 if (occ < max_rif_mac_profiles) 9064 return 0; 9065 9066 if (!mlxsw_sp_rif_mac_profile_is_shared(rif)) 9067 return 0; 9068 9069 NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported router interface MAC profiles"); 9070 return -ENOBUFS; 9071 } 9072 9073 static bool mlxsw_sp_is_offload_xstats_event(unsigned long event) 9074 { 9075 switch (event) { 9076 case NETDEV_OFFLOAD_XSTATS_ENABLE: 9077 case NETDEV_OFFLOAD_XSTATS_DISABLE: 9078 case NETDEV_OFFLOAD_XSTATS_REPORT_USED: 9079 case NETDEV_OFFLOAD_XSTATS_REPORT_DELTA: 9080 return true; 9081 } 9082 9083 return false; 9084 } 9085 9086 static int 9087 mlxsw_sp_router_port_offload_xstats_cmd(struct mlxsw_sp_rif *rif, 9088 unsigned long event, 9089 struct netdev_notifier_offload_xstats_info *info) 9090 { 9091 switch (info->type) { 9092 case NETDEV_OFFLOAD_XSTATS_TYPE_L3: 9093 break; 9094 default: 9095 return 0; 9096 } 9097 9098 switch 
(event) { 9099 case NETDEV_OFFLOAD_XSTATS_ENABLE: 9100 return mlxsw_sp_router_port_l3_stats_enable(rif); 9101 case NETDEV_OFFLOAD_XSTATS_DISABLE: 9102 mlxsw_sp_router_port_l3_stats_disable(rif); 9103 return 0; 9104 case NETDEV_OFFLOAD_XSTATS_REPORT_USED: 9105 mlxsw_sp_router_port_l3_stats_report_used(rif, info); 9106 return 0; 9107 case NETDEV_OFFLOAD_XSTATS_REPORT_DELTA: 9108 return mlxsw_sp_router_port_l3_stats_report_delta(rif, info); 9109 } 9110 9111 WARN_ON_ONCE(1); 9112 return 0; 9113 } 9114 9115 static int 9116 mlxsw_sp_netdevice_offload_xstats_cmd(struct mlxsw_sp *mlxsw_sp, 9117 struct net_device *dev, 9118 unsigned long event, 9119 struct netdev_notifier_offload_xstats_info *info) 9120 { 9121 struct mlxsw_sp_rif *rif; 9122 9123 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 9124 if (!rif) 9125 return 0; 9126 9127 return mlxsw_sp_router_port_offload_xstats_cmd(rif, event, info); 9128 } 9129 9130 static bool mlxsw_sp_is_router_event(unsigned long event) 9131 { 9132 switch (event) { 9133 case NETDEV_PRE_CHANGEADDR: 9134 case NETDEV_CHANGEADDR: 9135 case NETDEV_CHANGEMTU: 9136 return true; 9137 default: 9138 return false; 9139 } 9140 } 9141 9142 static int mlxsw_sp_netdevice_router_port_event(struct net_device *dev, 9143 unsigned long event, void *ptr) 9144 { 9145 struct netlink_ext_ack *extack = netdev_notifier_info_to_extack(ptr); 9146 struct mlxsw_sp *mlxsw_sp; 9147 struct mlxsw_sp_rif *rif; 9148 9149 mlxsw_sp = mlxsw_sp_lower_get(dev); 9150 if (!mlxsw_sp) 9151 return 0; 9152 9153 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); 9154 if (!rif) 9155 return 0; 9156 9157 switch (event) { 9158 case NETDEV_CHANGEMTU: 9159 case NETDEV_CHANGEADDR: 9160 return mlxsw_sp_router_port_change_event(mlxsw_sp, rif, extack); 9161 case NETDEV_PRE_CHANGEADDR: 9162 return mlxsw_sp_router_port_pre_changeaddr_event(rif, ptr); 9163 default: 9164 WARN_ON_ONCE(1); 9165 break; 9166 } 9167 9168 return 0; 9169 } 9170 9171 static int mlxsw_sp_port_vrf_join(struct mlxsw_sp *mlxsw_sp, 9172 struct net_device *l3_dev, 9173 struct netlink_ext_ack *extack) 9174 { 9175 struct mlxsw_sp_rif *rif; 9176 9177 /* If netdev is already associated with a RIF, then we need to 9178 * destroy it and create a new one with the new virtual router ID. 9179 */ 9180 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev); 9181 if (rif) 9182 __mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_DOWN, 9183 extack); 9184 9185 return __mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_UP, extack); 9186 } 9187 9188 static void mlxsw_sp_port_vrf_leave(struct mlxsw_sp *mlxsw_sp, 9189 struct net_device *l3_dev) 9190 { 9191 struct mlxsw_sp_rif *rif; 9192 9193 rif = mlxsw_sp_rif_find_by_dev(mlxsw_sp, l3_dev); 9194 if (!rif) 9195 return; 9196 __mlxsw_sp_inetaddr_event(mlxsw_sp, l3_dev, NETDEV_DOWN, NULL); 9197 } 9198 9199 static bool mlxsw_sp_is_vrf_event(unsigned long event, void *ptr) 9200 { 9201 struct netdev_notifier_changeupper_info *info = ptr; 9202 9203 if (event != NETDEV_PRECHANGEUPPER && event != NETDEV_CHANGEUPPER) 9204 return false; 9205 return netif_is_l3_master(info->upper_dev); 9206 } 9207 9208 static int 9209 mlxsw_sp_netdevice_vrf_event(struct net_device *l3_dev, unsigned long event, 9210 struct netdev_notifier_changeupper_info *info) 9211 { 9212 struct mlxsw_sp *mlxsw_sp = mlxsw_sp_lower_get(l3_dev); 9213 int err = 0; 9214 9215 /* We do not create a RIF for a macvlan, but only use it to 9216 * direct more MAC addresses to the router. 
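 * Hence there is nothing to do when a macvlan is enslaved to, or
 * released from, a VRF.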
9217 */ 9218 if (!mlxsw_sp || netif_is_macvlan(l3_dev)) 9219 return 0; 9220 9221 switch (event) { 9222 case NETDEV_PRECHANGEUPPER: 9223 break; 9224 case NETDEV_CHANGEUPPER: 9225 if (info->linking) { 9226 struct netlink_ext_ack *extack; 9227 9228 extack = netdev_notifier_info_to_extack(&info->info); 9229 err = mlxsw_sp_port_vrf_join(mlxsw_sp, l3_dev, extack); 9230 } else { 9231 mlxsw_sp_port_vrf_leave(mlxsw_sp, l3_dev); 9232 } 9233 break; 9234 } 9235 9236 return err; 9237 } 9238 9239 static int mlxsw_sp_router_netdevice_event(struct notifier_block *nb, 9240 unsigned long event, void *ptr) 9241 { 9242 struct net_device *dev = netdev_notifier_info_to_dev(ptr); 9243 struct mlxsw_sp_router *router; 9244 struct mlxsw_sp *mlxsw_sp; 9245 int err = 0; 9246 9247 router = container_of(nb, struct mlxsw_sp_router, netdevice_nb); 9248 mlxsw_sp = router->mlxsw_sp; 9249 9250 mutex_lock(&mlxsw_sp->router->lock); 9251 9252 if (mlxsw_sp_is_offload_xstats_event(event)) 9253 err = mlxsw_sp_netdevice_offload_xstats_cmd(mlxsw_sp, dev, 9254 event, ptr); 9255 else if (mlxsw_sp_netdev_is_ipip_ol(mlxsw_sp, dev)) 9256 err = mlxsw_sp_netdevice_ipip_ol_event(mlxsw_sp, dev, 9257 event, ptr); 9258 else if (mlxsw_sp_netdev_is_ipip_ul(mlxsw_sp, dev)) 9259 err = mlxsw_sp_netdevice_ipip_ul_event(mlxsw_sp, dev, 9260 event, ptr); 9261 else if (mlxsw_sp_is_router_event(event)) 9262 err = mlxsw_sp_netdevice_router_port_event(dev, event, ptr); 9263 else if (mlxsw_sp_is_vrf_event(event, ptr)) 9264 err = mlxsw_sp_netdevice_vrf_event(dev, event, ptr); 9265 9266 mutex_unlock(&mlxsw_sp->router->lock); 9267 9268 return notifier_from_errno(err); 9269 } 9270 9271 static int __mlxsw_sp_rif_macvlan_flush(struct net_device *dev, 9272 struct netdev_nested_priv *priv) 9273 { 9274 struct mlxsw_sp_rif *rif = (struct mlxsw_sp_rif *)priv->data; 9275 9276 if (!netif_is_macvlan(dev)) 9277 return 0; 9278 9279 return mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, dev->dev_addr, 9280 mlxsw_sp_fid_index(rif->fid), false); 9281 } 9282 9283 static int mlxsw_sp_rif_macvlan_flush(struct mlxsw_sp_rif *rif) 9284 { 9285 struct netdev_nested_priv priv = { 9286 .data = (void *)rif, 9287 }; 9288 9289 if (!netif_is_macvlan_port(rif->dev)) 9290 return 0; 9291 9292 netdev_warn(rif->dev, "Router interface is deleted. Upper macvlans will not work\n");
9293 return netdev_walk_all_upper_dev_rcu(rif->dev, 9294 __mlxsw_sp_rif_macvlan_flush, &priv); 9295 } 9296 9297 static void mlxsw_sp_rif_subport_setup(struct mlxsw_sp_rif *rif, 9298 const struct mlxsw_sp_rif_params *params) 9299 { 9300 struct mlxsw_sp_rif_subport *rif_subport; 9301 9302 rif_subport = mlxsw_sp_rif_subport_rif(rif); 9303 refcount_set(&rif_subport->ref_count, 1); 9304 rif_subport->vid = params->vid; 9305 rif_subport->lag = params->lag; 9306 if (params->lag) 9307 rif_subport->lag_id = params->lag_id; 9308 else 9309 rif_subport->system_port = params->system_port; 9310 } 9311 9312 static int mlxsw_sp_rif_subport_op(struct mlxsw_sp_rif *rif, bool enable) 9313 { 9314 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9315 struct mlxsw_sp_rif_subport *rif_subport; 9316 char ritr_pl[MLXSW_REG_RITR_LEN]; 9317 u16 efid; 9318 9319 rif_subport = mlxsw_sp_rif_subport_rif(rif); 9320 mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_SP_IF, 9321 rif->rif_index, rif->vr_id, rif->dev->mtu); 9322 mlxsw_reg_ritr_mac_pack(ritr_pl, rif->dev->dev_addr); 9323 mlxsw_reg_ritr_if_mac_profile_id_set(ritr_pl, rif->mac_profile_id); 9324 efid = mlxsw_sp_fid_index(rif->fid); 9325 mlxsw_reg_ritr_sp_if_pack(ritr_pl, rif_subport->lag, 9326 rif_subport->lag ? rif_subport->lag_id : 9327 rif_subport->system_port, 9328 efid, 0); 9329 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 9330 } 9331 9332 static int mlxsw_sp_rif_subport_configure(struct mlxsw_sp_rif *rif, 9333 struct netlink_ext_ack *extack) 9334 { 9335 u8 mac_profile; 9336 int err; 9337 9338 err = mlxsw_sp_rif_mac_profile_get(rif->mlxsw_sp, rif->addr, 9339 &mac_profile, extack); 9340 if (err) 9341 return err; 9342 rif->mac_profile_id = mac_profile; 9343 9344 err = mlxsw_sp_rif_subport_op(rif, true); 9345 if (err) 9346 goto err_rif_subport_op; 9347 9348 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9349 mlxsw_sp_fid_index(rif->fid), true); 9350 if (err) 9351 goto err_rif_fdb_op; 9352 9353 err = mlxsw_sp_fid_rif_set(rif->fid, rif); 9354 if (err) 9355 goto err_fid_rif_set; 9356 9357 return 0; 9358 9359 err_fid_rif_set: 9360 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9361 mlxsw_sp_fid_index(rif->fid), false); 9362 err_rif_fdb_op: 9363 mlxsw_sp_rif_subport_op(rif, false); 9364 err_rif_subport_op: 9365 mlxsw_sp_rif_mac_profile_put(rif->mlxsw_sp, mac_profile); 9366 return err; 9367 } 9368 9369 static void mlxsw_sp_rif_subport_deconfigure(struct mlxsw_sp_rif *rif) 9370 { 9371 struct mlxsw_sp_fid *fid = rif->fid; 9372 9373 mlxsw_sp_fid_rif_unset(fid); 9374 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9375 mlxsw_sp_fid_index(fid), false); 9376 mlxsw_sp_rif_macvlan_flush(rif); 9377 mlxsw_sp_rif_subport_op(rif, false); 9378 mlxsw_sp_rif_mac_profile_put(rif->mlxsw_sp, rif->mac_profile_id); 9379 } 9380 9381 static struct mlxsw_sp_fid * 9382 mlxsw_sp_rif_subport_fid_get(struct mlxsw_sp_rif *rif, 9383 struct netlink_ext_ack *extack) 9384 { 9385 return mlxsw_sp_fid_rfid_get(rif->mlxsw_sp, rif->rif_index); 9386 } 9387 9388 static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_subport_ops = { 9389 .type = MLXSW_SP_RIF_TYPE_SUBPORT, 9390 .rif_size = sizeof(struct mlxsw_sp_rif_subport), 9391 .setup = mlxsw_sp_rif_subport_setup, 9392 .configure = mlxsw_sp_rif_subport_configure, 9393 .deconfigure = mlxsw_sp_rif_subport_deconfigure, 9394 .fid_get = mlxsw_sp_rif_subport_fid_get, 9395 }; 9396 9397 static int mlxsw_sp_rif_fid_op(struct mlxsw_sp_rif *rif, u16 fid, bool enable) 9397 { 9398 enum
mlxsw_reg_ritr_if_type type = MLXSW_REG_RITR_FID_IF; 9400 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9401 char ritr_pl[MLXSW_REG_RITR_LEN]; 9402 9403 mlxsw_reg_ritr_pack(ritr_pl, enable, type, rif->rif_index, rif->vr_id, 9404 rif->dev->mtu); 9405 mlxsw_reg_ritr_mac_pack(ritr_pl, rif->dev->dev_addr); 9406 mlxsw_reg_ritr_if_mac_profile_id_set(ritr_pl, rif->mac_profile_id); 9407 mlxsw_reg_ritr_fid_if_fid_set(ritr_pl, fid); 9408 9409 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 9410 } 9411 9412 u16 mlxsw_sp_router_port(const struct mlxsw_sp *mlxsw_sp) 9413 { 9414 return mlxsw_core_max_ports(mlxsw_sp->core) + 1; 9415 } 9416 9417 static int mlxsw_sp_rif_fid_configure(struct mlxsw_sp_rif *rif, 9418 struct netlink_ext_ack *extack) 9419 { 9420 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9421 u16 fid_index = mlxsw_sp_fid_index(rif->fid); 9422 u8 mac_profile; 9423 int err; 9424 9425 err = mlxsw_sp_rif_mac_profile_get(mlxsw_sp, rif->addr, 9426 &mac_profile, extack); 9427 if (err) 9428 return err; 9429 rif->mac_profile_id = mac_profile; 9430 9431 err = mlxsw_sp_rif_fid_op(rif, fid_index, true); 9432 if (err) 9433 goto err_rif_fid_op; 9434 9435 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC, 9436 mlxsw_sp_router_port(mlxsw_sp), true); 9437 if (err) 9438 goto err_fid_mc_flood_set; 9439 9440 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC, 9441 mlxsw_sp_router_port(mlxsw_sp), true); 9442 if (err) 9443 goto err_fid_bc_flood_set; 9444 9445 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9446 mlxsw_sp_fid_index(rif->fid), true); 9447 if (err) 9448 goto err_rif_fdb_op; 9449 9450 err = mlxsw_sp_fid_rif_set(rif->fid, rif); 9451 if (err) 9452 goto err_fid_rif_set; 9453 9454 return 0; 9455 9456 err_fid_rif_set: 9457 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9458 mlxsw_sp_fid_index(rif->fid), false); 9459 err_rif_fdb_op: 9460 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC, 9461 mlxsw_sp_router_port(mlxsw_sp), false); 9462 err_fid_bc_flood_set: 9463 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC, 9464 mlxsw_sp_router_port(mlxsw_sp), false); 9465 err_fid_mc_flood_set: 9466 mlxsw_sp_rif_fid_op(rif, fid_index, false); 9467 err_rif_fid_op: 9468 mlxsw_sp_rif_mac_profile_put(mlxsw_sp, mac_profile); 9469 return err; 9470 } 9471 9472 static void mlxsw_sp_rif_fid_deconfigure(struct mlxsw_sp_rif *rif) 9473 { 9474 u16 fid_index = mlxsw_sp_fid_index(rif->fid); 9475 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9476 struct mlxsw_sp_fid *fid = rif->fid; 9477 9478 mlxsw_sp_fid_rif_unset(fid); 9479 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9480 mlxsw_sp_fid_index(fid), false); 9481 mlxsw_sp_rif_macvlan_flush(rif); 9482 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC, 9483 mlxsw_sp_router_port(mlxsw_sp), false); 9484 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC, 9485 mlxsw_sp_router_port(mlxsw_sp), false); 9486 mlxsw_sp_rif_fid_op(rif, fid_index, false); 9487 mlxsw_sp_rif_mac_profile_put(rif->mlxsw_sp, rif->mac_profile_id); 9488 } 9489 9490 static struct mlxsw_sp_fid * 9491 mlxsw_sp_rif_fid_fid_get(struct mlxsw_sp_rif *rif, 9492 struct netlink_ext_ack *extack) 9493 { 9494 return mlxsw_sp_fid_8021d_get(rif->mlxsw_sp, rif->dev->ifindex); 9495 } 9496 9497 static void mlxsw_sp_rif_fid_fdb_del(struct mlxsw_sp_rif *rif, const char *mac) 9498 { 9499 struct switchdev_notifier_fdb_info info = {}; 9500 struct net_device *dev; 9501 9502 dev = br_fdb_find_port(rif->dev, mac, 0); 9503 if (!dev) 9504 return; 9505 9506 
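/* The MAC is still present in the bridge's FDB; notify the bridge
 * driver to delete the stale entry.
 */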
info.addr = mac; 9507 info.vid = 0; 9508 call_switchdev_notifiers(SWITCHDEV_FDB_DEL_TO_BRIDGE, dev, &info.info, 9509 NULL); 9510 } 9511 9512 static const struct mlxsw_sp_rif_ops mlxsw_sp_rif_fid_ops = { 9513 .type = MLXSW_SP_RIF_TYPE_FID, 9514 .rif_size = sizeof(struct mlxsw_sp_rif), 9515 .configure = mlxsw_sp_rif_fid_configure, 9516 .deconfigure = mlxsw_sp_rif_fid_deconfigure, 9517 .fid_get = mlxsw_sp_rif_fid_fid_get, 9518 .fdb_del = mlxsw_sp_rif_fid_fdb_del, 9519 }; 9520 9521 static struct mlxsw_sp_fid * 9522 mlxsw_sp_rif_vlan_fid_get(struct mlxsw_sp_rif *rif, 9523 struct netlink_ext_ack *extack) 9524 { 9525 struct net_device *br_dev; 9526 u16 vid; 9527 int err; 9528 9529 if (is_vlan_dev(rif->dev)) { 9530 vid = vlan_dev_vlan_id(rif->dev); 9531 br_dev = vlan_dev_real_dev(rif->dev); 9532 if (WARN_ON(!netif_is_bridge_master(br_dev))) 9533 return ERR_PTR(-EINVAL); 9534 } else { 9535 err = br_vlan_get_pvid(rif->dev, &vid); 9536 if (err < 0 || !vid) { 9537 NL_SET_ERR_MSG_MOD(extack, "Couldn't determine bridge PVID"); 9538 return ERR_PTR(-EINVAL); 9539 } 9540 } 9541 9542 return mlxsw_sp_fid_8021q_get(rif->mlxsw_sp, vid); 9543 } 9544 9545 static void mlxsw_sp_rif_vlan_fdb_del(struct mlxsw_sp_rif *rif, const char *mac) 9546 { 9547 struct switchdev_notifier_fdb_info info = {}; 9548 u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid); 9549 struct net_device *br_dev; 9550 struct net_device *dev; 9551 9552 br_dev = is_vlan_dev(rif->dev) ? vlan_dev_real_dev(rif->dev) : rif->dev; 9553 dev = br_fdb_find_port(br_dev, mac, vid); 9554 if (!dev) 9555 return; 9556 9557 info.addr = mac; 9558 info.vid = vid; 9559 call_switchdev_notifiers(SWITCHDEV_FDB_DEL_TO_BRIDGE, dev, &info.info, 9560 NULL); 9561 } 9562 9563 static int mlxsw_sp_rif_vlan_op(struct mlxsw_sp_rif *rif, u16 vid, u16 efid, 9564 bool enable) 9565 { 9566 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9567 char ritr_pl[MLXSW_REG_RITR_LEN]; 9568 9569 mlxsw_reg_ritr_vlan_if_pack(ritr_pl, enable, rif->rif_index, rif->vr_id, 9570 rif->dev->mtu, rif->dev->dev_addr, 9571 rif->mac_profile_id, vid, efid); 9572 9573 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 9574 } 9575 9576 static int mlxsw_sp_rif_vlan_configure(struct mlxsw_sp_rif *rif, u16 efid, 9577 struct netlink_ext_ack *extack) 9578 { 9579 u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid); 9580 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9581 u8 mac_profile; 9582 int err; 9583 9584 err = mlxsw_sp_rif_mac_profile_get(mlxsw_sp, rif->addr, 9585 &mac_profile, extack); 9586 if (err) 9587 return err; 9588 rif->mac_profile_id = mac_profile; 9589 9590 err = mlxsw_sp_rif_vlan_op(rif, vid, efid, true); 9591 if (err) 9592 goto err_rif_vlan_fid_op; 9593 9594 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC, 9595 mlxsw_sp_router_port(mlxsw_sp), true); 9596 if (err) 9597 goto err_fid_mc_flood_set; 9598 9599 err = mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC, 9600 mlxsw_sp_router_port(mlxsw_sp), true); 9601 if (err) 9602 goto err_fid_bc_flood_set; 9603 9604 err = mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9605 mlxsw_sp_fid_index(rif->fid), true); 9606 if (err) 9607 goto err_rif_fdb_op; 9608 9609 err = mlxsw_sp_fid_rif_set(rif->fid, rif); 9610 if (err) 9611 goto err_fid_rif_set; 9612 9613 return 0; 9614 9615 err_fid_rif_set: 9616 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9617 mlxsw_sp_fid_index(rif->fid), false); 9618 err_rif_fdb_op: 9619 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC, 9620 mlxsw_sp_router_port(mlxsw_sp), false); 9621 err_fid_bc_flood_set: 
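/* Revert the MC flood configuration performed during setup. */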
9622 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC, 9623 mlxsw_sp_router_port(mlxsw_sp), false); 9624 err_fid_mc_flood_set: 9625 mlxsw_sp_rif_vlan_op(rif, vid, 0, false); 9626 err_rif_vlan_fid_op: 9627 mlxsw_sp_rif_mac_profile_put(mlxsw_sp, mac_profile); 9628 return err; 9629 } 9630 9631 static void mlxsw_sp_rif_vlan_deconfigure(struct mlxsw_sp_rif *rif) 9632 { 9633 u16 vid = mlxsw_sp_fid_8021q_vid(rif->fid); 9634 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9635 9636 mlxsw_sp_fid_rif_unset(rif->fid); 9637 mlxsw_sp_rif_fdb_op(rif->mlxsw_sp, rif->dev->dev_addr, 9638 mlxsw_sp_fid_index(rif->fid), false); 9639 mlxsw_sp_rif_macvlan_flush(rif); 9640 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_BC, 9641 mlxsw_sp_router_port(mlxsw_sp), false); 9642 mlxsw_sp_fid_flood_set(rif->fid, MLXSW_SP_FLOOD_TYPE_MC, 9643 mlxsw_sp_router_port(mlxsw_sp), false); 9644 mlxsw_sp_rif_vlan_op(rif, vid, 0, false); 9645 mlxsw_sp_rif_mac_profile_put(rif->mlxsw_sp, rif->mac_profile_id); 9646 } 9647 9648 static int mlxsw_sp1_rif_vlan_configure(struct mlxsw_sp_rif *rif, 9649 struct netlink_ext_ack *extack) 9650 { 9651 return mlxsw_sp_rif_vlan_configure(rif, 0, extack); 9652 } 9653 9654 static const struct mlxsw_sp_rif_ops mlxsw_sp1_rif_vlan_ops = { 9655 .type = MLXSW_SP_RIF_TYPE_VLAN, 9656 .rif_size = sizeof(struct mlxsw_sp_rif), 9657 .configure = mlxsw_sp1_rif_vlan_configure, 9658 .deconfigure = mlxsw_sp_rif_vlan_deconfigure, 9659 .fid_get = mlxsw_sp_rif_vlan_fid_get, 9660 .fdb_del = mlxsw_sp_rif_vlan_fdb_del, 9661 }; 9662 9663 static int mlxsw_sp2_rif_vlan_configure(struct mlxsw_sp_rif *rif, 9664 struct netlink_ext_ack *extack) 9665 { 9666 u16 efid = mlxsw_sp_fid_index(rif->fid); 9667 9668 return mlxsw_sp_rif_vlan_configure(rif, efid, extack); 9669 } 9670 9671 static const struct mlxsw_sp_rif_ops mlxsw_sp2_rif_vlan_ops = { 9672 .type = MLXSW_SP_RIF_TYPE_VLAN, 9673 .rif_size = sizeof(struct mlxsw_sp_rif), 9674 .configure = mlxsw_sp2_rif_vlan_configure, 9675 .deconfigure = mlxsw_sp_rif_vlan_deconfigure, 9676 .fid_get = mlxsw_sp_rif_vlan_fid_get, 9677 .fdb_del = mlxsw_sp_rif_vlan_fdb_del, 9678 }; 9679 9680 static struct mlxsw_sp_rif_ipip_lb * 9681 mlxsw_sp_rif_ipip_lb_rif(struct mlxsw_sp_rif *rif) 9682 { 9683 return container_of(rif, struct mlxsw_sp_rif_ipip_lb, common); 9684 } 9685 9686 static void 9687 mlxsw_sp_rif_ipip_lb_setup(struct mlxsw_sp_rif *rif, 9688 const struct mlxsw_sp_rif_params *params) 9689 { 9690 struct mlxsw_sp_rif_params_ipip_lb *params_lb; 9691 struct mlxsw_sp_rif_ipip_lb *rif_lb; 9692 9693 params_lb = container_of(params, struct mlxsw_sp_rif_params_ipip_lb, 9694 common); 9695 rif_lb = mlxsw_sp_rif_ipip_lb_rif(rif); 9696 rif_lb->lb_config = params_lb->lb_config; 9697 } 9698 9699 static int 9700 mlxsw_sp1_rif_ipip_lb_configure(struct mlxsw_sp_rif *rif, 9701 struct netlink_ext_ack *extack) 9702 { 9703 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif); 9704 u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(rif->dev); 9705 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9706 struct mlxsw_sp_vr *ul_vr; 9707 int err; 9708 9709 ul_vr = mlxsw_sp_vr_get(mlxsw_sp, ul_tb_id, NULL); 9710 if (IS_ERR(ul_vr)) 9711 return PTR_ERR(ul_vr); 9712 9713 err = mlxsw_sp_rif_ipip_lb_op(lb_rif, ul_vr->id, 0, true); 9714 if (err) 9715 goto err_loopback_op; 9716 9717 lb_rif->ul_vr_id = ul_vr->id; 9718 lb_rif->ul_rif_id = 0; 9719 ++ul_vr->rif_count; 9720 return 0; 9721 9722 err_loopback_op: 9723 mlxsw_sp_vr_put(mlxsw_sp, ul_vr); 9724 return err; 9725 } 9726 9727 static void 
mlxsw_sp1_rif_ipip_lb_deconfigure(struct mlxsw_sp_rif *rif) 9728 { 9729 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif); 9730 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9731 struct mlxsw_sp_vr *ul_vr; 9732 9733 ul_vr = &mlxsw_sp->router->vrs[lb_rif->ul_vr_id]; 9734 mlxsw_sp_rif_ipip_lb_op(lb_rif, ul_vr->id, 0, false); 9735 9736 --ul_vr->rif_count; 9737 mlxsw_sp_vr_put(mlxsw_sp, ul_vr); 9738 } 9739 9740 static const struct mlxsw_sp_rif_ops mlxsw_sp1_rif_ipip_lb_ops = { 9741 .type = MLXSW_SP_RIF_TYPE_IPIP_LB, 9742 .rif_size = sizeof(struct mlxsw_sp_rif_ipip_lb), 9743 .setup = mlxsw_sp_rif_ipip_lb_setup, 9744 .configure = mlxsw_sp1_rif_ipip_lb_configure, 9745 .deconfigure = mlxsw_sp1_rif_ipip_lb_deconfigure, 9746 }; 9747 9748 static const struct mlxsw_sp_rif_ops *mlxsw_sp1_rif_ops_arr[] = { 9749 [MLXSW_SP_RIF_TYPE_SUBPORT] = &mlxsw_sp_rif_subport_ops, 9750 [MLXSW_SP_RIF_TYPE_VLAN] = &mlxsw_sp1_rif_vlan_ops, 9751 [MLXSW_SP_RIF_TYPE_FID] = &mlxsw_sp_rif_fid_ops, 9752 [MLXSW_SP_RIF_TYPE_IPIP_LB] = &mlxsw_sp1_rif_ipip_lb_ops, 9753 }; 9754 9755 static int 9756 mlxsw_sp_rif_ipip_lb_ul_rif_op(struct mlxsw_sp_rif *ul_rif, bool enable) 9757 { 9758 struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp; 9759 char ritr_pl[MLXSW_REG_RITR_LEN]; 9760 9761 mlxsw_reg_ritr_pack(ritr_pl, enable, MLXSW_REG_RITR_LOOPBACK_IF, 9762 ul_rif->rif_index, ul_rif->vr_id, IP_MAX_MTU); 9763 mlxsw_reg_ritr_loopback_protocol_set(ritr_pl, 9764 MLXSW_REG_RITR_LOOPBACK_GENERIC); 9765 9766 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ritr), ritr_pl); 9767 } 9768 9769 static struct mlxsw_sp_rif * 9770 mlxsw_sp_ul_rif_create(struct mlxsw_sp *mlxsw_sp, struct mlxsw_sp_vr *vr, 9771 struct netlink_ext_ack *extack) 9772 { 9773 struct mlxsw_sp_rif *ul_rif; 9774 u16 rif_index; 9775 int err; 9776 9777 err = mlxsw_sp_rif_index_alloc(mlxsw_sp, &rif_index); 9778 if (err) { 9779 NL_SET_ERR_MSG_MOD(extack, "Exceeded number of supported router interfaces"); 9780 return ERR_PTR(err); 9781 } 9782 9783 ul_rif = mlxsw_sp_rif_alloc(sizeof(*ul_rif), rif_index, vr->id, NULL); 9784 if (!ul_rif) 9785 return ERR_PTR(-ENOMEM); 9786 9787 mlxsw_sp->router->rifs[rif_index] = ul_rif; 9788 ul_rif->mlxsw_sp = mlxsw_sp; 9789 err = mlxsw_sp_rif_ipip_lb_ul_rif_op(ul_rif, true); 9790 if (err) 9791 goto ul_rif_op_err; 9792 9793 atomic_inc(&mlxsw_sp->router->rifs_count); 9794 return ul_rif; 9795 9796 ul_rif_op_err: 9797 mlxsw_sp->router->rifs[rif_index] = NULL; 9798 kfree(ul_rif); 9799 return ERR_PTR(err); 9800 } 9801 9802 static void mlxsw_sp_ul_rif_destroy(struct mlxsw_sp_rif *ul_rif) 9803 { 9804 struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp; 9805 9806 atomic_dec(&mlxsw_sp->router->rifs_count); 9807 mlxsw_sp_rif_ipip_lb_ul_rif_op(ul_rif, false); 9808 mlxsw_sp->router->rifs[ul_rif->rif_index] = NULL; 9809 kfree(ul_rif); 9810 } 9811 9812 static struct mlxsw_sp_rif * 9813 mlxsw_sp_ul_rif_get(struct mlxsw_sp *mlxsw_sp, u32 tb_id, 9814 struct netlink_ext_ack *extack) 9815 { 9816 struct mlxsw_sp_vr *vr; 9817 int err; 9818 9819 vr = mlxsw_sp_vr_get(mlxsw_sp, tb_id, extack); 9820 if (IS_ERR(vr)) 9821 return ERR_CAST(vr); 9822 9823 if (refcount_inc_not_zero(&vr->ul_rif_refcnt)) 9824 return vr->ul_rif; 9825 9826 vr->ul_rif = mlxsw_sp_ul_rif_create(mlxsw_sp, vr, extack); 9827 if (IS_ERR(vr->ul_rif)) { 9828 err = PTR_ERR(vr->ul_rif); 9829 goto err_ul_rif_create; 9830 } 9831 9832 vr->rif_count++; 9833 refcount_set(&vr->ul_rif_refcnt, 1); 9834 9835 return vr->ul_rif; 9836 9837 err_ul_rif_create: 9838 mlxsw_sp_vr_put(mlxsw_sp, vr); 9839 return ERR_PTR(err); 9840 } 
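/* The underlay RIF is reference-counted per-VR: the first getter above
 * creates it and holds the VR, later getters only bump ul_rif_refcnt, and
 * the last put below destroys it and releases the VR.
 */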
9841 9842 static void mlxsw_sp_ul_rif_put(struct mlxsw_sp_rif *ul_rif) 9843 { 9844 struct mlxsw_sp *mlxsw_sp = ul_rif->mlxsw_sp; 9845 struct mlxsw_sp_vr *vr; 9846 9847 vr = &mlxsw_sp->router->vrs[ul_rif->vr_id]; 9848 9849 if (!refcount_dec_and_test(&vr->ul_rif_refcnt)) 9850 return; 9851 9852 vr->rif_count--; 9853 mlxsw_sp_ul_rif_destroy(ul_rif); 9854 mlxsw_sp_vr_put(mlxsw_sp, vr); 9855 } 9856 9857 int mlxsw_sp_router_ul_rif_get(struct mlxsw_sp *mlxsw_sp, u32 ul_tb_id, 9858 u16 *ul_rif_index) 9859 { 9860 struct mlxsw_sp_rif *ul_rif; 9861 int err = 0; 9862 9863 mutex_lock(&mlxsw_sp->router->lock); 9864 ul_rif = mlxsw_sp_ul_rif_get(mlxsw_sp, ul_tb_id, NULL); 9865 if (IS_ERR(ul_rif)) { 9866 err = PTR_ERR(ul_rif); 9867 goto out; 9868 } 9869 *ul_rif_index = ul_rif->rif_index; 9870 out: 9871 mutex_unlock(&mlxsw_sp->router->lock); 9872 return err; 9873 } 9874 9875 void mlxsw_sp_router_ul_rif_put(struct mlxsw_sp *mlxsw_sp, u16 ul_rif_index) 9876 { 9877 struct mlxsw_sp_rif *ul_rif; 9878 9879 mutex_lock(&mlxsw_sp->router->lock); 9880 ul_rif = mlxsw_sp->router->rifs[ul_rif_index]; 9881 if (WARN_ON(!ul_rif)) 9882 goto out; 9883 9884 mlxsw_sp_ul_rif_put(ul_rif); 9885 out: 9886 mutex_unlock(&mlxsw_sp->router->lock); 9887 } 9888 9889 static int 9890 mlxsw_sp2_rif_ipip_lb_configure(struct mlxsw_sp_rif *rif, 9891 struct netlink_ext_ack *extack) 9892 { 9893 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif); 9894 u32 ul_tb_id = mlxsw_sp_ipip_dev_ul_tb_id(rif->dev); 9895 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9896 struct mlxsw_sp_rif *ul_rif; 9897 int err; 9898 9899 ul_rif = mlxsw_sp_ul_rif_get(mlxsw_sp, ul_tb_id, NULL); 9900 if (IS_ERR(ul_rif)) 9901 return PTR_ERR(ul_rif); 9902 9903 err = mlxsw_sp_rif_ipip_lb_op(lb_rif, 0, ul_rif->rif_index, true); 9904 if (err) 9905 goto err_loopback_op; 9906 9907 lb_rif->ul_vr_id = 0; 9908 lb_rif->ul_rif_id = ul_rif->rif_index; 9909 9910 return 0; 9911 9912 err_loopback_op: 9913 mlxsw_sp_ul_rif_put(ul_rif); 9914 return err; 9915 } 9916 9917 static void mlxsw_sp2_rif_ipip_lb_deconfigure(struct mlxsw_sp_rif *rif) 9918 { 9919 struct mlxsw_sp_rif_ipip_lb *lb_rif = mlxsw_sp_rif_ipip_lb_rif(rif); 9920 struct mlxsw_sp *mlxsw_sp = rif->mlxsw_sp; 9921 struct mlxsw_sp_rif *ul_rif; 9922 9923 ul_rif = mlxsw_sp_rif_by_index(mlxsw_sp, lb_rif->ul_rif_id); 9924 mlxsw_sp_rif_ipip_lb_op(lb_rif, 0, lb_rif->ul_rif_id, false); 9925 mlxsw_sp_ul_rif_put(ul_rif); 9926 } 9927 9928 static const struct mlxsw_sp_rif_ops mlxsw_sp2_rif_ipip_lb_ops = { 9929 .type = MLXSW_SP_RIF_TYPE_IPIP_LB, 9930 .rif_size = sizeof(struct mlxsw_sp_rif_ipip_lb), 9931 .setup = mlxsw_sp_rif_ipip_lb_setup, 9932 .configure = mlxsw_sp2_rif_ipip_lb_configure, 9933 .deconfigure = mlxsw_sp2_rif_ipip_lb_deconfigure, 9934 }; 9935 9936 static const struct mlxsw_sp_rif_ops *mlxsw_sp2_rif_ops_arr[] = { 9937 [MLXSW_SP_RIF_TYPE_SUBPORT] = &mlxsw_sp_rif_subport_ops, 9938 [MLXSW_SP_RIF_TYPE_VLAN] = &mlxsw_sp2_rif_vlan_ops, 9939 [MLXSW_SP_RIF_TYPE_FID] = &mlxsw_sp_rif_fid_ops, 9940 [MLXSW_SP_RIF_TYPE_IPIP_LB] = &mlxsw_sp2_rif_ipip_lb_ops, 9941 }; 9942 9943 static int mlxsw_sp_rifs_init(struct mlxsw_sp *mlxsw_sp) 9944 { 9945 u64 max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); 9946 struct devlink *devlink = priv_to_devlink(mlxsw_sp->core); 9947 struct mlxsw_core *core = mlxsw_sp->core; 9948 9949 if (!MLXSW_CORE_RES_VALID(core, MAX_RIF_MAC_PROFILES)) 9950 return -EIO; 9951 mlxsw_sp->router->max_rif_mac_profile = 9952 MLXSW_CORE_RES_GET(core, MAX_RIF_MAC_PROFILES); 9953 9954 mlxsw_sp->router->rifs = 
kcalloc(max_rifs, 9955 sizeof(struct mlxsw_sp_rif *), 9956 GFP_KERNEL); 9957 if (!mlxsw_sp->router->rifs) 9958 return -ENOMEM; 9959 9960 idr_init(&mlxsw_sp->router->rif_mac_profiles_idr); 9961 atomic_set(&mlxsw_sp->router->rif_mac_profiles_count, 0); 9962 atomic_set(&mlxsw_sp->router->rifs_count, 0); 9963 devl_resource_occ_get_register(devlink, 9964 MLXSW_SP_RESOURCE_RIF_MAC_PROFILES, 9965 mlxsw_sp_rif_mac_profiles_occ_get, 9966 mlxsw_sp); 9967 devl_resource_occ_get_register(devlink, 9968 MLXSW_SP_RESOURCE_RIFS, 9969 mlxsw_sp_rifs_occ_get, 9970 mlxsw_sp); 9971 9972 return 0; 9973 } 9974 9975 static void mlxsw_sp_rifs_fini(struct mlxsw_sp *mlxsw_sp) 9976 { 9977 struct devlink *devlink = priv_to_devlink(mlxsw_sp->core); 9978 int i; 9979 9980 WARN_ON_ONCE(atomic_read(&mlxsw_sp->router->rifs_count)); 9981 for (i = 0; i < MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); i++) 9982 WARN_ON_ONCE(mlxsw_sp->router->rifs[i]); 9983 9984 devl_resource_occ_get_unregister(devlink, MLXSW_SP_RESOURCE_RIFS); 9985 devl_resource_occ_get_unregister(devlink, 9986 MLXSW_SP_RESOURCE_RIF_MAC_PROFILES); 9987 WARN_ON(!idr_is_empty(&mlxsw_sp->router->rif_mac_profiles_idr)); 9988 idr_destroy(&mlxsw_sp->router->rif_mac_profiles_idr); 9989 kfree(mlxsw_sp->router->rifs); 9990 } 9991 9992 static int 9993 mlxsw_sp_ipip_config_tigcr(struct mlxsw_sp *mlxsw_sp) 9994 { 9995 char tigcr_pl[MLXSW_REG_TIGCR_LEN]; 9996 9997 mlxsw_reg_tigcr_pack(tigcr_pl, true, 0); 9998 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(tigcr), tigcr_pl); 9999 } 10000 10001 static int mlxsw_sp_ipips_init(struct mlxsw_sp *mlxsw_sp) 10002 { 10003 int err; 10004 10005 INIT_LIST_HEAD(&mlxsw_sp->router->ipip_list); 10006 10007 err = mlxsw_sp_ipip_ecn_encap_init(mlxsw_sp); 10008 if (err) 10009 return err; 10010 err = mlxsw_sp_ipip_ecn_decap_init(mlxsw_sp); 10011 if (err) 10012 return err; 10013 10014 return mlxsw_sp_ipip_config_tigcr(mlxsw_sp); 10015 } 10016 10017 static int mlxsw_sp1_ipips_init(struct mlxsw_sp *mlxsw_sp) 10018 { 10019 mlxsw_sp->router->ipip_ops_arr = mlxsw_sp1_ipip_ops_arr; 10020 return mlxsw_sp_ipips_init(mlxsw_sp); 10021 } 10022 10023 static int mlxsw_sp2_ipips_init(struct mlxsw_sp *mlxsw_sp) 10024 { 10025 mlxsw_sp->router->ipip_ops_arr = mlxsw_sp2_ipip_ops_arr; 10026 return mlxsw_sp_ipips_init(mlxsw_sp); 10027 } 10028 10029 static void mlxsw_sp_ipips_fini(struct mlxsw_sp *mlxsw_sp) 10030 { 10031 WARN_ON(!list_empty(&mlxsw_sp->router->ipip_list)); 10032 } 10033 10034 static void mlxsw_sp_router_fib_dump_flush(struct notifier_block *nb) 10035 { 10036 struct mlxsw_sp_router *router; 10037 10038 /* Flush pending FIB notifications and then flush the device's 10039 * table before requesting another dump. The FIB notification 10040 * block is unregistered, so no need to take RTNL. 
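	 * mlxsw_core_flush_owq() drains the ordered workqueue on which the
	 * FIB event works are queued.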
10041 */ 10042 mlxsw_core_flush_owq(); 10043 router = container_of(nb, struct mlxsw_sp_router, fib_nb); 10044 mlxsw_sp_router_fib_flush(router->mlxsw_sp); 10045 } 10046 10047 #ifdef CONFIG_IP_ROUTE_MULTIPATH 10048 struct mlxsw_sp_mp_hash_config { 10049 DECLARE_BITMAP(headers, __MLXSW_REG_RECR2_HEADER_CNT); 10050 DECLARE_BITMAP(fields, __MLXSW_REG_RECR2_FIELD_CNT); 10051 DECLARE_BITMAP(inner_headers, __MLXSW_REG_RECR2_HEADER_CNT); 10052 DECLARE_BITMAP(inner_fields, __MLXSW_REG_RECR2_INNER_FIELD_CNT); 10053 bool inc_parsing_depth; 10054 }; 10055 10056 #define MLXSW_SP_MP_HASH_HEADER_SET(_headers, _header) \ 10057 bitmap_set(_headers, MLXSW_REG_RECR2_##_header, 1) 10058 10059 #define MLXSW_SP_MP_HASH_FIELD_SET(_fields, _field) \ 10060 bitmap_set(_fields, MLXSW_REG_RECR2_##_field, 1) 10061 10062 #define MLXSW_SP_MP_HASH_FIELD_RANGE_SET(_fields, _field, _nr) \ 10063 bitmap_set(_fields, MLXSW_REG_RECR2_##_field, _nr) 10064 10065 static void mlxsw_sp_mp_hash_inner_l3(struct mlxsw_sp_mp_hash_config *config) 10066 { 10067 unsigned long *inner_headers = config->inner_headers; 10068 unsigned long *inner_fields = config->inner_fields; 10069 10070 /* IPv4 inner */ 10071 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, IPV4_EN_NOT_TCP_NOT_UDP); 10072 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, IPV4_EN_TCP_UDP); 10073 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(inner_fields, INNER_IPV4_SIP0, 4); 10074 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(inner_fields, INNER_IPV4_DIP0, 4); 10075 /* IPv6 inner */ 10076 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, IPV6_EN_NOT_TCP_NOT_UDP); 10077 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, IPV6_EN_TCP_UDP); 10078 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV6_SIP0_7); 10079 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(inner_fields, INNER_IPV6_SIP8, 8); 10080 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV6_DIP0_7); 10081 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(inner_fields, INNER_IPV6_DIP8, 8); 10082 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV6_NEXT_HEADER); 10083 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV6_FLOW_LABEL); 10084 } 10085 10086 static void mlxsw_sp_mp4_hash_outer_addr(struct mlxsw_sp_mp_hash_config *config) 10087 { 10088 unsigned long *headers = config->headers; 10089 unsigned long *fields = config->fields; 10090 10091 MLXSW_SP_MP_HASH_HEADER_SET(headers, IPV4_EN_NOT_TCP_NOT_UDP); 10092 MLXSW_SP_MP_HASH_HEADER_SET(headers, IPV4_EN_TCP_UDP); 10093 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(fields, IPV4_SIP0, 4); 10094 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(fields, IPV4_DIP0, 4); 10095 } 10096 10097 static void 10098 mlxsw_sp_mp_hash_inner_custom(struct mlxsw_sp_mp_hash_config *config, 10099 u32 hash_fields) 10100 { 10101 unsigned long *inner_headers = config->inner_headers; 10102 unsigned long *inner_fields = config->inner_fields; 10103 10104 /* IPv4 Inner */ 10105 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, IPV4_EN_NOT_TCP_NOT_UDP); 10106 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, IPV4_EN_TCP_UDP); 10107 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_SRC_IP) 10108 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(inner_fields, INNER_IPV4_SIP0, 4); 10109 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_DST_IP) 10110 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(inner_fields, INNER_IPV4_DIP0, 4); 10111 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_IP_PROTO) 10112 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV4_PROTOCOL); 10113 /* IPv6 inner */ 10114 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, IPV6_EN_NOT_TCP_NOT_UDP); 10115 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, IPV6_EN_TCP_UDP); 10116 if (hash_fields & 
FIB_MULTIPATH_HASH_FIELD_INNER_SRC_IP) { 10117 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV6_SIP0_7); 10118 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(inner_fields, INNER_IPV6_SIP8, 8); 10119 } 10120 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_DST_IP) { 10121 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV6_DIP0_7); 10122 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(inner_fields, INNER_IPV6_DIP8, 8); 10123 } 10124 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_IP_PROTO) 10125 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV6_NEXT_HEADER); 10126 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_FLOWLABEL) 10127 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_IPV6_FLOW_LABEL); 10128 /* L4 inner */ 10129 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, TCP_UDP_EN_IPV4); 10130 MLXSW_SP_MP_HASH_HEADER_SET(inner_headers, TCP_UDP_EN_IPV6); 10131 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_SRC_PORT) 10132 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_TCP_UDP_SPORT); 10133 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_DST_PORT) 10134 MLXSW_SP_MP_HASH_FIELD_SET(inner_fields, INNER_TCP_UDP_DPORT); 10135 } 10136 10137 static void mlxsw_sp_mp4_hash_init(struct mlxsw_sp *mlxsw_sp, 10138 struct mlxsw_sp_mp_hash_config *config) 10139 { 10140 struct net *net = mlxsw_sp_net(mlxsw_sp); 10141 unsigned long *headers = config->headers; 10142 unsigned long *fields = config->fields; 10143 u32 hash_fields; 10144 10145 switch (READ_ONCE(net->ipv4.sysctl_fib_multipath_hash_policy)) { 10146 case 0: 10147 mlxsw_sp_mp4_hash_outer_addr(config); 10148 break; 10149 case 1: 10150 mlxsw_sp_mp4_hash_outer_addr(config); 10151 MLXSW_SP_MP_HASH_HEADER_SET(headers, TCP_UDP_EN_IPV4); 10152 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV4_PROTOCOL); 10153 MLXSW_SP_MP_HASH_FIELD_SET(fields, TCP_UDP_SPORT); 10154 MLXSW_SP_MP_HASH_FIELD_SET(fields, TCP_UDP_DPORT); 10155 break; 10156 case 2: 10157 /* Outer */ 10158 mlxsw_sp_mp4_hash_outer_addr(config); 10159 /* Inner */ 10160 mlxsw_sp_mp_hash_inner_l3(config); 10161 break; 10162 case 3: 10163 hash_fields = READ_ONCE(net->ipv4.sysctl_fib_multipath_hash_fields); 10164 /* Outer */ 10165 MLXSW_SP_MP_HASH_HEADER_SET(headers, IPV4_EN_NOT_TCP_NOT_UDP); 10166 MLXSW_SP_MP_HASH_HEADER_SET(headers, IPV4_EN_TCP_UDP); 10167 MLXSW_SP_MP_HASH_HEADER_SET(headers, TCP_UDP_EN_IPV4); 10168 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_SRC_IP) 10169 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(fields, IPV4_SIP0, 4); 10170 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_DST_IP) 10171 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(fields, IPV4_DIP0, 4); 10172 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_IP_PROTO) 10173 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV4_PROTOCOL); 10174 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_SRC_PORT) 10175 MLXSW_SP_MP_HASH_FIELD_SET(fields, TCP_UDP_SPORT); 10176 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_DST_PORT) 10177 MLXSW_SP_MP_HASH_FIELD_SET(fields, TCP_UDP_DPORT); 10178 /* Inner */ 10179 mlxsw_sp_mp_hash_inner_custom(config, hash_fields); 10180 break; 10181 } 10182 } 10183 10184 static void mlxsw_sp_mp6_hash_outer_addr(struct mlxsw_sp_mp_hash_config *config) 10185 { 10186 unsigned long *headers = config->headers; 10187 unsigned long *fields = config->fields; 10188 10189 MLXSW_SP_MP_HASH_HEADER_SET(headers, IPV6_EN_NOT_TCP_NOT_UDP); 10190 MLXSW_SP_MP_HASH_HEADER_SET(headers, IPV6_EN_TCP_UDP); 10191 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_SIP0_7); 10192 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(fields, IPV6_SIP8, 8); 10193 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_DIP0_7); 10194 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(fields, IPV6_DIP8, 8); 
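	/* The two-step enables above follow the RECR2 layout: bytes 0..7 of
	 * an IPv6 address share a single enable bit (IPV6_SIP0_7/IPV6_DIP0_7),
	 * while bytes 8..15 are enabled individually, hence the 8-bit ranges.
	 */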
10195 } 10196 10197 static void mlxsw_sp_mp6_hash_init(struct mlxsw_sp *mlxsw_sp, 10198 struct mlxsw_sp_mp_hash_config *config) 10199 { 10200 u32 hash_fields = ip6_multipath_hash_fields(mlxsw_sp_net(mlxsw_sp)); 10201 unsigned long *headers = config->headers; 10202 unsigned long *fields = config->fields; 10203 10204 switch (ip6_multipath_hash_policy(mlxsw_sp_net(mlxsw_sp))) { 10205 case 0: 10206 mlxsw_sp_mp6_hash_outer_addr(config); 10207 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_NEXT_HEADER); 10208 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_FLOW_LABEL); 10209 break; 10210 case 1: 10211 mlxsw_sp_mp6_hash_outer_addr(config); 10212 MLXSW_SP_MP_HASH_HEADER_SET(headers, TCP_UDP_EN_IPV6); 10213 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_NEXT_HEADER); 10214 MLXSW_SP_MP_HASH_FIELD_SET(fields, TCP_UDP_SPORT); 10215 MLXSW_SP_MP_HASH_FIELD_SET(fields, TCP_UDP_DPORT); 10216 break; 10217 case 2: 10218 /* Outer */ 10219 mlxsw_sp_mp6_hash_outer_addr(config); 10220 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_NEXT_HEADER); 10221 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_FLOW_LABEL); 10222 /* Inner */ 10223 mlxsw_sp_mp_hash_inner_l3(config); 10224 config->inc_parsing_depth = true; 10225 break; 10226 case 3: 10227 /* Outer */ 10228 MLXSW_SP_MP_HASH_HEADER_SET(headers, IPV6_EN_NOT_TCP_NOT_UDP); 10229 MLXSW_SP_MP_HASH_HEADER_SET(headers, IPV6_EN_TCP_UDP); 10230 MLXSW_SP_MP_HASH_HEADER_SET(headers, TCP_UDP_EN_IPV6); 10231 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_SRC_IP) { 10232 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_SIP0_7); 10233 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(fields, IPV6_SIP8, 8); 10234 } 10235 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_DST_IP) { 10236 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_DIP0_7); 10237 MLXSW_SP_MP_HASH_FIELD_RANGE_SET(fields, IPV6_DIP8, 8); 10238 } 10239 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_IP_PROTO) 10240 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_NEXT_HEADER); 10241 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_FLOWLABEL) 10242 MLXSW_SP_MP_HASH_FIELD_SET(fields, IPV6_FLOW_LABEL); 10243 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_SRC_PORT) 10244 MLXSW_SP_MP_HASH_FIELD_SET(fields, TCP_UDP_SPORT); 10245 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_DST_PORT) 10246 MLXSW_SP_MP_HASH_FIELD_SET(fields, TCP_UDP_DPORT); 10247 /* Inner */ 10248 mlxsw_sp_mp_hash_inner_custom(config, hash_fields); 10249 if (hash_fields & FIB_MULTIPATH_HASH_FIELD_INNER_MASK) 10250 config->inc_parsing_depth = true; 10251 break; 10252 } 10253 } 10254 10255 static int mlxsw_sp_mp_hash_parsing_depth_adjust(struct mlxsw_sp *mlxsw_sp, 10256 bool old_inc_parsing_depth, 10257 bool new_inc_parsing_depth) 10258 { 10259 int err; 10260 10261 if (!old_inc_parsing_depth && new_inc_parsing_depth) { 10262 err = mlxsw_sp_parsing_depth_inc(mlxsw_sp); 10263 if (err) 10264 return err; 10265 mlxsw_sp->router->inc_parsing_depth = true; 10266 } else if (old_inc_parsing_depth && !new_inc_parsing_depth) { 10267 mlxsw_sp_parsing_depth_dec(mlxsw_sp); 10268 mlxsw_sp->router->inc_parsing_depth = false; 10269 } 10270 10271 return 0; 10272 } 10273 10274 static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp) 10275 { 10276 bool old_inc_parsing_depth, new_inc_parsing_depth; 10277 struct mlxsw_sp_mp_hash_config config = {}; 10278 char recr2_pl[MLXSW_REG_RECR2_LEN]; 10279 unsigned long bit; 10280 u32 seed; 10281 int err; 10282 10283 seed = jhash(mlxsw_sp->base_mac, sizeof(mlxsw_sp->base_mac), 0); 10284 mlxsw_reg_recr2_pack(recr2_pl, seed); 10285 mlxsw_sp_mp4_hash_init(mlxsw_sp, &config); 10286 mlxsw_sp_mp6_hash_init(mlxsw_sp, &config); 10287 10288 
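	/* Hashing on inner headers requires the parser to look deeper into
	 * the packet than the default parsing depth allows, so adjust the
	 * depth before committing the new RECR2 configuration.
	 */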
old_inc_parsing_depth = mlxsw_sp->router->inc_parsing_depth; 10289 new_inc_parsing_depth = config.inc_parsing_depth; 10290 err = mlxsw_sp_mp_hash_parsing_depth_adjust(mlxsw_sp, 10291 old_inc_parsing_depth, 10292 new_inc_parsing_depth); 10293 if (err) 10294 return err; 10295 10296 for_each_set_bit(bit, config.headers, __MLXSW_REG_RECR2_HEADER_CNT) 10297 mlxsw_reg_recr2_outer_header_enables_set(recr2_pl, bit, 1); 10298 for_each_set_bit(bit, config.fields, __MLXSW_REG_RECR2_FIELD_CNT) 10299 mlxsw_reg_recr2_outer_header_fields_enable_set(recr2_pl, bit, 1); 10300 for_each_set_bit(bit, config.inner_headers, __MLXSW_REG_RECR2_HEADER_CNT) 10301 mlxsw_reg_recr2_inner_header_enables_set(recr2_pl, bit, 1); 10302 for_each_set_bit(bit, config.inner_fields, __MLXSW_REG_RECR2_INNER_FIELD_CNT) 10303 mlxsw_reg_recr2_inner_header_fields_enable_set(recr2_pl, bit, 1); 10304 10305 err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(recr2), recr2_pl); 10306 if (err) 10307 goto err_reg_write; 10308 10309 return 0; 10310 10311 err_reg_write: 10312 mlxsw_sp_mp_hash_parsing_depth_adjust(mlxsw_sp, new_inc_parsing_depth, 10313 old_inc_parsing_depth); 10314 return err; 10315 } 10316 #else 10317 static int mlxsw_sp_mp_hash_init(struct mlxsw_sp *mlxsw_sp) 10318 { 10319 return 0; 10320 } 10321 #endif 10322 10323 static int mlxsw_sp_dscp_init(struct mlxsw_sp *mlxsw_sp) 10324 { 10325 char rdpm_pl[MLXSW_REG_RDPM_LEN]; 10326 unsigned int i; 10327 10328 MLXSW_REG_ZERO(rdpm, rdpm_pl); 10329 10330 /* HW is determining switch priority based on DSCP-bits, but the 10331 * kernel is still doing that based on the ToS. Since there's a 10332 * mismatch in bits we need to make sure to translate the right 10333 * value ToS would observe, skipping the 2 least-significant ECN bits. 10334 */ 10335 for (i = 0; i < MLXSW_REG_RDPM_DSCP_ENTRY_REC_MAX_COUNT; i++) 10336 mlxsw_reg_rdpm_pack(rdpm_pl, i, rt_tos2priority(i << 2)); 10337 10338 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rdpm), rdpm_pl); 10339 } 10340 10341 static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp) 10342 { 10343 struct net *net = mlxsw_sp_net(mlxsw_sp); 10344 char rgcr_pl[MLXSW_REG_RGCR_LEN]; 10345 u64 max_rifs; 10346 bool usp; 10347 10348 if (!MLXSW_CORE_RES_VALID(mlxsw_sp->core, MAX_RIFS)) 10349 return -EIO; 10350 max_rifs = MLXSW_CORE_RES_GET(mlxsw_sp->core, MAX_RIFS); 10351 usp = READ_ONCE(net->ipv4.sysctl_ip_fwd_update_priority); 10352 10353 mlxsw_reg_rgcr_pack(rgcr_pl, true, true); 10354 mlxsw_reg_rgcr_max_router_interfaces_set(rgcr_pl, max_rifs); 10355 mlxsw_reg_rgcr_usp_set(rgcr_pl, usp); 10356 return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rgcr), rgcr_pl); 10357 } 10358 10359 static void __mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp) 10360 { 10361 char rgcr_pl[MLXSW_REG_RGCR_LEN]; 10362 10363 mlxsw_reg_rgcr_pack(rgcr_pl, false, false); 10364 mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rgcr), rgcr_pl); 10365 } 10366 10367 static int mlxsw_sp_lb_rif_init(struct mlxsw_sp *mlxsw_sp) 10368 { 10369 u16 lb_rif_index; 10370 int err; 10371 10372 /* Create a generic loopback RIF associated with the main table 10373 * (default VRF). Any table can be used, but the main table exists 10374 * anyway, so we do not waste resources. 
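	 * The RIF is kept for the router's lifetime and released by
	 * mlxsw_sp_lb_rif_fini().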
10375 */ 10376 err = mlxsw_sp_router_ul_rif_get(mlxsw_sp, RT_TABLE_MAIN, 10377 &lb_rif_index); 10378 if (err) 10379 return err; 10380 10381 mlxsw_sp->router->lb_rif_index = lb_rif_index; 10382 10383 return 0; 10384 } 10385 10386 static void mlxsw_sp_lb_rif_fini(struct mlxsw_sp *mlxsw_sp) 10387 { 10388 mlxsw_sp_router_ul_rif_put(mlxsw_sp, mlxsw_sp->router->lb_rif_index); 10389 } 10390 10391 static int mlxsw_sp1_router_init(struct mlxsw_sp *mlxsw_sp) 10392 { 10393 size_t size_ranges_count = ARRAY_SIZE(mlxsw_sp1_adj_grp_size_ranges); 10394 10395 mlxsw_sp->router->rif_ops_arr = mlxsw_sp1_rif_ops_arr; 10396 mlxsw_sp->router->adj_grp_size_ranges = mlxsw_sp1_adj_grp_size_ranges; 10397 mlxsw_sp->router->adj_grp_size_ranges_count = size_ranges_count; 10398 10399 return 0; 10400 } 10401 10402 const struct mlxsw_sp_router_ops mlxsw_sp1_router_ops = { 10403 .init = mlxsw_sp1_router_init, 10404 .ipips_init = mlxsw_sp1_ipips_init, 10405 }; 10406 10407 static int mlxsw_sp2_router_init(struct mlxsw_sp *mlxsw_sp) 10408 { 10409 size_t size_ranges_count = ARRAY_SIZE(mlxsw_sp2_adj_grp_size_ranges); 10410 10411 mlxsw_sp->router->rif_ops_arr = mlxsw_sp2_rif_ops_arr; 10412 mlxsw_sp->router->adj_grp_size_ranges = mlxsw_sp2_adj_grp_size_ranges; 10413 mlxsw_sp->router->adj_grp_size_ranges_count = size_ranges_count; 10414 10415 return 0; 10416 } 10417 10418 const struct mlxsw_sp_router_ops mlxsw_sp2_router_ops = { 10419 .init = mlxsw_sp2_router_init, 10420 .ipips_init = mlxsw_sp2_ipips_init, 10421 }; 10422 10423 int mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp, 10424 struct netlink_ext_ack *extack) 10425 { 10426 struct mlxsw_sp_router *router; 10427 int err; 10428 10429 router = kzalloc(sizeof(*mlxsw_sp->router), GFP_KERNEL); 10430 if (!router) 10431 return -ENOMEM; 10432 mutex_init(&router->lock); 10433 mlxsw_sp->router = router; 10434 router->mlxsw_sp = mlxsw_sp; 10435 10436 err = mlxsw_sp->router_ops->init(mlxsw_sp); 10437 if (err) 10438 goto err_router_ops_init; 10439 10440 INIT_LIST_HEAD(&mlxsw_sp->router->nh_res_grp_list); 10441 INIT_DELAYED_WORK(&mlxsw_sp->router->nh_grp_activity_dw, 10442 mlxsw_sp_nh_grp_activity_work); 10443 INIT_LIST_HEAD(&mlxsw_sp->router->nexthop_neighs_list); 10444 err = __mlxsw_sp_router_init(mlxsw_sp); 10445 if (err) 10446 goto err_router_init; 10447 10448 err = mlxsw_sp_rifs_init(mlxsw_sp); 10449 if (err) 10450 goto err_rifs_init; 10451 10452 err = mlxsw_sp->router_ops->ipips_init(mlxsw_sp); 10453 if (err) 10454 goto err_ipips_init; 10455 10456 err = rhashtable_init(&mlxsw_sp->router->nexthop_ht, 10457 &mlxsw_sp_nexthop_ht_params); 10458 if (err) 10459 goto err_nexthop_ht_init; 10460 10461 err = rhashtable_init(&mlxsw_sp->router->nexthop_group_ht, 10462 &mlxsw_sp_nexthop_group_ht_params); 10463 if (err) 10464 goto err_nexthop_group_ht_init; 10465 10466 INIT_LIST_HEAD(&mlxsw_sp->router->nexthop_list); 10467 err = mlxsw_sp_lpm_init(mlxsw_sp); 10468 if (err) 10469 goto err_lpm_init; 10470 10471 err = mlxsw_sp_mr_init(mlxsw_sp, &mlxsw_sp_mr_tcam_ops); 10472 if (err) 10473 goto err_mr_init; 10474 10475 err = mlxsw_sp_vrs_init(mlxsw_sp); 10476 if (err) 10477 goto err_vrs_init; 10478 10479 err = mlxsw_sp_lb_rif_init(mlxsw_sp); 10480 if (err) 10481 goto err_lb_rif_init; 10482 10483 err = mlxsw_sp_neigh_init(mlxsw_sp); 10484 if (err) 10485 goto err_neigh_init; 10486 10487 err = mlxsw_sp_mp_hash_init(mlxsw_sp); 10488 if (err) 10489 goto err_mp_hash_init; 10490 10491 err = mlxsw_sp_dscp_init(mlxsw_sp); 10492 if (err) 10493 goto err_dscp_init; 10494 10495 router->inetaddr_nb.notifier_call = 
mlxsw_sp_inetaddr_event; 10496 err = register_inetaddr_notifier(&router->inetaddr_nb); 10497 if (err) 10498 goto err_register_inetaddr_notifier; 10499 10500 router->inet6addr_nb.notifier_call = mlxsw_sp_inet6addr_event; 10501 err = register_inet6addr_notifier(&router->inet6addr_nb); 10502 if (err) 10503 goto err_register_inet6addr_notifier; 10504 10505 mlxsw_sp->router->netevent_nb.notifier_call = 10506 mlxsw_sp_router_netevent_event; 10507 err = register_netevent_notifier(&mlxsw_sp->router->netevent_nb); 10508 if (err) 10509 goto err_register_netevent_notifier; 10510 10511 mlxsw_sp->router->nexthop_nb.notifier_call = 10512 mlxsw_sp_nexthop_obj_event; 10513 err = register_nexthop_notifier(mlxsw_sp_net(mlxsw_sp), 10514 &mlxsw_sp->router->nexthop_nb, 10515 extack); 10516 if (err) 10517 goto err_register_nexthop_notifier; 10518 10519 mlxsw_sp->router->fib_nb.notifier_call = mlxsw_sp_router_fib_event; 10520 err = register_fib_notifier(mlxsw_sp_net(mlxsw_sp), 10521 &mlxsw_sp->router->fib_nb, 10522 mlxsw_sp_router_fib_dump_flush, extack); 10523 if (err) 10524 goto err_register_fib_notifier; 10525 10526 mlxsw_sp->router->netdevice_nb.notifier_call = 10527 mlxsw_sp_router_netdevice_event; 10528 err = register_netdevice_notifier_net(mlxsw_sp_net(mlxsw_sp), 10529 &mlxsw_sp->router->netdevice_nb); 10530 if (err) 10531 goto err_register_netdev_notifier; 10532 10533 return 0; 10534 10535 err_register_netdev_notifier: 10536 unregister_fib_notifier(mlxsw_sp_net(mlxsw_sp), 10537 &mlxsw_sp->router->fib_nb); 10538 err_register_fib_notifier: 10539 unregister_nexthop_notifier(mlxsw_sp_net(mlxsw_sp), 10540 &mlxsw_sp->router->nexthop_nb); 10541 err_register_nexthop_notifier: 10542 unregister_netevent_notifier(&mlxsw_sp->router->netevent_nb); 10543 err_register_netevent_notifier: 10544 unregister_inet6addr_notifier(&router->inet6addr_nb); 10545 err_register_inet6addr_notifier: 10546 unregister_inetaddr_notifier(&router->inetaddr_nb); 10547 err_register_inetaddr_notifier: 10548 mlxsw_core_flush_owq(); 10549 err_dscp_init: 10550 err_mp_hash_init: 10551 mlxsw_sp_neigh_fini(mlxsw_sp); 10552 err_neigh_init: 10553 mlxsw_sp_lb_rif_fini(mlxsw_sp); 10554 err_lb_rif_init: 10555 mlxsw_sp_vrs_fini(mlxsw_sp); 10556 err_vrs_init: 10557 mlxsw_sp_mr_fini(mlxsw_sp); 10558 err_mr_init: 10559 mlxsw_sp_lpm_fini(mlxsw_sp); 10560 err_lpm_init: 10561 rhashtable_destroy(&mlxsw_sp->router->nexthop_group_ht); 10562 err_nexthop_group_ht_init: 10563 rhashtable_destroy(&mlxsw_sp->router->nexthop_ht); 10564 err_nexthop_ht_init: 10565 mlxsw_sp_ipips_fini(mlxsw_sp); 10566 err_ipips_init: 10567 mlxsw_sp_rifs_fini(mlxsw_sp); 10568 err_rifs_init: 10569 __mlxsw_sp_router_fini(mlxsw_sp); 10570 err_router_init: 10571 cancel_delayed_work_sync(&mlxsw_sp->router->nh_grp_activity_dw); 10572 err_router_ops_init: 10573 mutex_destroy(&mlxsw_sp->router->lock); 10574 kfree(mlxsw_sp->router); 10575 return err; 10576 } 10577 10578 void mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp) 10579 { 10580 unregister_netdevice_notifier_net(mlxsw_sp_net(mlxsw_sp), 10581 &mlxsw_sp->router->netdevice_nb); 10582 unregister_fib_notifier(mlxsw_sp_net(mlxsw_sp), 10583 &mlxsw_sp->router->fib_nb); 10584 unregister_nexthop_notifier(mlxsw_sp_net(mlxsw_sp), 10585 &mlxsw_sp->router->nexthop_nb); 10586 unregister_netevent_notifier(&mlxsw_sp->router->netevent_nb); 10587 unregister_inet6addr_notifier(&mlxsw_sp->router->inet6addr_nb); 10588 unregister_inetaddr_notifier(&mlxsw_sp->router->inetaddr_nb); 10589 mlxsw_core_flush_owq(); 10590 mlxsw_sp_neigh_fini(mlxsw_sp); 10591 
mlxsw_sp_lb_rif_fini(mlxsw_sp); 10592 mlxsw_sp_vrs_fini(mlxsw_sp); 10593 mlxsw_sp_mr_fini(mlxsw_sp); 10594 mlxsw_sp_lpm_fini(mlxsw_sp); 10595 rhashtable_destroy(&mlxsw_sp->router->nexthop_group_ht); 10596 rhashtable_destroy(&mlxsw_sp->router->nexthop_ht); 10597 mlxsw_sp_ipips_fini(mlxsw_sp); 10598 mlxsw_sp_rifs_fini(mlxsw_sp); 10599 __mlxsw_sp_router_fini(mlxsw_sp); 10600 cancel_delayed_work_sync(&mlxsw_sp->router->nh_grp_activity_dw); 10601 mutex_destroy(&mlxsw_sp->router->lock); 10602 kfree(mlxsw_sp->router); 10603 } 10604
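
/* Usage sketch (illustrative only, not part of the driver): a caller that
 * needs an underlay RIF in the default VRF would pair the exported helpers
 * the same way mlxsw_sp_lb_rif_init()/mlxsw_sp_lb_rif_fini() do above:
 *
 *	u16 ul_rif_index;
 *	int err;
 *
 *	err = mlxsw_sp_router_ul_rif_get(mlxsw_sp, RT_TABLE_MAIN,
 *					 &ul_rif_index);
 *	if (err)
 *		return err;
 *	...program decap or loopback entries against ul_rif_index...
 *	mlxsw_sp_router_ul_rif_put(mlxsw_sp, ul_rif_index);
 */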