1 /* 2 * drivers/net/team/team.c - Network team device driver 3 * Copyright (c) 2011 Jiri Pirko <jpirko@redhat.com> 4 * 5 * This program is free software; you can redistribute it and/or modify 6 * it under the terms of the GNU General Public License as published by 7 * the Free Software Foundation; either version 2 of the License, or 8 * (at your option) any later version. 9 */ 10 11 #include <linux/kernel.h> 12 #include <linux/types.h> 13 #include <linux/module.h> 14 #include <linux/init.h> 15 #include <linux/slab.h> 16 #include <linux/rcupdate.h> 17 #include <linux/errno.h> 18 #include <linux/ctype.h> 19 #include <linux/notifier.h> 20 #include <linux/netdevice.h> 21 #include <linux/netpoll.h> 22 #include <linux/if_vlan.h> 23 #include <linux/if_arp.h> 24 #include <linux/socket.h> 25 #include <linux/etherdevice.h> 26 #include <linux/rtnetlink.h> 27 #include <net/rtnetlink.h> 28 #include <net/genetlink.h> 29 #include <net/netlink.h> 30 #include <net/sch_generic.h> 31 #include <net/switchdev.h> 32 #include <generated/utsrelease.h> 33 #include <linux/if_team.h> 34 35 #define DRV_NAME "team" 36 37 38 /********** 39 * Helpers 40 **********/ 41 42 #define team_port_exists(dev) (dev->priv_flags & IFF_TEAM_PORT) 43 44 static struct team_port *team_port_get_rcu(const struct net_device *dev) 45 { 46 return rcu_dereference(dev->rx_handler_data); 47 } 48 49 static struct team_port *team_port_get_rtnl(const struct net_device *dev) 50 { 51 struct team_port *port = rtnl_dereference(dev->rx_handler_data); 52 53 return team_port_exists(dev) ? port : NULL; 54 } 55 56 /* 57 * Since the ability to change device address for open port device is tested in 58 * team_port_add, this function can be called without control of return value 59 */ 60 static int __set_port_dev_addr(struct net_device *port_dev, 61 const unsigned char *dev_addr) 62 { 63 struct sockaddr addr; 64 65 memcpy(addr.sa_data, dev_addr, port_dev->addr_len); 66 addr.sa_family = port_dev->type; 67 return dev_set_mac_address(port_dev, &addr); 68 } 69 70 static int team_port_set_orig_dev_addr(struct team_port *port) 71 { 72 return __set_port_dev_addr(port->dev, port->orig.dev_addr); 73 } 74 75 static int team_port_set_team_dev_addr(struct team *team, 76 struct team_port *port) 77 { 78 return __set_port_dev_addr(port->dev, team->dev->dev_addr); 79 } 80 81 int team_modeop_port_enter(struct team *team, struct team_port *port) 82 { 83 return team_port_set_team_dev_addr(team, port); 84 } 85 EXPORT_SYMBOL(team_modeop_port_enter); 86 87 void team_modeop_port_change_dev_addr(struct team *team, 88 struct team_port *port) 89 { 90 team_port_set_team_dev_addr(team, port); 91 } 92 EXPORT_SYMBOL(team_modeop_port_change_dev_addr); 93 94 static void team_refresh_port_linkup(struct team_port *port) 95 { 96 port->linkup = port->user.linkup_enabled ? port->user.linkup : 97 port->state.linkup; 98 } 99 100 101 /******************* 102 * Options handling 103 *******************/ 104 105 struct team_option_inst { /* One for each option instance */ 106 struct list_head list; 107 struct list_head tmp_list; 108 struct team_option *option; 109 struct team_option_inst_info info; 110 bool changed; 111 bool removed; 112 }; 113 114 static struct team_option *__team_find_option(struct team *team, 115 const char *opt_name) 116 { 117 struct team_option *option; 118 119 list_for_each_entry(option, &team->option_list, list) { 120 if (strcmp(option->name, opt_name) == 0) 121 return option; 122 } 123 return NULL; 124 } 125 126 static void __team_option_inst_del(struct team_option_inst *opt_inst) 127 { 128 list_del(&opt_inst->list); 129 kfree(opt_inst); 130 } 131 132 static void __team_option_inst_del_option(struct team *team, 133 struct team_option *option) 134 { 135 struct team_option_inst *opt_inst, *tmp; 136 137 list_for_each_entry_safe(opt_inst, tmp, &team->option_inst_list, list) { 138 if (opt_inst->option == option) 139 __team_option_inst_del(opt_inst); 140 } 141 } 142 143 static int __team_option_inst_add(struct team *team, struct team_option *option, 144 struct team_port *port) 145 { 146 struct team_option_inst *opt_inst; 147 unsigned int array_size; 148 unsigned int i; 149 int err; 150 151 array_size = option->array_size; 152 if (!array_size) 153 array_size = 1; /* No array but still need one instance */ 154 155 for (i = 0; i < array_size; i++) { 156 opt_inst = kmalloc(sizeof(*opt_inst), GFP_KERNEL); 157 if (!opt_inst) 158 return -ENOMEM; 159 opt_inst->option = option; 160 opt_inst->info.port = port; 161 opt_inst->info.array_index = i; 162 opt_inst->changed = true; 163 opt_inst->removed = false; 164 list_add_tail(&opt_inst->list, &team->option_inst_list); 165 if (option->init) { 166 err = option->init(team, &opt_inst->info); 167 if (err) 168 return err; 169 } 170 171 } 172 return 0; 173 } 174 175 static int __team_option_inst_add_option(struct team *team, 176 struct team_option *option) 177 { 178 int err; 179 180 if (!option->per_port) { 181 err = __team_option_inst_add(team, option, NULL); 182 if (err) 183 goto inst_del_option; 184 } 185 return 0; 186 187 inst_del_option: 188 __team_option_inst_del_option(team, option); 189 return err; 190 } 191 192 static void __team_option_inst_mark_removed_option(struct team *team, 193 struct team_option *option) 194 { 195 struct team_option_inst *opt_inst; 196 197 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 198 if (opt_inst->option == option) { 199 opt_inst->changed = true; 200 opt_inst->removed = true; 201 } 202 } 203 } 204 205 static void __team_option_inst_del_port(struct team *team, 206 struct team_port *port) 207 { 208 struct team_option_inst *opt_inst, *tmp; 209 210 list_for_each_entry_safe(opt_inst, tmp, &team->option_inst_list, list) { 211 if (opt_inst->option->per_port && 212 opt_inst->info.port == port) 213 __team_option_inst_del(opt_inst); 214 } 215 } 216 217 static int __team_option_inst_add_port(struct team *team, 218 struct team_port *port) 219 { 220 struct team_option *option; 221 int err; 222 223 list_for_each_entry(option, &team->option_list, list) { 224 if (!option->per_port) 225 continue; 226 err = __team_option_inst_add(team, option, port); 227 if (err) 228 goto inst_del_port; 229 } 230 return 0; 231 232 inst_del_port: 233 __team_option_inst_del_port(team, port); 234 return err; 235 } 236 237 static void __team_option_inst_mark_removed_port(struct team *team, 238 struct team_port *port) 239 { 240 struct team_option_inst *opt_inst; 241 242 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 243 if (opt_inst->info.port == port) { 244 opt_inst->changed = true; 245 opt_inst->removed = true; 246 } 247 } 248 } 249 250 static int __team_options_register(struct team *team, 251 const struct team_option *option, 252 size_t option_count) 253 { 254 int i; 255 struct team_option **dst_opts; 256 int err; 257 258 dst_opts = kzalloc(sizeof(struct team_option *) * option_count, 259 GFP_KERNEL); 260 if (!dst_opts) 261 return -ENOMEM; 262 for (i = 0; i < option_count; i++, option++) { 263 if (__team_find_option(team, option->name)) { 264 err = -EEXIST; 265 goto alloc_rollback; 266 } 267 dst_opts[i] = kmemdup(option, sizeof(*option), GFP_KERNEL); 268 if (!dst_opts[i]) { 269 err = -ENOMEM; 270 goto alloc_rollback; 271 } 272 } 273 274 for (i = 0; i < option_count; i++) { 275 err = __team_option_inst_add_option(team, dst_opts[i]); 276 if (err) 277 goto inst_rollback; 278 list_add_tail(&dst_opts[i]->list, &team->option_list); 279 } 280 281 kfree(dst_opts); 282 return 0; 283 284 inst_rollback: 285 for (i--; i >= 0; i--) 286 __team_option_inst_del_option(team, dst_opts[i]); 287 288 i = option_count - 1; 289 alloc_rollback: 290 for (i--; i >= 0; i--) 291 kfree(dst_opts[i]); 292 293 kfree(dst_opts); 294 return err; 295 } 296 297 static void __team_options_mark_removed(struct team *team, 298 const struct team_option *option, 299 size_t option_count) 300 { 301 int i; 302 303 for (i = 0; i < option_count; i++, option++) { 304 struct team_option *del_opt; 305 306 del_opt = __team_find_option(team, option->name); 307 if (del_opt) 308 __team_option_inst_mark_removed_option(team, del_opt); 309 } 310 } 311 312 static void __team_options_unregister(struct team *team, 313 const struct team_option *option, 314 size_t option_count) 315 { 316 int i; 317 318 for (i = 0; i < option_count; i++, option++) { 319 struct team_option *del_opt; 320 321 del_opt = __team_find_option(team, option->name); 322 if (del_opt) { 323 __team_option_inst_del_option(team, del_opt); 324 list_del(&del_opt->list); 325 kfree(del_opt); 326 } 327 } 328 } 329 330 static void __team_options_change_check(struct team *team); 331 332 int team_options_register(struct team *team, 333 const struct team_option *option, 334 size_t option_count) 335 { 336 int err; 337 338 err = __team_options_register(team, option, option_count); 339 if (err) 340 return err; 341 __team_options_change_check(team); 342 return 0; 343 } 344 EXPORT_SYMBOL(team_options_register); 345 346 void team_options_unregister(struct team *team, 347 const struct team_option *option, 348 size_t option_count) 349 { 350 __team_options_mark_removed(team, option, option_count); 351 __team_options_change_check(team); 352 __team_options_unregister(team, option, option_count); 353 } 354 EXPORT_SYMBOL(team_options_unregister); 355 356 static int team_option_get(struct team *team, 357 struct team_option_inst *opt_inst, 358 struct team_gsetter_ctx *ctx) 359 { 360 if (!opt_inst->option->getter) 361 return -EOPNOTSUPP; 362 return opt_inst->option->getter(team, ctx); 363 } 364 365 static int team_option_set(struct team *team, 366 struct team_option_inst *opt_inst, 367 struct team_gsetter_ctx *ctx) 368 { 369 if (!opt_inst->option->setter) 370 return -EOPNOTSUPP; 371 return opt_inst->option->setter(team, ctx); 372 } 373 374 void team_option_inst_set_change(struct team_option_inst_info *opt_inst_info) 375 { 376 struct team_option_inst *opt_inst; 377 378 opt_inst = container_of(opt_inst_info, struct team_option_inst, info); 379 opt_inst->changed = true; 380 } 381 EXPORT_SYMBOL(team_option_inst_set_change); 382 383 void team_options_change_check(struct team *team) 384 { 385 __team_options_change_check(team); 386 } 387 EXPORT_SYMBOL(team_options_change_check); 388 389 390 /**************** 391 * Mode handling 392 ****************/ 393 394 static LIST_HEAD(mode_list); 395 static DEFINE_SPINLOCK(mode_list_lock); 396 397 struct team_mode_item { 398 struct list_head list; 399 const struct team_mode *mode; 400 }; 401 402 static struct team_mode_item *__find_mode(const char *kind) 403 { 404 struct team_mode_item *mitem; 405 406 list_for_each_entry(mitem, &mode_list, list) { 407 if (strcmp(mitem->mode->kind, kind) == 0) 408 return mitem; 409 } 410 return NULL; 411 } 412 413 static bool is_good_mode_name(const char *name) 414 { 415 while (*name != '\0') { 416 if (!isalpha(*name) && !isdigit(*name) && *name != '_') 417 return false; 418 name++; 419 } 420 return true; 421 } 422 423 int team_mode_register(const struct team_mode *mode) 424 { 425 int err = 0; 426 struct team_mode_item *mitem; 427 428 if (!is_good_mode_name(mode->kind) || 429 mode->priv_size > TEAM_MODE_PRIV_SIZE) 430 return -EINVAL; 431 432 mitem = kmalloc(sizeof(*mitem), GFP_KERNEL); 433 if (!mitem) 434 return -ENOMEM; 435 436 spin_lock(&mode_list_lock); 437 if (__find_mode(mode->kind)) { 438 err = -EEXIST; 439 kfree(mitem); 440 goto unlock; 441 } 442 mitem->mode = mode; 443 list_add_tail(&mitem->list, &mode_list); 444 unlock: 445 spin_unlock(&mode_list_lock); 446 return err; 447 } 448 EXPORT_SYMBOL(team_mode_register); 449 450 void team_mode_unregister(const struct team_mode *mode) 451 { 452 struct team_mode_item *mitem; 453 454 spin_lock(&mode_list_lock); 455 mitem = __find_mode(mode->kind); 456 if (mitem) { 457 list_del_init(&mitem->list); 458 kfree(mitem); 459 } 460 spin_unlock(&mode_list_lock); 461 } 462 EXPORT_SYMBOL(team_mode_unregister); 463 464 static const struct team_mode *team_mode_get(const char *kind) 465 { 466 struct team_mode_item *mitem; 467 const struct team_mode *mode = NULL; 468 469 spin_lock(&mode_list_lock); 470 mitem = __find_mode(kind); 471 if (!mitem) { 472 spin_unlock(&mode_list_lock); 473 request_module("team-mode-%s", kind); 474 spin_lock(&mode_list_lock); 475 mitem = __find_mode(kind); 476 } 477 if (mitem) { 478 mode = mitem->mode; 479 if (!try_module_get(mode->owner)) 480 mode = NULL; 481 } 482 483 spin_unlock(&mode_list_lock); 484 return mode; 485 } 486 487 static void team_mode_put(const struct team_mode *mode) 488 { 489 module_put(mode->owner); 490 } 491 492 static bool team_dummy_transmit(struct team *team, struct sk_buff *skb) 493 { 494 dev_kfree_skb_any(skb); 495 return false; 496 } 497 498 static rx_handler_result_t team_dummy_receive(struct team *team, 499 struct team_port *port, 500 struct sk_buff *skb) 501 { 502 return RX_HANDLER_ANOTHER; 503 } 504 505 static const struct team_mode __team_no_mode = { 506 .kind = "*NOMODE*", 507 }; 508 509 static bool team_is_mode_set(struct team *team) 510 { 511 return team->mode != &__team_no_mode; 512 } 513 514 static void team_set_no_mode(struct team *team) 515 { 516 team->user_carrier_enabled = false; 517 team->mode = &__team_no_mode; 518 } 519 520 static void team_adjust_ops(struct team *team) 521 { 522 /* 523 * To avoid checks in rx/tx skb paths, ensure here that non-null and 524 * correct ops are always set. 525 */ 526 527 if (!team->en_port_count || !team_is_mode_set(team) || 528 !team->mode->ops->transmit) 529 team->ops.transmit = team_dummy_transmit; 530 else 531 team->ops.transmit = team->mode->ops->transmit; 532 533 if (!team->en_port_count || !team_is_mode_set(team) || 534 !team->mode->ops->receive) 535 team->ops.receive = team_dummy_receive; 536 else 537 team->ops.receive = team->mode->ops->receive; 538 } 539 540 /* 541 * We can benefit from the fact that it's ensured no port is present 542 * at the time of mode change. Therefore no packets are in fly so there's no 543 * need to set mode operations in any special way. 544 */ 545 static int __team_change_mode(struct team *team, 546 const struct team_mode *new_mode) 547 { 548 /* Check if mode was previously set and do cleanup if so */ 549 if (team_is_mode_set(team)) { 550 void (*exit_op)(struct team *team) = team->ops.exit; 551 552 /* Clear ops area so no callback is called any longer */ 553 memset(&team->ops, 0, sizeof(struct team_mode_ops)); 554 team_adjust_ops(team); 555 556 if (exit_op) 557 exit_op(team); 558 team_mode_put(team->mode); 559 team_set_no_mode(team); 560 /* zero private data area */ 561 memset(&team->mode_priv, 0, 562 sizeof(struct team) - offsetof(struct team, mode_priv)); 563 } 564 565 if (!new_mode) 566 return 0; 567 568 if (new_mode->ops->init) { 569 int err; 570 571 err = new_mode->ops->init(team); 572 if (err) 573 return err; 574 } 575 576 team->mode = new_mode; 577 memcpy(&team->ops, new_mode->ops, sizeof(struct team_mode_ops)); 578 team_adjust_ops(team); 579 580 return 0; 581 } 582 583 static int team_change_mode(struct team *team, const char *kind) 584 { 585 const struct team_mode *new_mode; 586 struct net_device *dev = team->dev; 587 int err; 588 589 if (!list_empty(&team->port_list)) { 590 netdev_err(dev, "No ports can be present during mode change\n"); 591 return -EBUSY; 592 } 593 594 if (team_is_mode_set(team) && strcmp(team->mode->kind, kind) == 0) { 595 netdev_err(dev, "Unable to change to the same mode the team is in\n"); 596 return -EINVAL; 597 } 598 599 new_mode = team_mode_get(kind); 600 if (!new_mode) { 601 netdev_err(dev, "Mode \"%s\" not found\n", kind); 602 return -EINVAL; 603 } 604 605 err = __team_change_mode(team, new_mode); 606 if (err) { 607 netdev_err(dev, "Failed to change to mode \"%s\"\n", kind); 608 team_mode_put(new_mode); 609 return err; 610 } 611 612 netdev_info(dev, "Mode changed to \"%s\"\n", kind); 613 return 0; 614 } 615 616 617 /********************* 618 * Peers notification 619 *********************/ 620 621 static void team_notify_peers_work(struct work_struct *work) 622 { 623 struct team *team; 624 int val; 625 626 team = container_of(work, struct team, notify_peers.dw.work); 627 628 if (!rtnl_trylock()) { 629 schedule_delayed_work(&team->notify_peers.dw, 0); 630 return; 631 } 632 val = atomic_dec_if_positive(&team->notify_peers.count_pending); 633 if (val < 0) { 634 rtnl_unlock(); 635 return; 636 } 637 call_netdevice_notifiers(NETDEV_NOTIFY_PEERS, team->dev); 638 rtnl_unlock(); 639 if (val) 640 schedule_delayed_work(&team->notify_peers.dw, 641 msecs_to_jiffies(team->notify_peers.interval)); 642 } 643 644 static void team_notify_peers(struct team *team) 645 { 646 if (!team->notify_peers.count || !netif_running(team->dev)) 647 return; 648 atomic_add(team->notify_peers.count, &team->notify_peers.count_pending); 649 schedule_delayed_work(&team->notify_peers.dw, 0); 650 } 651 652 static void team_notify_peers_init(struct team *team) 653 { 654 INIT_DELAYED_WORK(&team->notify_peers.dw, team_notify_peers_work); 655 } 656 657 static void team_notify_peers_fini(struct team *team) 658 { 659 cancel_delayed_work_sync(&team->notify_peers.dw); 660 } 661 662 663 /******************************* 664 * Send multicast group rejoins 665 *******************************/ 666 667 static void team_mcast_rejoin_work(struct work_struct *work) 668 { 669 struct team *team; 670 int val; 671 672 team = container_of(work, struct team, mcast_rejoin.dw.work); 673 674 if (!rtnl_trylock()) { 675 schedule_delayed_work(&team->mcast_rejoin.dw, 0); 676 return; 677 } 678 val = atomic_dec_if_positive(&team->mcast_rejoin.count_pending); 679 if (val < 0) { 680 rtnl_unlock(); 681 return; 682 } 683 call_netdevice_notifiers(NETDEV_RESEND_IGMP, team->dev); 684 rtnl_unlock(); 685 if (val) 686 schedule_delayed_work(&team->mcast_rejoin.dw, 687 msecs_to_jiffies(team->mcast_rejoin.interval)); 688 } 689 690 static void team_mcast_rejoin(struct team *team) 691 { 692 if (!team->mcast_rejoin.count || !netif_running(team->dev)) 693 return; 694 atomic_add(team->mcast_rejoin.count, &team->mcast_rejoin.count_pending); 695 schedule_delayed_work(&team->mcast_rejoin.dw, 0); 696 } 697 698 static void team_mcast_rejoin_init(struct team *team) 699 { 700 INIT_DELAYED_WORK(&team->mcast_rejoin.dw, team_mcast_rejoin_work); 701 } 702 703 static void team_mcast_rejoin_fini(struct team *team) 704 { 705 cancel_delayed_work_sync(&team->mcast_rejoin.dw); 706 } 707 708 709 /************************ 710 * Rx path frame handler 711 ************************/ 712 713 /* note: already called with rcu_read_lock */ 714 static rx_handler_result_t team_handle_frame(struct sk_buff **pskb) 715 { 716 struct sk_buff *skb = *pskb; 717 struct team_port *port; 718 struct team *team; 719 rx_handler_result_t res; 720 721 skb = skb_share_check(skb, GFP_ATOMIC); 722 if (!skb) 723 return RX_HANDLER_CONSUMED; 724 725 *pskb = skb; 726 727 port = team_port_get_rcu(skb->dev); 728 team = port->team; 729 if (!team_port_enabled(port)) { 730 /* allow exact match delivery for disabled ports */ 731 res = RX_HANDLER_EXACT; 732 } else { 733 res = team->ops.receive(team, port, skb); 734 } 735 if (res == RX_HANDLER_ANOTHER) { 736 struct team_pcpu_stats *pcpu_stats; 737 738 pcpu_stats = this_cpu_ptr(team->pcpu_stats); 739 u64_stats_update_begin(&pcpu_stats->syncp); 740 pcpu_stats->rx_packets++; 741 pcpu_stats->rx_bytes += skb->len; 742 if (skb->pkt_type == PACKET_MULTICAST) 743 pcpu_stats->rx_multicast++; 744 u64_stats_update_end(&pcpu_stats->syncp); 745 746 skb->dev = team->dev; 747 } else { 748 this_cpu_inc(team->pcpu_stats->rx_dropped); 749 } 750 751 return res; 752 } 753 754 755 /************************************* 756 * Multiqueue Tx port select override 757 *************************************/ 758 759 static int team_queue_override_init(struct team *team) 760 { 761 struct list_head *listarr; 762 unsigned int queue_cnt = team->dev->num_tx_queues - 1; 763 unsigned int i; 764 765 if (!queue_cnt) 766 return 0; 767 listarr = kmalloc(sizeof(struct list_head) * queue_cnt, GFP_KERNEL); 768 if (!listarr) 769 return -ENOMEM; 770 team->qom_lists = listarr; 771 for (i = 0; i < queue_cnt; i++) 772 INIT_LIST_HEAD(listarr++); 773 return 0; 774 } 775 776 static void team_queue_override_fini(struct team *team) 777 { 778 kfree(team->qom_lists); 779 } 780 781 static struct list_head *__team_get_qom_list(struct team *team, u16 queue_id) 782 { 783 return &team->qom_lists[queue_id - 1]; 784 } 785 786 /* 787 * note: already called with rcu_read_lock 788 */ 789 static bool team_queue_override_transmit(struct team *team, struct sk_buff *skb) 790 { 791 struct list_head *qom_list; 792 struct team_port *port; 793 794 if (!team->queue_override_enabled || !skb->queue_mapping) 795 return false; 796 qom_list = __team_get_qom_list(team, skb->queue_mapping); 797 list_for_each_entry_rcu(port, qom_list, qom_list) { 798 if (!team_dev_queue_xmit(team, port, skb)) 799 return true; 800 } 801 return false; 802 } 803 804 static void __team_queue_override_port_del(struct team *team, 805 struct team_port *port) 806 { 807 if (!port->queue_id) 808 return; 809 list_del_rcu(&port->qom_list); 810 } 811 812 static bool team_queue_override_port_has_gt_prio_than(struct team_port *port, 813 struct team_port *cur) 814 { 815 if (port->priority < cur->priority) 816 return true; 817 if (port->priority > cur->priority) 818 return false; 819 if (port->index < cur->index) 820 return true; 821 return false; 822 } 823 824 static void __team_queue_override_port_add(struct team *team, 825 struct team_port *port) 826 { 827 struct team_port *cur; 828 struct list_head *qom_list; 829 struct list_head *node; 830 831 if (!port->queue_id) 832 return; 833 qom_list = __team_get_qom_list(team, port->queue_id); 834 node = qom_list; 835 list_for_each_entry(cur, qom_list, qom_list) { 836 if (team_queue_override_port_has_gt_prio_than(port, cur)) 837 break; 838 node = &cur->qom_list; 839 } 840 list_add_tail_rcu(&port->qom_list, node); 841 } 842 843 static void __team_queue_override_enabled_check(struct team *team) 844 { 845 struct team_port *port; 846 bool enabled = false; 847 848 list_for_each_entry(port, &team->port_list, list) { 849 if (port->queue_id) { 850 enabled = true; 851 break; 852 } 853 } 854 if (enabled == team->queue_override_enabled) 855 return; 856 netdev_dbg(team->dev, "%s queue override\n", 857 enabled ? "Enabling" : "Disabling"); 858 team->queue_override_enabled = enabled; 859 } 860 861 static void team_queue_override_port_prio_changed(struct team *team, 862 struct team_port *port) 863 { 864 if (!port->queue_id || team_port_enabled(port)) 865 return; 866 __team_queue_override_port_del(team, port); 867 __team_queue_override_port_add(team, port); 868 __team_queue_override_enabled_check(team); 869 } 870 871 static void team_queue_override_port_change_queue_id(struct team *team, 872 struct team_port *port, 873 u16 new_queue_id) 874 { 875 if (team_port_enabled(port)) { 876 __team_queue_override_port_del(team, port); 877 port->queue_id = new_queue_id; 878 __team_queue_override_port_add(team, port); 879 __team_queue_override_enabled_check(team); 880 } else { 881 port->queue_id = new_queue_id; 882 } 883 } 884 885 static void team_queue_override_port_add(struct team *team, 886 struct team_port *port) 887 { 888 __team_queue_override_port_add(team, port); 889 __team_queue_override_enabled_check(team); 890 } 891 892 static void team_queue_override_port_del(struct team *team, 893 struct team_port *port) 894 { 895 __team_queue_override_port_del(team, port); 896 __team_queue_override_enabled_check(team); 897 } 898 899 900 /**************** 901 * Port handling 902 ****************/ 903 904 static bool team_port_find(const struct team *team, 905 const struct team_port *port) 906 { 907 struct team_port *cur; 908 909 list_for_each_entry(cur, &team->port_list, list) 910 if (cur == port) 911 return true; 912 return false; 913 } 914 915 /* 916 * Enable/disable port by adding to enabled port hashlist and setting 917 * port->index (Might be racy so reader could see incorrect ifindex when 918 * processing a flying packet, but that is not a problem). Write guarded 919 * by team->lock. 920 */ 921 static void team_port_enable(struct team *team, 922 struct team_port *port) 923 { 924 if (team_port_enabled(port)) 925 return; 926 port->index = team->en_port_count++; 927 hlist_add_head_rcu(&port->hlist, 928 team_port_index_hash(team, port->index)); 929 team_adjust_ops(team); 930 team_queue_override_port_add(team, port); 931 if (team->ops.port_enabled) 932 team->ops.port_enabled(team, port); 933 team_notify_peers(team); 934 team_mcast_rejoin(team); 935 } 936 937 static void __reconstruct_port_hlist(struct team *team, int rm_index) 938 { 939 int i; 940 struct team_port *port; 941 942 for (i = rm_index + 1; i < team->en_port_count; i++) { 943 port = team_get_port_by_index(team, i); 944 hlist_del_rcu(&port->hlist); 945 port->index--; 946 hlist_add_head_rcu(&port->hlist, 947 team_port_index_hash(team, port->index)); 948 } 949 } 950 951 static void team_port_disable(struct team *team, 952 struct team_port *port) 953 { 954 if (!team_port_enabled(port)) 955 return; 956 if (team->ops.port_disabled) 957 team->ops.port_disabled(team, port); 958 hlist_del_rcu(&port->hlist); 959 __reconstruct_port_hlist(team, port->index); 960 port->index = -1; 961 team->en_port_count--; 962 team_queue_override_port_del(team, port); 963 team_adjust_ops(team); 964 team_notify_peers(team); 965 team_mcast_rejoin(team); 966 } 967 968 #define TEAM_VLAN_FEATURES (NETIF_F_ALL_CSUM | NETIF_F_SG | \ 969 NETIF_F_FRAGLIST | NETIF_F_ALL_TSO | \ 970 NETIF_F_HIGHDMA | NETIF_F_LRO) 971 972 static void __team_compute_features(struct team *team) 973 { 974 struct team_port *port; 975 u32 vlan_features = TEAM_VLAN_FEATURES & NETIF_F_ALL_FOR_ALL; 976 unsigned short max_hard_header_len = ETH_HLEN; 977 unsigned int dst_release_flag = IFF_XMIT_DST_RELEASE | 978 IFF_XMIT_DST_RELEASE_PERM; 979 980 list_for_each_entry(port, &team->port_list, list) { 981 vlan_features = netdev_increment_features(vlan_features, 982 port->dev->vlan_features, 983 TEAM_VLAN_FEATURES); 984 985 dst_release_flag &= port->dev->priv_flags; 986 if (port->dev->hard_header_len > max_hard_header_len) 987 max_hard_header_len = port->dev->hard_header_len; 988 } 989 990 team->dev->vlan_features = vlan_features; 991 team->dev->hard_header_len = max_hard_header_len; 992 993 team->dev->priv_flags &= ~IFF_XMIT_DST_RELEASE; 994 if (dst_release_flag == (IFF_XMIT_DST_RELEASE | IFF_XMIT_DST_RELEASE_PERM)) 995 team->dev->priv_flags |= IFF_XMIT_DST_RELEASE; 996 997 netdev_change_features(team->dev); 998 } 999 1000 static void team_compute_features(struct team *team) 1001 { 1002 mutex_lock(&team->lock); 1003 __team_compute_features(team); 1004 mutex_unlock(&team->lock); 1005 } 1006 1007 static int team_port_enter(struct team *team, struct team_port *port) 1008 { 1009 int err = 0; 1010 1011 dev_hold(team->dev); 1012 if (team->ops.port_enter) { 1013 err = team->ops.port_enter(team, port); 1014 if (err) { 1015 netdev_err(team->dev, "Device %s failed to enter team mode\n", 1016 port->dev->name); 1017 goto err_port_enter; 1018 } 1019 } 1020 1021 return 0; 1022 1023 err_port_enter: 1024 dev_put(team->dev); 1025 1026 return err; 1027 } 1028 1029 static void team_port_leave(struct team *team, struct team_port *port) 1030 { 1031 if (team->ops.port_leave) 1032 team->ops.port_leave(team, port); 1033 dev_put(team->dev); 1034 } 1035 1036 #ifdef CONFIG_NET_POLL_CONTROLLER 1037 static int team_port_enable_netpoll(struct team *team, struct team_port *port) 1038 { 1039 struct netpoll *np; 1040 int err; 1041 1042 if (!team->dev->npinfo) 1043 return 0; 1044 1045 np = kzalloc(sizeof(*np), GFP_KERNEL); 1046 if (!np) 1047 return -ENOMEM; 1048 1049 err = __netpoll_setup(np, port->dev); 1050 if (err) { 1051 kfree(np); 1052 return err; 1053 } 1054 port->np = np; 1055 return err; 1056 } 1057 1058 static void team_port_disable_netpoll(struct team_port *port) 1059 { 1060 struct netpoll *np = port->np; 1061 1062 if (!np) 1063 return; 1064 port->np = NULL; 1065 1066 /* Wait for transmitting packets to finish before freeing. */ 1067 synchronize_rcu_bh(); 1068 __netpoll_cleanup(np); 1069 kfree(np); 1070 } 1071 #else 1072 static int team_port_enable_netpoll(struct team *team, struct team_port *port) 1073 { 1074 return 0; 1075 } 1076 static void team_port_disable_netpoll(struct team_port *port) 1077 { 1078 } 1079 #endif 1080 1081 static int team_upper_dev_link(struct net_device *dev, 1082 struct net_device *port_dev) 1083 { 1084 int err; 1085 1086 err = netdev_master_upper_dev_link(port_dev, dev); 1087 if (err) 1088 return err; 1089 port_dev->priv_flags |= IFF_TEAM_PORT; 1090 return 0; 1091 } 1092 1093 static void team_upper_dev_unlink(struct net_device *dev, 1094 struct net_device *port_dev) 1095 { 1096 netdev_upper_dev_unlink(port_dev, dev); 1097 port_dev->priv_flags &= ~IFF_TEAM_PORT; 1098 } 1099 1100 static void __team_port_change_port_added(struct team_port *port, bool linkup); 1101 static int team_dev_type_check_change(struct net_device *dev, 1102 struct net_device *port_dev); 1103 1104 static int team_port_add(struct team *team, struct net_device *port_dev) 1105 { 1106 struct net_device *dev = team->dev; 1107 struct team_port *port; 1108 char *portname = port_dev->name; 1109 int err; 1110 1111 if (port_dev->flags & IFF_LOOPBACK) { 1112 netdev_err(dev, "Device %s is loopback device. Loopback devices can't be added as a team port\n", 1113 portname); 1114 return -EINVAL; 1115 } 1116 1117 if (team_port_exists(port_dev)) { 1118 netdev_err(dev, "Device %s is already a port " 1119 "of a team device\n", portname); 1120 return -EBUSY; 1121 } 1122 1123 if (port_dev->features & NETIF_F_VLAN_CHALLENGED && 1124 vlan_uses_dev(dev)) { 1125 netdev_err(dev, "Device %s is VLAN challenged and team device has VLAN set up\n", 1126 portname); 1127 return -EPERM; 1128 } 1129 1130 err = team_dev_type_check_change(dev, port_dev); 1131 if (err) 1132 return err; 1133 1134 if (port_dev->flags & IFF_UP) { 1135 netdev_err(dev, "Device %s is up. Set it down before adding it as a team port\n", 1136 portname); 1137 return -EBUSY; 1138 } 1139 1140 port = kzalloc(sizeof(struct team_port) + team->mode->port_priv_size, 1141 GFP_KERNEL); 1142 if (!port) 1143 return -ENOMEM; 1144 1145 port->dev = port_dev; 1146 port->team = team; 1147 INIT_LIST_HEAD(&port->qom_list); 1148 1149 port->orig.mtu = port_dev->mtu; 1150 err = dev_set_mtu(port_dev, dev->mtu); 1151 if (err) { 1152 netdev_dbg(dev, "Error %d calling dev_set_mtu\n", err); 1153 goto err_set_mtu; 1154 } 1155 1156 memcpy(port->orig.dev_addr, port_dev->dev_addr, port_dev->addr_len); 1157 1158 err = team_port_enter(team, port); 1159 if (err) { 1160 netdev_err(dev, "Device %s failed to enter team mode\n", 1161 portname); 1162 goto err_port_enter; 1163 } 1164 1165 err = dev_open(port_dev); 1166 if (err) { 1167 netdev_dbg(dev, "Device %s opening failed\n", 1168 portname); 1169 goto err_dev_open; 1170 } 1171 1172 err = vlan_vids_add_by_dev(port_dev, dev); 1173 if (err) { 1174 netdev_err(dev, "Failed to add vlan ids to device %s\n", 1175 portname); 1176 goto err_vids_add; 1177 } 1178 1179 err = team_port_enable_netpoll(team, port); 1180 if (err) { 1181 netdev_err(dev, "Failed to enable netpoll on device %s\n", 1182 portname); 1183 goto err_enable_netpoll; 1184 } 1185 1186 if (!(dev->features & NETIF_F_LRO)) 1187 dev_disable_lro(port_dev); 1188 1189 err = netdev_rx_handler_register(port_dev, team_handle_frame, 1190 port); 1191 if (err) { 1192 netdev_err(dev, "Device %s failed to register rx_handler\n", 1193 portname); 1194 goto err_handler_register; 1195 } 1196 1197 err = team_upper_dev_link(dev, port_dev); 1198 if (err) { 1199 netdev_err(dev, "Device %s failed to set upper link\n", 1200 portname); 1201 goto err_set_upper_link; 1202 } 1203 1204 err = __team_option_inst_add_port(team, port); 1205 if (err) { 1206 netdev_err(dev, "Device %s failed to add per-port options\n", 1207 portname); 1208 goto err_option_port_add; 1209 } 1210 1211 port->index = -1; 1212 list_add_tail_rcu(&port->list, &team->port_list); 1213 team_port_enable(team, port); 1214 __team_compute_features(team); 1215 __team_port_change_port_added(port, !!netif_carrier_ok(port_dev)); 1216 __team_options_change_check(team); 1217 1218 netdev_info(dev, "Port device %s added\n", portname); 1219 1220 return 0; 1221 1222 err_option_port_add: 1223 team_upper_dev_unlink(dev, port_dev); 1224 1225 err_set_upper_link: 1226 netdev_rx_handler_unregister(port_dev); 1227 1228 err_handler_register: 1229 team_port_disable_netpoll(port); 1230 1231 err_enable_netpoll: 1232 vlan_vids_del_by_dev(port_dev, dev); 1233 1234 err_vids_add: 1235 dev_close(port_dev); 1236 1237 err_dev_open: 1238 team_port_leave(team, port); 1239 team_port_set_orig_dev_addr(port); 1240 1241 err_port_enter: 1242 dev_set_mtu(port_dev, port->orig.mtu); 1243 1244 err_set_mtu: 1245 kfree(port); 1246 1247 return err; 1248 } 1249 1250 static void __team_port_change_port_removed(struct team_port *port); 1251 1252 static int team_port_del(struct team *team, struct net_device *port_dev) 1253 { 1254 struct net_device *dev = team->dev; 1255 struct team_port *port; 1256 char *portname = port_dev->name; 1257 1258 port = team_port_get_rtnl(port_dev); 1259 if (!port || !team_port_find(team, port)) { 1260 netdev_err(dev, "Device %s does not act as a port of this team\n", 1261 portname); 1262 return -ENOENT; 1263 } 1264 1265 team_port_disable(team, port); 1266 list_del_rcu(&port->list); 1267 team_upper_dev_unlink(dev, port_dev); 1268 netdev_rx_handler_unregister(port_dev); 1269 team_port_disable_netpoll(port); 1270 vlan_vids_del_by_dev(port_dev, dev); 1271 dev_uc_unsync(port_dev, dev); 1272 dev_mc_unsync(port_dev, dev); 1273 dev_close(port_dev); 1274 team_port_leave(team, port); 1275 1276 __team_option_inst_mark_removed_port(team, port); 1277 __team_options_change_check(team); 1278 __team_option_inst_del_port(team, port); 1279 __team_port_change_port_removed(port); 1280 1281 team_port_set_orig_dev_addr(port); 1282 dev_set_mtu(port_dev, port->orig.mtu); 1283 kfree_rcu(port, rcu); 1284 netdev_info(dev, "Port device %s removed\n", portname); 1285 __team_compute_features(team); 1286 1287 return 0; 1288 } 1289 1290 1291 /***************** 1292 * Net device ops 1293 *****************/ 1294 1295 static int team_mode_option_get(struct team *team, struct team_gsetter_ctx *ctx) 1296 { 1297 ctx->data.str_val = team->mode->kind; 1298 return 0; 1299 } 1300 1301 static int team_mode_option_set(struct team *team, struct team_gsetter_ctx *ctx) 1302 { 1303 return team_change_mode(team, ctx->data.str_val); 1304 } 1305 1306 static int team_notify_peers_count_get(struct team *team, 1307 struct team_gsetter_ctx *ctx) 1308 { 1309 ctx->data.u32_val = team->notify_peers.count; 1310 return 0; 1311 } 1312 1313 static int team_notify_peers_count_set(struct team *team, 1314 struct team_gsetter_ctx *ctx) 1315 { 1316 team->notify_peers.count = ctx->data.u32_val; 1317 return 0; 1318 } 1319 1320 static int team_notify_peers_interval_get(struct team *team, 1321 struct team_gsetter_ctx *ctx) 1322 { 1323 ctx->data.u32_val = team->notify_peers.interval; 1324 return 0; 1325 } 1326 1327 static int team_notify_peers_interval_set(struct team *team, 1328 struct team_gsetter_ctx *ctx) 1329 { 1330 team->notify_peers.interval = ctx->data.u32_val; 1331 return 0; 1332 } 1333 1334 static int team_mcast_rejoin_count_get(struct team *team, 1335 struct team_gsetter_ctx *ctx) 1336 { 1337 ctx->data.u32_val = team->mcast_rejoin.count; 1338 return 0; 1339 } 1340 1341 static int team_mcast_rejoin_count_set(struct team *team, 1342 struct team_gsetter_ctx *ctx) 1343 { 1344 team->mcast_rejoin.count = ctx->data.u32_val; 1345 return 0; 1346 } 1347 1348 static int team_mcast_rejoin_interval_get(struct team *team, 1349 struct team_gsetter_ctx *ctx) 1350 { 1351 ctx->data.u32_val = team->mcast_rejoin.interval; 1352 return 0; 1353 } 1354 1355 static int team_mcast_rejoin_interval_set(struct team *team, 1356 struct team_gsetter_ctx *ctx) 1357 { 1358 team->mcast_rejoin.interval = ctx->data.u32_val; 1359 return 0; 1360 } 1361 1362 static int team_port_en_option_get(struct team *team, 1363 struct team_gsetter_ctx *ctx) 1364 { 1365 struct team_port *port = ctx->info->port; 1366 1367 ctx->data.bool_val = team_port_enabled(port); 1368 return 0; 1369 } 1370 1371 static int team_port_en_option_set(struct team *team, 1372 struct team_gsetter_ctx *ctx) 1373 { 1374 struct team_port *port = ctx->info->port; 1375 1376 if (ctx->data.bool_val) 1377 team_port_enable(team, port); 1378 else 1379 team_port_disable(team, port); 1380 return 0; 1381 } 1382 1383 static int team_user_linkup_option_get(struct team *team, 1384 struct team_gsetter_ctx *ctx) 1385 { 1386 struct team_port *port = ctx->info->port; 1387 1388 ctx->data.bool_val = port->user.linkup; 1389 return 0; 1390 } 1391 1392 static void __team_carrier_check(struct team *team); 1393 1394 static int team_user_linkup_option_set(struct team *team, 1395 struct team_gsetter_ctx *ctx) 1396 { 1397 struct team_port *port = ctx->info->port; 1398 1399 port->user.linkup = ctx->data.bool_val; 1400 team_refresh_port_linkup(port); 1401 __team_carrier_check(port->team); 1402 return 0; 1403 } 1404 1405 static int team_user_linkup_en_option_get(struct team *team, 1406 struct team_gsetter_ctx *ctx) 1407 { 1408 struct team_port *port = ctx->info->port; 1409 1410 ctx->data.bool_val = port->user.linkup_enabled; 1411 return 0; 1412 } 1413 1414 static int team_user_linkup_en_option_set(struct team *team, 1415 struct team_gsetter_ctx *ctx) 1416 { 1417 struct team_port *port = ctx->info->port; 1418 1419 port->user.linkup_enabled = ctx->data.bool_val; 1420 team_refresh_port_linkup(port); 1421 __team_carrier_check(port->team); 1422 return 0; 1423 } 1424 1425 static int team_priority_option_get(struct team *team, 1426 struct team_gsetter_ctx *ctx) 1427 { 1428 struct team_port *port = ctx->info->port; 1429 1430 ctx->data.s32_val = port->priority; 1431 return 0; 1432 } 1433 1434 static int team_priority_option_set(struct team *team, 1435 struct team_gsetter_ctx *ctx) 1436 { 1437 struct team_port *port = ctx->info->port; 1438 s32 priority = ctx->data.s32_val; 1439 1440 if (port->priority == priority) 1441 return 0; 1442 port->priority = priority; 1443 team_queue_override_port_prio_changed(team, port); 1444 return 0; 1445 } 1446 1447 static int team_queue_id_option_get(struct team *team, 1448 struct team_gsetter_ctx *ctx) 1449 { 1450 struct team_port *port = ctx->info->port; 1451 1452 ctx->data.u32_val = port->queue_id; 1453 return 0; 1454 } 1455 1456 static int team_queue_id_option_set(struct team *team, 1457 struct team_gsetter_ctx *ctx) 1458 { 1459 struct team_port *port = ctx->info->port; 1460 u16 new_queue_id = ctx->data.u32_val; 1461 1462 if (port->queue_id == new_queue_id) 1463 return 0; 1464 if (new_queue_id >= team->dev->real_num_tx_queues) 1465 return -EINVAL; 1466 team_queue_override_port_change_queue_id(team, port, new_queue_id); 1467 return 0; 1468 } 1469 1470 static const struct team_option team_options[] = { 1471 { 1472 .name = "mode", 1473 .type = TEAM_OPTION_TYPE_STRING, 1474 .getter = team_mode_option_get, 1475 .setter = team_mode_option_set, 1476 }, 1477 { 1478 .name = "notify_peers_count", 1479 .type = TEAM_OPTION_TYPE_U32, 1480 .getter = team_notify_peers_count_get, 1481 .setter = team_notify_peers_count_set, 1482 }, 1483 { 1484 .name = "notify_peers_interval", 1485 .type = TEAM_OPTION_TYPE_U32, 1486 .getter = team_notify_peers_interval_get, 1487 .setter = team_notify_peers_interval_set, 1488 }, 1489 { 1490 .name = "mcast_rejoin_count", 1491 .type = TEAM_OPTION_TYPE_U32, 1492 .getter = team_mcast_rejoin_count_get, 1493 .setter = team_mcast_rejoin_count_set, 1494 }, 1495 { 1496 .name = "mcast_rejoin_interval", 1497 .type = TEAM_OPTION_TYPE_U32, 1498 .getter = team_mcast_rejoin_interval_get, 1499 .setter = team_mcast_rejoin_interval_set, 1500 }, 1501 { 1502 .name = "enabled", 1503 .type = TEAM_OPTION_TYPE_BOOL, 1504 .per_port = true, 1505 .getter = team_port_en_option_get, 1506 .setter = team_port_en_option_set, 1507 }, 1508 { 1509 .name = "user_linkup", 1510 .type = TEAM_OPTION_TYPE_BOOL, 1511 .per_port = true, 1512 .getter = team_user_linkup_option_get, 1513 .setter = team_user_linkup_option_set, 1514 }, 1515 { 1516 .name = "user_linkup_enabled", 1517 .type = TEAM_OPTION_TYPE_BOOL, 1518 .per_port = true, 1519 .getter = team_user_linkup_en_option_get, 1520 .setter = team_user_linkup_en_option_set, 1521 }, 1522 { 1523 .name = "priority", 1524 .type = TEAM_OPTION_TYPE_S32, 1525 .per_port = true, 1526 .getter = team_priority_option_get, 1527 .setter = team_priority_option_set, 1528 }, 1529 { 1530 .name = "queue_id", 1531 .type = TEAM_OPTION_TYPE_U32, 1532 .per_port = true, 1533 .getter = team_queue_id_option_get, 1534 .setter = team_queue_id_option_set, 1535 }, 1536 }; 1537 1538 static struct lock_class_key team_netdev_xmit_lock_key; 1539 static struct lock_class_key team_netdev_addr_lock_key; 1540 static struct lock_class_key team_tx_busylock_key; 1541 1542 static void team_set_lockdep_class_one(struct net_device *dev, 1543 struct netdev_queue *txq, 1544 void *unused) 1545 { 1546 lockdep_set_class(&txq->_xmit_lock, &team_netdev_xmit_lock_key); 1547 } 1548 1549 static void team_set_lockdep_class(struct net_device *dev) 1550 { 1551 lockdep_set_class(&dev->addr_list_lock, &team_netdev_addr_lock_key); 1552 netdev_for_each_tx_queue(dev, team_set_lockdep_class_one, NULL); 1553 dev->qdisc_tx_busylock = &team_tx_busylock_key; 1554 } 1555 1556 static int team_init(struct net_device *dev) 1557 { 1558 struct team *team = netdev_priv(dev); 1559 int i; 1560 int err; 1561 1562 team->dev = dev; 1563 mutex_init(&team->lock); 1564 team_set_no_mode(team); 1565 1566 team->pcpu_stats = netdev_alloc_pcpu_stats(struct team_pcpu_stats); 1567 if (!team->pcpu_stats) 1568 return -ENOMEM; 1569 1570 for (i = 0; i < TEAM_PORT_HASHENTRIES; i++) 1571 INIT_HLIST_HEAD(&team->en_port_hlist[i]); 1572 INIT_LIST_HEAD(&team->port_list); 1573 err = team_queue_override_init(team); 1574 if (err) 1575 goto err_team_queue_override_init; 1576 1577 team_adjust_ops(team); 1578 1579 INIT_LIST_HEAD(&team->option_list); 1580 INIT_LIST_HEAD(&team->option_inst_list); 1581 1582 team_notify_peers_init(team); 1583 team_mcast_rejoin_init(team); 1584 1585 err = team_options_register(team, team_options, ARRAY_SIZE(team_options)); 1586 if (err) 1587 goto err_options_register; 1588 netif_carrier_off(dev); 1589 1590 team_set_lockdep_class(dev); 1591 1592 return 0; 1593 1594 err_options_register: 1595 team_mcast_rejoin_fini(team); 1596 team_notify_peers_fini(team); 1597 team_queue_override_fini(team); 1598 err_team_queue_override_init: 1599 free_percpu(team->pcpu_stats); 1600 1601 return err; 1602 } 1603 1604 static void team_uninit(struct net_device *dev) 1605 { 1606 struct team *team = netdev_priv(dev); 1607 struct team_port *port; 1608 struct team_port *tmp; 1609 1610 mutex_lock(&team->lock); 1611 list_for_each_entry_safe(port, tmp, &team->port_list, list) 1612 team_port_del(team, port->dev); 1613 1614 __team_change_mode(team, NULL); /* cleanup */ 1615 __team_options_unregister(team, team_options, ARRAY_SIZE(team_options)); 1616 team_mcast_rejoin_fini(team); 1617 team_notify_peers_fini(team); 1618 team_queue_override_fini(team); 1619 mutex_unlock(&team->lock); 1620 } 1621 1622 static void team_destructor(struct net_device *dev) 1623 { 1624 struct team *team = netdev_priv(dev); 1625 1626 free_percpu(team->pcpu_stats); 1627 free_netdev(dev); 1628 } 1629 1630 static int team_open(struct net_device *dev) 1631 { 1632 return 0; 1633 } 1634 1635 static int team_close(struct net_device *dev) 1636 { 1637 return 0; 1638 } 1639 1640 /* 1641 * note: already called with rcu_read_lock 1642 */ 1643 static netdev_tx_t team_xmit(struct sk_buff *skb, struct net_device *dev) 1644 { 1645 struct team *team = netdev_priv(dev); 1646 bool tx_success; 1647 unsigned int len = skb->len; 1648 1649 tx_success = team_queue_override_transmit(team, skb); 1650 if (!tx_success) 1651 tx_success = team->ops.transmit(team, skb); 1652 if (tx_success) { 1653 struct team_pcpu_stats *pcpu_stats; 1654 1655 pcpu_stats = this_cpu_ptr(team->pcpu_stats); 1656 u64_stats_update_begin(&pcpu_stats->syncp); 1657 pcpu_stats->tx_packets++; 1658 pcpu_stats->tx_bytes += len; 1659 u64_stats_update_end(&pcpu_stats->syncp); 1660 } else { 1661 this_cpu_inc(team->pcpu_stats->tx_dropped); 1662 } 1663 1664 return NETDEV_TX_OK; 1665 } 1666 1667 static u16 team_select_queue(struct net_device *dev, struct sk_buff *skb, 1668 void *accel_priv, select_queue_fallback_t fallback) 1669 { 1670 /* 1671 * This helper function exists to help dev_pick_tx get the correct 1672 * destination queue. Using a helper function skips a call to 1673 * skb_tx_hash and will put the skbs in the queue we expect on their 1674 * way down to the team driver. 1675 */ 1676 u16 txq = skb_rx_queue_recorded(skb) ? skb_get_rx_queue(skb) : 0; 1677 1678 /* 1679 * Save the original txq to restore before passing to the driver 1680 */ 1681 qdisc_skb_cb(skb)->slave_dev_queue_mapping = skb->queue_mapping; 1682 1683 if (unlikely(txq >= dev->real_num_tx_queues)) { 1684 do { 1685 txq -= dev->real_num_tx_queues; 1686 } while (txq >= dev->real_num_tx_queues); 1687 } 1688 return txq; 1689 } 1690 1691 static void team_change_rx_flags(struct net_device *dev, int change) 1692 { 1693 struct team *team = netdev_priv(dev); 1694 struct team_port *port; 1695 int inc; 1696 1697 rcu_read_lock(); 1698 list_for_each_entry_rcu(port, &team->port_list, list) { 1699 if (change & IFF_PROMISC) { 1700 inc = dev->flags & IFF_PROMISC ? 1 : -1; 1701 dev_set_promiscuity(port->dev, inc); 1702 } 1703 if (change & IFF_ALLMULTI) { 1704 inc = dev->flags & IFF_ALLMULTI ? 1 : -1; 1705 dev_set_allmulti(port->dev, inc); 1706 } 1707 } 1708 rcu_read_unlock(); 1709 } 1710 1711 static void team_set_rx_mode(struct net_device *dev) 1712 { 1713 struct team *team = netdev_priv(dev); 1714 struct team_port *port; 1715 1716 rcu_read_lock(); 1717 list_for_each_entry_rcu(port, &team->port_list, list) { 1718 dev_uc_sync_multiple(port->dev, dev); 1719 dev_mc_sync_multiple(port->dev, dev); 1720 } 1721 rcu_read_unlock(); 1722 } 1723 1724 static int team_set_mac_address(struct net_device *dev, void *p) 1725 { 1726 struct sockaddr *addr = p; 1727 struct team *team = netdev_priv(dev); 1728 struct team_port *port; 1729 1730 if (dev->type == ARPHRD_ETHER && !is_valid_ether_addr(addr->sa_data)) 1731 return -EADDRNOTAVAIL; 1732 memcpy(dev->dev_addr, addr->sa_data, dev->addr_len); 1733 rcu_read_lock(); 1734 list_for_each_entry_rcu(port, &team->port_list, list) 1735 if (team->ops.port_change_dev_addr) 1736 team->ops.port_change_dev_addr(team, port); 1737 rcu_read_unlock(); 1738 return 0; 1739 } 1740 1741 static int team_change_mtu(struct net_device *dev, int new_mtu) 1742 { 1743 struct team *team = netdev_priv(dev); 1744 struct team_port *port; 1745 int err; 1746 1747 /* 1748 * Alhough this is reader, it's guarded by team lock. It's not possible 1749 * to traverse list in reverse under rcu_read_lock 1750 */ 1751 mutex_lock(&team->lock); 1752 team->port_mtu_change_allowed = true; 1753 list_for_each_entry(port, &team->port_list, list) { 1754 err = dev_set_mtu(port->dev, new_mtu); 1755 if (err) { 1756 netdev_err(dev, "Device %s failed to change mtu", 1757 port->dev->name); 1758 goto unwind; 1759 } 1760 } 1761 team->port_mtu_change_allowed = false; 1762 mutex_unlock(&team->lock); 1763 1764 dev->mtu = new_mtu; 1765 1766 return 0; 1767 1768 unwind: 1769 list_for_each_entry_continue_reverse(port, &team->port_list, list) 1770 dev_set_mtu(port->dev, dev->mtu); 1771 team->port_mtu_change_allowed = false; 1772 mutex_unlock(&team->lock); 1773 1774 return err; 1775 } 1776 1777 static struct rtnl_link_stats64 * 1778 team_get_stats64(struct net_device *dev, struct rtnl_link_stats64 *stats) 1779 { 1780 struct team *team = netdev_priv(dev); 1781 struct team_pcpu_stats *p; 1782 u64 rx_packets, rx_bytes, rx_multicast, tx_packets, tx_bytes; 1783 u32 rx_dropped = 0, tx_dropped = 0; 1784 unsigned int start; 1785 int i; 1786 1787 for_each_possible_cpu(i) { 1788 p = per_cpu_ptr(team->pcpu_stats, i); 1789 do { 1790 start = u64_stats_fetch_begin_irq(&p->syncp); 1791 rx_packets = p->rx_packets; 1792 rx_bytes = p->rx_bytes; 1793 rx_multicast = p->rx_multicast; 1794 tx_packets = p->tx_packets; 1795 tx_bytes = p->tx_bytes; 1796 } while (u64_stats_fetch_retry_irq(&p->syncp, start)); 1797 1798 stats->rx_packets += rx_packets; 1799 stats->rx_bytes += rx_bytes; 1800 stats->multicast += rx_multicast; 1801 stats->tx_packets += tx_packets; 1802 stats->tx_bytes += tx_bytes; 1803 /* 1804 * rx_dropped & tx_dropped are u32, updated 1805 * without syncp protection. 1806 */ 1807 rx_dropped += p->rx_dropped; 1808 tx_dropped += p->tx_dropped; 1809 } 1810 stats->rx_dropped = rx_dropped; 1811 stats->tx_dropped = tx_dropped; 1812 return stats; 1813 } 1814 1815 static int team_vlan_rx_add_vid(struct net_device *dev, __be16 proto, u16 vid) 1816 { 1817 struct team *team = netdev_priv(dev); 1818 struct team_port *port; 1819 int err; 1820 1821 /* 1822 * Alhough this is reader, it's guarded by team lock. It's not possible 1823 * to traverse list in reverse under rcu_read_lock 1824 */ 1825 mutex_lock(&team->lock); 1826 list_for_each_entry(port, &team->port_list, list) { 1827 err = vlan_vid_add(port->dev, proto, vid); 1828 if (err) 1829 goto unwind; 1830 } 1831 mutex_unlock(&team->lock); 1832 1833 return 0; 1834 1835 unwind: 1836 list_for_each_entry_continue_reverse(port, &team->port_list, list) 1837 vlan_vid_del(port->dev, proto, vid); 1838 mutex_unlock(&team->lock); 1839 1840 return err; 1841 } 1842 1843 static int team_vlan_rx_kill_vid(struct net_device *dev, __be16 proto, u16 vid) 1844 { 1845 struct team *team = netdev_priv(dev); 1846 struct team_port *port; 1847 1848 rcu_read_lock(); 1849 list_for_each_entry_rcu(port, &team->port_list, list) 1850 vlan_vid_del(port->dev, proto, vid); 1851 rcu_read_unlock(); 1852 1853 return 0; 1854 } 1855 1856 #ifdef CONFIG_NET_POLL_CONTROLLER 1857 static void team_poll_controller(struct net_device *dev) 1858 { 1859 } 1860 1861 static void __team_netpoll_cleanup(struct team *team) 1862 { 1863 struct team_port *port; 1864 1865 list_for_each_entry(port, &team->port_list, list) 1866 team_port_disable_netpoll(port); 1867 } 1868 1869 static void team_netpoll_cleanup(struct net_device *dev) 1870 { 1871 struct team *team = netdev_priv(dev); 1872 1873 mutex_lock(&team->lock); 1874 __team_netpoll_cleanup(team); 1875 mutex_unlock(&team->lock); 1876 } 1877 1878 static int team_netpoll_setup(struct net_device *dev, 1879 struct netpoll_info *npifo) 1880 { 1881 struct team *team = netdev_priv(dev); 1882 struct team_port *port; 1883 int err = 0; 1884 1885 mutex_lock(&team->lock); 1886 list_for_each_entry(port, &team->port_list, list) { 1887 err = team_port_enable_netpoll(team, port); 1888 if (err) { 1889 __team_netpoll_cleanup(team); 1890 break; 1891 } 1892 } 1893 mutex_unlock(&team->lock); 1894 return err; 1895 } 1896 #endif 1897 1898 static int team_add_slave(struct net_device *dev, struct net_device *port_dev) 1899 { 1900 struct team *team = netdev_priv(dev); 1901 int err; 1902 1903 mutex_lock(&team->lock); 1904 err = team_port_add(team, port_dev); 1905 mutex_unlock(&team->lock); 1906 return err; 1907 } 1908 1909 static int team_del_slave(struct net_device *dev, struct net_device *port_dev) 1910 { 1911 struct team *team = netdev_priv(dev); 1912 int err; 1913 1914 mutex_lock(&team->lock); 1915 err = team_port_del(team, port_dev); 1916 mutex_unlock(&team->lock); 1917 return err; 1918 } 1919 1920 static netdev_features_t team_fix_features(struct net_device *dev, 1921 netdev_features_t features) 1922 { 1923 struct team_port *port; 1924 struct team *team = netdev_priv(dev); 1925 netdev_features_t mask; 1926 1927 mask = features | NETIF_F_HW_SWITCH_OFFLOAD; 1928 features &= ~NETIF_F_ONE_FOR_ALL; 1929 features |= NETIF_F_ALL_FOR_ALL; 1930 1931 rcu_read_lock(); 1932 list_for_each_entry_rcu(port, &team->port_list, list) { 1933 features = netdev_increment_features(features, 1934 port->dev->features, 1935 mask); 1936 } 1937 rcu_read_unlock(); 1938 1939 features = netdev_add_tso_features(features, mask); 1940 1941 return features; 1942 } 1943 1944 static int team_change_carrier(struct net_device *dev, bool new_carrier) 1945 { 1946 struct team *team = netdev_priv(dev); 1947 1948 team->user_carrier_enabled = true; 1949 1950 if (new_carrier) 1951 netif_carrier_on(dev); 1952 else 1953 netif_carrier_off(dev); 1954 return 0; 1955 } 1956 1957 static const struct net_device_ops team_netdev_ops = { 1958 .ndo_init = team_init, 1959 .ndo_uninit = team_uninit, 1960 .ndo_open = team_open, 1961 .ndo_stop = team_close, 1962 .ndo_start_xmit = team_xmit, 1963 .ndo_select_queue = team_select_queue, 1964 .ndo_change_rx_flags = team_change_rx_flags, 1965 .ndo_set_rx_mode = team_set_rx_mode, 1966 .ndo_set_mac_address = team_set_mac_address, 1967 .ndo_change_mtu = team_change_mtu, 1968 .ndo_get_stats64 = team_get_stats64, 1969 .ndo_vlan_rx_add_vid = team_vlan_rx_add_vid, 1970 .ndo_vlan_rx_kill_vid = team_vlan_rx_kill_vid, 1971 #ifdef CONFIG_NET_POLL_CONTROLLER 1972 .ndo_poll_controller = team_poll_controller, 1973 .ndo_netpoll_setup = team_netpoll_setup, 1974 .ndo_netpoll_cleanup = team_netpoll_cleanup, 1975 #endif 1976 .ndo_add_slave = team_add_slave, 1977 .ndo_del_slave = team_del_slave, 1978 .ndo_fix_features = team_fix_features, 1979 .ndo_change_carrier = team_change_carrier, 1980 .ndo_bridge_setlink = ndo_dflt_netdev_switch_port_bridge_setlink, 1981 .ndo_bridge_dellink = ndo_dflt_netdev_switch_port_bridge_dellink, 1982 }; 1983 1984 /*********************** 1985 * ethtool interface 1986 ***********************/ 1987 1988 static void team_ethtool_get_drvinfo(struct net_device *dev, 1989 struct ethtool_drvinfo *drvinfo) 1990 { 1991 strlcpy(drvinfo->driver, DRV_NAME, sizeof(drvinfo->driver)); 1992 strlcpy(drvinfo->version, UTS_RELEASE, sizeof(drvinfo->version)); 1993 } 1994 1995 static const struct ethtool_ops team_ethtool_ops = { 1996 .get_drvinfo = team_ethtool_get_drvinfo, 1997 .get_link = ethtool_op_get_link, 1998 }; 1999 2000 /*********************** 2001 * rt netlink interface 2002 ***********************/ 2003 2004 static void team_setup_by_port(struct net_device *dev, 2005 struct net_device *port_dev) 2006 { 2007 dev->header_ops = port_dev->header_ops; 2008 dev->type = port_dev->type; 2009 dev->hard_header_len = port_dev->hard_header_len; 2010 dev->addr_len = port_dev->addr_len; 2011 dev->mtu = port_dev->mtu; 2012 memcpy(dev->broadcast, port_dev->broadcast, port_dev->addr_len); 2013 eth_hw_addr_inherit(dev, port_dev); 2014 } 2015 2016 static int team_dev_type_check_change(struct net_device *dev, 2017 struct net_device *port_dev) 2018 { 2019 struct team *team = netdev_priv(dev); 2020 char *portname = port_dev->name; 2021 int err; 2022 2023 if (dev->type == port_dev->type) 2024 return 0; 2025 if (!list_empty(&team->port_list)) { 2026 netdev_err(dev, "Device %s is of different type\n", portname); 2027 return -EBUSY; 2028 } 2029 err = call_netdevice_notifiers(NETDEV_PRE_TYPE_CHANGE, dev); 2030 err = notifier_to_errno(err); 2031 if (err) { 2032 netdev_err(dev, "Refused to change device type\n"); 2033 return err; 2034 } 2035 dev_uc_flush(dev); 2036 dev_mc_flush(dev); 2037 team_setup_by_port(dev, port_dev); 2038 call_netdevice_notifiers(NETDEV_POST_TYPE_CHANGE, dev); 2039 return 0; 2040 } 2041 2042 static void team_setup(struct net_device *dev) 2043 { 2044 ether_setup(dev); 2045 2046 dev->netdev_ops = &team_netdev_ops; 2047 dev->ethtool_ops = &team_ethtool_ops; 2048 dev->destructor = team_destructor; 2049 dev->tx_queue_len = 0; 2050 dev->flags |= IFF_MULTICAST; 2051 dev->priv_flags &= ~(IFF_XMIT_DST_RELEASE | IFF_TX_SKB_SHARING); 2052 2053 /* 2054 * Indicate we support unicast address filtering. That way core won't 2055 * bring us to promisc mode in case a unicast addr is added. 2056 * Let this up to underlay drivers. 2057 */ 2058 dev->priv_flags |= IFF_UNICAST_FLT | IFF_LIVE_ADDR_CHANGE; 2059 2060 dev->features |= NETIF_F_LLTX; 2061 dev->features |= NETIF_F_GRO; 2062 2063 /* Don't allow team devices to change network namespaces. */ 2064 dev->features |= NETIF_F_NETNS_LOCAL; 2065 2066 dev->hw_features = TEAM_VLAN_FEATURES | 2067 NETIF_F_HW_VLAN_CTAG_TX | 2068 NETIF_F_HW_VLAN_CTAG_RX | 2069 NETIF_F_HW_VLAN_CTAG_FILTER; 2070 2071 dev->hw_features &= ~(NETIF_F_ALL_CSUM & ~NETIF_F_HW_CSUM); 2072 dev->features |= dev->hw_features; 2073 } 2074 2075 static int team_newlink(struct net *src_net, struct net_device *dev, 2076 struct nlattr *tb[], struct nlattr *data[]) 2077 { 2078 if (tb[IFLA_ADDRESS] == NULL) 2079 eth_hw_addr_random(dev); 2080 2081 return register_netdevice(dev); 2082 } 2083 2084 static int team_validate(struct nlattr *tb[], struct nlattr *data[]) 2085 { 2086 if (tb[IFLA_ADDRESS]) { 2087 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN) 2088 return -EINVAL; 2089 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS]))) 2090 return -EADDRNOTAVAIL; 2091 } 2092 return 0; 2093 } 2094 2095 static unsigned int team_get_num_tx_queues(void) 2096 { 2097 return TEAM_DEFAULT_NUM_TX_QUEUES; 2098 } 2099 2100 static unsigned int team_get_num_rx_queues(void) 2101 { 2102 return TEAM_DEFAULT_NUM_RX_QUEUES; 2103 } 2104 2105 static struct rtnl_link_ops team_link_ops __read_mostly = { 2106 .kind = DRV_NAME, 2107 .priv_size = sizeof(struct team), 2108 .setup = team_setup, 2109 .newlink = team_newlink, 2110 .validate = team_validate, 2111 .get_num_tx_queues = team_get_num_tx_queues, 2112 .get_num_rx_queues = team_get_num_rx_queues, 2113 }; 2114 2115 2116 /*********************************** 2117 * Generic netlink custom interface 2118 ***********************************/ 2119 2120 static struct genl_family team_nl_family = { 2121 .id = GENL_ID_GENERATE, 2122 .name = TEAM_GENL_NAME, 2123 .version = TEAM_GENL_VERSION, 2124 .maxattr = TEAM_ATTR_MAX, 2125 .netnsok = true, 2126 }; 2127 2128 static const struct nla_policy team_nl_policy[TEAM_ATTR_MAX + 1] = { 2129 [TEAM_ATTR_UNSPEC] = { .type = NLA_UNSPEC, }, 2130 [TEAM_ATTR_TEAM_IFINDEX] = { .type = NLA_U32 }, 2131 [TEAM_ATTR_LIST_OPTION] = { .type = NLA_NESTED }, 2132 [TEAM_ATTR_LIST_PORT] = { .type = NLA_NESTED }, 2133 }; 2134 2135 static const struct nla_policy 2136 team_nl_option_policy[TEAM_ATTR_OPTION_MAX + 1] = { 2137 [TEAM_ATTR_OPTION_UNSPEC] = { .type = NLA_UNSPEC, }, 2138 [TEAM_ATTR_OPTION_NAME] = { 2139 .type = NLA_STRING, 2140 .len = TEAM_STRING_MAX_LEN, 2141 }, 2142 [TEAM_ATTR_OPTION_CHANGED] = { .type = NLA_FLAG }, 2143 [TEAM_ATTR_OPTION_TYPE] = { .type = NLA_U8 }, 2144 [TEAM_ATTR_OPTION_DATA] = { .type = NLA_BINARY }, 2145 }; 2146 2147 static int team_nl_cmd_noop(struct sk_buff *skb, struct genl_info *info) 2148 { 2149 struct sk_buff *msg; 2150 void *hdr; 2151 int err; 2152 2153 msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL); 2154 if (!msg) 2155 return -ENOMEM; 2156 2157 hdr = genlmsg_put(msg, info->snd_portid, info->snd_seq, 2158 &team_nl_family, 0, TEAM_CMD_NOOP); 2159 if (!hdr) { 2160 err = -EMSGSIZE; 2161 goto err_msg_put; 2162 } 2163 2164 genlmsg_end(msg, hdr); 2165 2166 return genlmsg_unicast(genl_info_net(info), msg, info->snd_portid); 2167 2168 err_msg_put: 2169 nlmsg_free(msg); 2170 2171 return err; 2172 } 2173 2174 /* 2175 * Netlink cmd functions should be locked by following two functions. 2176 * Since dev gets held here, that ensures dev won't disappear in between. 2177 */ 2178 static struct team *team_nl_team_get(struct genl_info *info) 2179 { 2180 struct net *net = genl_info_net(info); 2181 int ifindex; 2182 struct net_device *dev; 2183 struct team *team; 2184 2185 if (!info->attrs[TEAM_ATTR_TEAM_IFINDEX]) 2186 return NULL; 2187 2188 ifindex = nla_get_u32(info->attrs[TEAM_ATTR_TEAM_IFINDEX]); 2189 dev = dev_get_by_index(net, ifindex); 2190 if (!dev || dev->netdev_ops != &team_netdev_ops) { 2191 if (dev) 2192 dev_put(dev); 2193 return NULL; 2194 } 2195 2196 team = netdev_priv(dev); 2197 mutex_lock(&team->lock); 2198 return team; 2199 } 2200 2201 static void team_nl_team_put(struct team *team) 2202 { 2203 mutex_unlock(&team->lock); 2204 dev_put(team->dev); 2205 } 2206 2207 typedef int team_nl_send_func_t(struct sk_buff *skb, 2208 struct team *team, u32 portid); 2209 2210 static int team_nl_send_unicast(struct sk_buff *skb, struct team *team, u32 portid) 2211 { 2212 return genlmsg_unicast(dev_net(team->dev), skb, portid); 2213 } 2214 2215 static int team_nl_fill_one_option_get(struct sk_buff *skb, struct team *team, 2216 struct team_option_inst *opt_inst) 2217 { 2218 struct nlattr *option_item; 2219 struct team_option *option = opt_inst->option; 2220 struct team_option_inst_info *opt_inst_info = &opt_inst->info; 2221 struct team_gsetter_ctx ctx; 2222 int err; 2223 2224 ctx.info = opt_inst_info; 2225 err = team_option_get(team, opt_inst, &ctx); 2226 if (err) 2227 return err; 2228 2229 option_item = nla_nest_start(skb, TEAM_ATTR_ITEM_OPTION); 2230 if (!option_item) 2231 return -EMSGSIZE; 2232 2233 if (nla_put_string(skb, TEAM_ATTR_OPTION_NAME, option->name)) 2234 goto nest_cancel; 2235 if (opt_inst_info->port && 2236 nla_put_u32(skb, TEAM_ATTR_OPTION_PORT_IFINDEX, 2237 opt_inst_info->port->dev->ifindex)) 2238 goto nest_cancel; 2239 if (opt_inst->option->array_size && 2240 nla_put_u32(skb, TEAM_ATTR_OPTION_ARRAY_INDEX, 2241 opt_inst_info->array_index)) 2242 goto nest_cancel; 2243 2244 switch (option->type) { 2245 case TEAM_OPTION_TYPE_U32: 2246 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_U32)) 2247 goto nest_cancel; 2248 if (nla_put_u32(skb, TEAM_ATTR_OPTION_DATA, ctx.data.u32_val)) 2249 goto nest_cancel; 2250 break; 2251 case TEAM_OPTION_TYPE_STRING: 2252 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_STRING)) 2253 goto nest_cancel; 2254 if (nla_put_string(skb, TEAM_ATTR_OPTION_DATA, 2255 ctx.data.str_val)) 2256 goto nest_cancel; 2257 break; 2258 case TEAM_OPTION_TYPE_BINARY: 2259 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_BINARY)) 2260 goto nest_cancel; 2261 if (nla_put(skb, TEAM_ATTR_OPTION_DATA, ctx.data.bin_val.len, 2262 ctx.data.bin_val.ptr)) 2263 goto nest_cancel; 2264 break; 2265 case TEAM_OPTION_TYPE_BOOL: 2266 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_FLAG)) 2267 goto nest_cancel; 2268 if (ctx.data.bool_val && 2269 nla_put_flag(skb, TEAM_ATTR_OPTION_DATA)) 2270 goto nest_cancel; 2271 break; 2272 case TEAM_OPTION_TYPE_S32: 2273 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_S32)) 2274 goto nest_cancel; 2275 if (nla_put_s32(skb, TEAM_ATTR_OPTION_DATA, ctx.data.s32_val)) 2276 goto nest_cancel; 2277 break; 2278 default: 2279 BUG(); 2280 } 2281 if (opt_inst->removed && nla_put_flag(skb, TEAM_ATTR_OPTION_REMOVED)) 2282 goto nest_cancel; 2283 if (opt_inst->changed) { 2284 if (nla_put_flag(skb, TEAM_ATTR_OPTION_CHANGED)) 2285 goto nest_cancel; 2286 opt_inst->changed = false; 2287 } 2288 nla_nest_end(skb, option_item); 2289 return 0; 2290 2291 nest_cancel: 2292 nla_nest_cancel(skb, option_item); 2293 return -EMSGSIZE; 2294 } 2295 2296 static int __send_and_alloc_skb(struct sk_buff **pskb, 2297 struct team *team, u32 portid, 2298 team_nl_send_func_t *send_func) 2299 { 2300 int err; 2301 2302 if (*pskb) { 2303 err = send_func(*pskb, team, portid); 2304 if (err) 2305 return err; 2306 } 2307 *pskb = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL); 2308 if (!*pskb) 2309 return -ENOMEM; 2310 return 0; 2311 } 2312 2313 static int team_nl_send_options_get(struct team *team, u32 portid, u32 seq, 2314 int flags, team_nl_send_func_t *send_func, 2315 struct list_head *sel_opt_inst_list) 2316 { 2317 struct nlattr *option_list; 2318 struct nlmsghdr *nlh; 2319 void *hdr; 2320 struct team_option_inst *opt_inst; 2321 int err; 2322 struct sk_buff *skb = NULL; 2323 bool incomplete; 2324 int i; 2325 2326 opt_inst = list_first_entry(sel_opt_inst_list, 2327 struct team_option_inst, tmp_list); 2328 2329 start_again: 2330 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2331 if (err) 2332 return err; 2333 2334 hdr = genlmsg_put(skb, portid, seq, &team_nl_family, flags | NLM_F_MULTI, 2335 TEAM_CMD_OPTIONS_GET); 2336 if (!hdr) 2337 return -EMSGSIZE; 2338 2339 if (nla_put_u32(skb, TEAM_ATTR_TEAM_IFINDEX, team->dev->ifindex)) 2340 goto nla_put_failure; 2341 option_list = nla_nest_start(skb, TEAM_ATTR_LIST_OPTION); 2342 if (!option_list) 2343 goto nla_put_failure; 2344 2345 i = 0; 2346 incomplete = false; 2347 list_for_each_entry_from(opt_inst, sel_opt_inst_list, tmp_list) { 2348 err = team_nl_fill_one_option_get(skb, team, opt_inst); 2349 if (err) { 2350 if (err == -EMSGSIZE) { 2351 if (!i) 2352 goto errout; 2353 incomplete = true; 2354 break; 2355 } 2356 goto errout; 2357 } 2358 i++; 2359 } 2360 2361 nla_nest_end(skb, option_list); 2362 genlmsg_end(skb, hdr); 2363 if (incomplete) 2364 goto start_again; 2365 2366 send_done: 2367 nlh = nlmsg_put(skb, portid, seq, NLMSG_DONE, 0, flags | NLM_F_MULTI); 2368 if (!nlh) { 2369 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2370 if (err) 2371 goto errout; 2372 goto send_done; 2373 } 2374 2375 return send_func(skb, team, portid); 2376 2377 nla_put_failure: 2378 err = -EMSGSIZE; 2379 errout: 2380 genlmsg_cancel(skb, hdr); 2381 nlmsg_free(skb); 2382 return err; 2383 } 2384 2385 static int team_nl_cmd_options_get(struct sk_buff *skb, struct genl_info *info) 2386 { 2387 struct team *team; 2388 struct team_option_inst *opt_inst; 2389 int err; 2390 LIST_HEAD(sel_opt_inst_list); 2391 2392 team = team_nl_team_get(info); 2393 if (!team) 2394 return -EINVAL; 2395 2396 list_for_each_entry(opt_inst, &team->option_inst_list, list) 2397 list_add_tail(&opt_inst->tmp_list, &sel_opt_inst_list); 2398 err = team_nl_send_options_get(team, info->snd_portid, info->snd_seq, 2399 NLM_F_ACK, team_nl_send_unicast, 2400 &sel_opt_inst_list); 2401 2402 team_nl_team_put(team); 2403 2404 return err; 2405 } 2406 2407 static int team_nl_send_event_options_get(struct team *team, 2408 struct list_head *sel_opt_inst_list); 2409 2410 static int team_nl_cmd_options_set(struct sk_buff *skb, struct genl_info *info) 2411 { 2412 struct team *team; 2413 int err = 0; 2414 int i; 2415 struct nlattr *nl_option; 2416 LIST_HEAD(opt_inst_list); 2417 2418 team = team_nl_team_get(info); 2419 if (!team) 2420 return -EINVAL; 2421 2422 err = -EINVAL; 2423 if (!info->attrs[TEAM_ATTR_LIST_OPTION]) { 2424 err = -EINVAL; 2425 goto team_put; 2426 } 2427 2428 nla_for_each_nested(nl_option, info->attrs[TEAM_ATTR_LIST_OPTION], i) { 2429 struct nlattr *opt_attrs[TEAM_ATTR_OPTION_MAX + 1]; 2430 struct nlattr *attr; 2431 struct nlattr *attr_data; 2432 enum team_option_type opt_type; 2433 int opt_port_ifindex = 0; /* != 0 for per-port options */ 2434 u32 opt_array_index = 0; 2435 bool opt_is_array = false; 2436 struct team_option_inst *opt_inst; 2437 char *opt_name; 2438 bool opt_found = false; 2439 2440 if (nla_type(nl_option) != TEAM_ATTR_ITEM_OPTION) { 2441 err = -EINVAL; 2442 goto team_put; 2443 } 2444 err = nla_parse_nested(opt_attrs, TEAM_ATTR_OPTION_MAX, 2445 nl_option, team_nl_option_policy); 2446 if (err) 2447 goto team_put; 2448 if (!opt_attrs[TEAM_ATTR_OPTION_NAME] || 2449 !opt_attrs[TEAM_ATTR_OPTION_TYPE]) { 2450 err = -EINVAL; 2451 goto team_put; 2452 } 2453 switch (nla_get_u8(opt_attrs[TEAM_ATTR_OPTION_TYPE])) { 2454 case NLA_U32: 2455 opt_type = TEAM_OPTION_TYPE_U32; 2456 break; 2457 case NLA_STRING: 2458 opt_type = TEAM_OPTION_TYPE_STRING; 2459 break; 2460 case NLA_BINARY: 2461 opt_type = TEAM_OPTION_TYPE_BINARY; 2462 break; 2463 case NLA_FLAG: 2464 opt_type = TEAM_OPTION_TYPE_BOOL; 2465 break; 2466 case NLA_S32: 2467 opt_type = TEAM_OPTION_TYPE_S32; 2468 break; 2469 default: 2470 goto team_put; 2471 } 2472 2473 attr_data = opt_attrs[TEAM_ATTR_OPTION_DATA]; 2474 if (opt_type != TEAM_OPTION_TYPE_BOOL && !attr_data) { 2475 err = -EINVAL; 2476 goto team_put; 2477 } 2478 2479 opt_name = nla_data(opt_attrs[TEAM_ATTR_OPTION_NAME]); 2480 attr = opt_attrs[TEAM_ATTR_OPTION_PORT_IFINDEX]; 2481 if (attr) 2482 opt_port_ifindex = nla_get_u32(attr); 2483 2484 attr = opt_attrs[TEAM_ATTR_OPTION_ARRAY_INDEX]; 2485 if (attr) { 2486 opt_is_array = true; 2487 opt_array_index = nla_get_u32(attr); 2488 } 2489 2490 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 2491 struct team_option *option = opt_inst->option; 2492 struct team_gsetter_ctx ctx; 2493 struct team_option_inst_info *opt_inst_info; 2494 int tmp_ifindex; 2495 2496 opt_inst_info = &opt_inst->info; 2497 tmp_ifindex = opt_inst_info->port ? 2498 opt_inst_info->port->dev->ifindex : 0; 2499 if (option->type != opt_type || 2500 strcmp(option->name, opt_name) || 2501 tmp_ifindex != opt_port_ifindex || 2502 (option->array_size && !opt_is_array) || 2503 opt_inst_info->array_index != opt_array_index) 2504 continue; 2505 opt_found = true; 2506 ctx.info = opt_inst_info; 2507 switch (opt_type) { 2508 case TEAM_OPTION_TYPE_U32: 2509 ctx.data.u32_val = nla_get_u32(attr_data); 2510 break; 2511 case TEAM_OPTION_TYPE_STRING: 2512 if (nla_len(attr_data) > TEAM_STRING_MAX_LEN) { 2513 err = -EINVAL; 2514 goto team_put; 2515 } 2516 ctx.data.str_val = nla_data(attr_data); 2517 break; 2518 case TEAM_OPTION_TYPE_BINARY: 2519 ctx.data.bin_val.len = nla_len(attr_data); 2520 ctx.data.bin_val.ptr = nla_data(attr_data); 2521 break; 2522 case TEAM_OPTION_TYPE_BOOL: 2523 ctx.data.bool_val = attr_data ? true : false; 2524 break; 2525 case TEAM_OPTION_TYPE_S32: 2526 ctx.data.s32_val = nla_get_s32(attr_data); 2527 break; 2528 default: 2529 BUG(); 2530 } 2531 err = team_option_set(team, opt_inst, &ctx); 2532 if (err) 2533 goto team_put; 2534 opt_inst->changed = true; 2535 list_add(&opt_inst->tmp_list, &opt_inst_list); 2536 } 2537 if (!opt_found) { 2538 err = -ENOENT; 2539 goto team_put; 2540 } 2541 } 2542 2543 err = team_nl_send_event_options_get(team, &opt_inst_list); 2544 2545 team_put: 2546 team_nl_team_put(team); 2547 2548 return err; 2549 } 2550 2551 static int team_nl_fill_one_port_get(struct sk_buff *skb, 2552 struct team_port *port) 2553 { 2554 struct nlattr *port_item; 2555 2556 port_item = nla_nest_start(skb, TEAM_ATTR_ITEM_PORT); 2557 if (!port_item) 2558 goto nest_cancel; 2559 if (nla_put_u32(skb, TEAM_ATTR_PORT_IFINDEX, port->dev->ifindex)) 2560 goto nest_cancel; 2561 if (port->changed) { 2562 if (nla_put_flag(skb, TEAM_ATTR_PORT_CHANGED)) 2563 goto nest_cancel; 2564 port->changed = false; 2565 } 2566 if ((port->removed && 2567 nla_put_flag(skb, TEAM_ATTR_PORT_REMOVED)) || 2568 (port->state.linkup && 2569 nla_put_flag(skb, TEAM_ATTR_PORT_LINKUP)) || 2570 nla_put_u32(skb, TEAM_ATTR_PORT_SPEED, port->state.speed) || 2571 nla_put_u8(skb, TEAM_ATTR_PORT_DUPLEX, port->state.duplex)) 2572 goto nest_cancel; 2573 nla_nest_end(skb, port_item); 2574 return 0; 2575 2576 nest_cancel: 2577 nla_nest_cancel(skb, port_item); 2578 return -EMSGSIZE; 2579 } 2580 2581 static int team_nl_send_port_list_get(struct team *team, u32 portid, u32 seq, 2582 int flags, team_nl_send_func_t *send_func, 2583 struct team_port *one_port) 2584 { 2585 struct nlattr *port_list; 2586 struct nlmsghdr *nlh; 2587 void *hdr; 2588 struct team_port *port; 2589 int err; 2590 struct sk_buff *skb = NULL; 2591 bool incomplete; 2592 int i; 2593 2594 port = list_first_entry_or_null(&team->port_list, 2595 struct team_port, list); 2596 2597 start_again: 2598 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2599 if (err) 2600 return err; 2601 2602 hdr = genlmsg_put(skb, portid, seq, &team_nl_family, flags | NLM_F_MULTI, 2603 TEAM_CMD_PORT_LIST_GET); 2604 if (!hdr) 2605 return -EMSGSIZE; 2606 2607 if (nla_put_u32(skb, TEAM_ATTR_TEAM_IFINDEX, team->dev->ifindex)) 2608 goto nla_put_failure; 2609 port_list = nla_nest_start(skb, TEAM_ATTR_LIST_PORT); 2610 if (!port_list) 2611 goto nla_put_failure; 2612 2613 i = 0; 2614 incomplete = false; 2615 2616 /* If one port is selected, called wants to send port list containing 2617 * only this port. Otherwise go through all listed ports and send all 2618 */ 2619 if (one_port) { 2620 err = team_nl_fill_one_port_get(skb, one_port); 2621 if (err) 2622 goto errout; 2623 } else if (port) { 2624 list_for_each_entry_from(port, &team->port_list, list) { 2625 err = team_nl_fill_one_port_get(skb, port); 2626 if (err) { 2627 if (err == -EMSGSIZE) { 2628 if (!i) 2629 goto errout; 2630 incomplete = true; 2631 break; 2632 } 2633 goto errout; 2634 } 2635 i++; 2636 } 2637 } 2638 2639 nla_nest_end(skb, port_list); 2640 genlmsg_end(skb, hdr); 2641 if (incomplete) 2642 goto start_again; 2643 2644 send_done: 2645 nlh = nlmsg_put(skb, portid, seq, NLMSG_DONE, 0, flags | NLM_F_MULTI); 2646 if (!nlh) { 2647 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2648 if (err) 2649 goto errout; 2650 goto send_done; 2651 } 2652 2653 return send_func(skb, team, portid); 2654 2655 nla_put_failure: 2656 err = -EMSGSIZE; 2657 errout: 2658 genlmsg_cancel(skb, hdr); 2659 nlmsg_free(skb); 2660 return err; 2661 } 2662 2663 static int team_nl_cmd_port_list_get(struct sk_buff *skb, 2664 struct genl_info *info) 2665 { 2666 struct team *team; 2667 int err; 2668 2669 team = team_nl_team_get(info); 2670 if (!team) 2671 return -EINVAL; 2672 2673 err = team_nl_send_port_list_get(team, info->snd_portid, info->snd_seq, 2674 NLM_F_ACK, team_nl_send_unicast, NULL); 2675 2676 team_nl_team_put(team); 2677 2678 return err; 2679 } 2680 2681 static const struct genl_ops team_nl_ops[] = { 2682 { 2683 .cmd = TEAM_CMD_NOOP, 2684 .doit = team_nl_cmd_noop, 2685 .policy = team_nl_policy, 2686 }, 2687 { 2688 .cmd = TEAM_CMD_OPTIONS_SET, 2689 .doit = team_nl_cmd_options_set, 2690 .policy = team_nl_policy, 2691 .flags = GENL_ADMIN_PERM, 2692 }, 2693 { 2694 .cmd = TEAM_CMD_OPTIONS_GET, 2695 .doit = team_nl_cmd_options_get, 2696 .policy = team_nl_policy, 2697 .flags = GENL_ADMIN_PERM, 2698 }, 2699 { 2700 .cmd = TEAM_CMD_PORT_LIST_GET, 2701 .doit = team_nl_cmd_port_list_get, 2702 .policy = team_nl_policy, 2703 .flags = GENL_ADMIN_PERM, 2704 }, 2705 }; 2706 2707 static const struct genl_multicast_group team_nl_mcgrps[] = { 2708 { .name = TEAM_GENL_CHANGE_EVENT_MC_GRP_NAME, }, 2709 }; 2710 2711 static int team_nl_send_multicast(struct sk_buff *skb, 2712 struct team *team, u32 portid) 2713 { 2714 return genlmsg_multicast_netns(&team_nl_family, dev_net(team->dev), 2715 skb, 0, 0, GFP_KERNEL); 2716 } 2717 2718 static int team_nl_send_event_options_get(struct team *team, 2719 struct list_head *sel_opt_inst_list) 2720 { 2721 return team_nl_send_options_get(team, 0, 0, 0, team_nl_send_multicast, 2722 sel_opt_inst_list); 2723 } 2724 2725 static int team_nl_send_event_port_get(struct team *team, 2726 struct team_port *port) 2727 { 2728 return team_nl_send_port_list_get(team, 0, 0, 0, team_nl_send_multicast, 2729 port); 2730 } 2731 2732 static int team_nl_init(void) 2733 { 2734 return genl_register_family_with_ops_groups(&team_nl_family, team_nl_ops, 2735 team_nl_mcgrps); 2736 } 2737 2738 static void team_nl_fini(void) 2739 { 2740 genl_unregister_family(&team_nl_family); 2741 } 2742 2743 2744 /****************** 2745 * Change checkers 2746 ******************/ 2747 2748 static void __team_options_change_check(struct team *team) 2749 { 2750 int err; 2751 struct team_option_inst *opt_inst; 2752 LIST_HEAD(sel_opt_inst_list); 2753 2754 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 2755 if (opt_inst->changed) 2756 list_add_tail(&opt_inst->tmp_list, &sel_opt_inst_list); 2757 } 2758 err = team_nl_send_event_options_get(team, &sel_opt_inst_list); 2759 if (err && err != -ESRCH) 2760 netdev_warn(team->dev, "Failed to send options change via netlink (err %d)\n", 2761 err); 2762 } 2763 2764 /* rtnl lock is held */ 2765 2766 static void __team_port_change_send(struct team_port *port, bool linkup) 2767 { 2768 int err; 2769 2770 port->changed = true; 2771 port->state.linkup = linkup; 2772 team_refresh_port_linkup(port); 2773 if (linkup) { 2774 struct ethtool_cmd ecmd; 2775 2776 err = __ethtool_get_settings(port->dev, &ecmd); 2777 if (!err) { 2778 port->state.speed = ethtool_cmd_speed(&ecmd); 2779 port->state.duplex = ecmd.duplex; 2780 goto send_event; 2781 } 2782 } 2783 port->state.speed = 0; 2784 port->state.duplex = 0; 2785 2786 send_event: 2787 err = team_nl_send_event_port_get(port->team, port); 2788 if (err && err != -ESRCH) 2789 netdev_warn(port->team->dev, "Failed to send port change of device %s via netlink (err %d)\n", 2790 port->dev->name, err); 2791 2792 } 2793 2794 static void __team_carrier_check(struct team *team) 2795 { 2796 struct team_port *port; 2797 bool team_linkup; 2798 2799 if (team->user_carrier_enabled) 2800 return; 2801 2802 team_linkup = false; 2803 list_for_each_entry(port, &team->port_list, list) { 2804 if (port->linkup) { 2805 team_linkup = true; 2806 break; 2807 } 2808 } 2809 2810 if (team_linkup) 2811 netif_carrier_on(team->dev); 2812 else 2813 netif_carrier_off(team->dev); 2814 } 2815 2816 static void __team_port_change_check(struct team_port *port, bool linkup) 2817 { 2818 if (port->state.linkup != linkup) 2819 __team_port_change_send(port, linkup); 2820 __team_carrier_check(port->team); 2821 } 2822 2823 static void __team_port_change_port_added(struct team_port *port, bool linkup) 2824 { 2825 __team_port_change_send(port, linkup); 2826 __team_carrier_check(port->team); 2827 } 2828 2829 static void __team_port_change_port_removed(struct team_port *port) 2830 { 2831 port->removed = true; 2832 __team_port_change_send(port, false); 2833 __team_carrier_check(port->team); 2834 } 2835 2836 static void team_port_change_check(struct team_port *port, bool linkup) 2837 { 2838 struct team *team = port->team; 2839 2840 mutex_lock(&team->lock); 2841 __team_port_change_check(port, linkup); 2842 mutex_unlock(&team->lock); 2843 } 2844 2845 2846 /************************************ 2847 * Net device notifier event handler 2848 ************************************/ 2849 2850 static int team_device_event(struct notifier_block *unused, 2851 unsigned long event, void *ptr) 2852 { 2853 struct net_device *dev = netdev_notifier_info_to_dev(ptr); 2854 struct team_port *port; 2855 2856 port = team_port_get_rtnl(dev); 2857 if (!port) 2858 return NOTIFY_DONE; 2859 2860 switch (event) { 2861 case NETDEV_UP: 2862 if (netif_carrier_ok(dev)) 2863 team_port_change_check(port, true); 2864 break; 2865 case NETDEV_DOWN: 2866 team_port_change_check(port, false); 2867 break; 2868 case NETDEV_CHANGE: 2869 if (netif_running(port->dev)) 2870 team_port_change_check(port, 2871 !!netif_carrier_ok(port->dev)); 2872 break; 2873 case NETDEV_UNREGISTER: 2874 team_del_slave(port->team->dev, dev); 2875 break; 2876 case NETDEV_FEAT_CHANGE: 2877 team_compute_features(port->team); 2878 break; 2879 case NETDEV_PRECHANGEMTU: 2880 /* Forbid to change mtu of underlaying device */ 2881 if (!port->team->port_mtu_change_allowed) 2882 return NOTIFY_BAD; 2883 break; 2884 case NETDEV_PRE_TYPE_CHANGE: 2885 /* Forbid to change type of underlaying device */ 2886 return NOTIFY_BAD; 2887 case NETDEV_RESEND_IGMP: 2888 /* Propagate to master device */ 2889 call_netdevice_notifiers(event, port->team->dev); 2890 break; 2891 } 2892 return NOTIFY_DONE; 2893 } 2894 2895 static struct notifier_block team_notifier_block __read_mostly = { 2896 .notifier_call = team_device_event, 2897 }; 2898 2899 2900 /*********************** 2901 * Module init and exit 2902 ***********************/ 2903 2904 static int __init team_module_init(void) 2905 { 2906 int err; 2907 2908 register_netdevice_notifier(&team_notifier_block); 2909 2910 err = rtnl_link_register(&team_link_ops); 2911 if (err) 2912 goto err_rtnl_reg; 2913 2914 err = team_nl_init(); 2915 if (err) 2916 goto err_nl_init; 2917 2918 return 0; 2919 2920 err_nl_init: 2921 rtnl_link_unregister(&team_link_ops); 2922 2923 err_rtnl_reg: 2924 unregister_netdevice_notifier(&team_notifier_block); 2925 2926 return err; 2927 } 2928 2929 static void __exit team_module_exit(void) 2930 { 2931 team_nl_fini(); 2932 rtnl_link_unregister(&team_link_ops); 2933 unregister_netdevice_notifier(&team_notifier_block); 2934 } 2935 2936 module_init(team_module_init); 2937 module_exit(team_module_exit); 2938 2939 MODULE_LICENSE("GPL v2"); 2940 MODULE_AUTHOR("Jiri Pirko <jpirko@redhat.com>"); 2941 MODULE_DESCRIPTION("Ethernet team device driver"); 2942 MODULE_ALIAS_RTNL_LINK(DRV_NAME); 2943