1 /* 2 * drivers/net/team/team.c - Network team device driver 3 * Copyright (c) 2011 Jiri Pirko <jpirko@redhat.com> 4 * 5 * This program is free software; you can redistribute it and/or modify 6 * it under the terms of the GNU General Public License as published by 7 * the Free Software Foundation; either version 2 of the License, or 8 * (at your option) any later version. 9 */ 10 11 #include <linux/kernel.h> 12 #include <linux/types.h> 13 #include <linux/module.h> 14 #include <linux/init.h> 15 #include <linux/slab.h> 16 #include <linux/rcupdate.h> 17 #include <linux/errno.h> 18 #include <linux/ctype.h> 19 #include <linux/notifier.h> 20 #include <linux/netdevice.h> 21 #include <linux/netpoll.h> 22 #include <linux/if_vlan.h> 23 #include <linux/if_arp.h> 24 #include <linux/socket.h> 25 #include <linux/etherdevice.h> 26 #include <linux/rtnetlink.h> 27 #include <net/rtnetlink.h> 28 #include <net/genetlink.h> 29 #include <net/netlink.h> 30 #include <net/sch_generic.h> 31 #include <generated/utsrelease.h> 32 #include <linux/if_team.h> 33 34 #define DRV_NAME "team" 35 36 37 /********** 38 * Helpers 39 **********/ 40 41 #define team_port_exists(dev) (dev->priv_flags & IFF_TEAM_PORT) 42 43 static struct team_port *team_port_get_rcu(const struct net_device *dev) 44 { 45 struct team_port *port = rcu_dereference(dev->rx_handler_data); 46 47 return team_port_exists(dev) ? port : NULL; 48 } 49 50 static struct team_port *team_port_get_rtnl(const struct net_device *dev) 51 { 52 struct team_port *port = rtnl_dereference(dev->rx_handler_data); 53 54 return team_port_exists(dev) ? port : NULL; 55 } 56 57 /* 58 * Since the ability to change device address for open port device is tested in 59 * team_port_add, this function can be called without control of return value 60 */ 61 static int __set_port_dev_addr(struct net_device *port_dev, 62 const unsigned char *dev_addr) 63 { 64 struct sockaddr addr; 65 66 memcpy(addr.sa_data, dev_addr, port_dev->addr_len); 67 addr.sa_family = port_dev->type; 68 return dev_set_mac_address(port_dev, &addr); 69 } 70 71 static int team_port_set_orig_dev_addr(struct team_port *port) 72 { 73 return __set_port_dev_addr(port->dev, port->orig.dev_addr); 74 } 75 76 static int team_port_set_team_dev_addr(struct team *team, 77 struct team_port *port) 78 { 79 return __set_port_dev_addr(port->dev, team->dev->dev_addr); 80 } 81 82 int team_modeop_port_enter(struct team *team, struct team_port *port) 83 { 84 return team_port_set_team_dev_addr(team, port); 85 } 86 EXPORT_SYMBOL(team_modeop_port_enter); 87 88 void team_modeop_port_change_dev_addr(struct team *team, 89 struct team_port *port) 90 { 91 team_port_set_team_dev_addr(team, port); 92 } 93 EXPORT_SYMBOL(team_modeop_port_change_dev_addr); 94 95 static void team_refresh_port_linkup(struct team_port *port) 96 { 97 port->linkup = port->user.linkup_enabled ? port->user.linkup : 98 port->state.linkup; 99 } 100 101 102 /******************* 103 * Options handling 104 *******************/ 105 106 struct team_option_inst { /* One for each option instance */ 107 struct list_head list; 108 struct list_head tmp_list; 109 struct team_option *option; 110 struct team_option_inst_info info; 111 bool changed; 112 bool removed; 113 }; 114 115 static struct team_option *__team_find_option(struct team *team, 116 const char *opt_name) 117 { 118 struct team_option *option; 119 120 list_for_each_entry(option, &team->option_list, list) { 121 if (strcmp(option->name, opt_name) == 0) 122 return option; 123 } 124 return NULL; 125 } 126 127 static void __team_option_inst_del(struct team_option_inst *opt_inst) 128 { 129 list_del(&opt_inst->list); 130 kfree(opt_inst); 131 } 132 133 static void __team_option_inst_del_option(struct team *team, 134 struct team_option *option) 135 { 136 struct team_option_inst *opt_inst, *tmp; 137 138 list_for_each_entry_safe(opt_inst, tmp, &team->option_inst_list, list) { 139 if (opt_inst->option == option) 140 __team_option_inst_del(opt_inst); 141 } 142 } 143 144 static int __team_option_inst_add(struct team *team, struct team_option *option, 145 struct team_port *port) 146 { 147 struct team_option_inst *opt_inst; 148 unsigned int array_size; 149 unsigned int i; 150 int err; 151 152 array_size = option->array_size; 153 if (!array_size) 154 array_size = 1; /* No array but still need one instance */ 155 156 for (i = 0; i < array_size; i++) { 157 opt_inst = kmalloc(sizeof(*opt_inst), GFP_KERNEL); 158 if (!opt_inst) 159 return -ENOMEM; 160 opt_inst->option = option; 161 opt_inst->info.port = port; 162 opt_inst->info.array_index = i; 163 opt_inst->changed = true; 164 opt_inst->removed = false; 165 list_add_tail(&opt_inst->list, &team->option_inst_list); 166 if (option->init) { 167 err = option->init(team, &opt_inst->info); 168 if (err) 169 return err; 170 } 171 172 } 173 return 0; 174 } 175 176 static int __team_option_inst_add_option(struct team *team, 177 struct team_option *option) 178 { 179 struct team_port *port; 180 int err; 181 182 if (!option->per_port) { 183 err = __team_option_inst_add(team, option, NULL); 184 if (err) 185 goto inst_del_option; 186 } 187 188 list_for_each_entry(port, &team->port_list, list) { 189 err = __team_option_inst_add(team, option, port); 190 if (err) 191 goto inst_del_option; 192 } 193 return 0; 194 195 inst_del_option: 196 __team_option_inst_del_option(team, option); 197 return err; 198 } 199 200 static void __team_option_inst_mark_removed_option(struct team *team, 201 struct team_option *option) 202 { 203 struct team_option_inst *opt_inst; 204 205 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 206 if (opt_inst->option == option) { 207 opt_inst->changed = true; 208 opt_inst->removed = true; 209 } 210 } 211 } 212 213 static void __team_option_inst_del_port(struct team *team, 214 struct team_port *port) 215 { 216 struct team_option_inst *opt_inst, *tmp; 217 218 list_for_each_entry_safe(opt_inst, tmp, &team->option_inst_list, list) { 219 if (opt_inst->option->per_port && 220 opt_inst->info.port == port) 221 __team_option_inst_del(opt_inst); 222 } 223 } 224 225 static int __team_option_inst_add_port(struct team *team, 226 struct team_port *port) 227 { 228 struct team_option *option; 229 int err; 230 231 list_for_each_entry(option, &team->option_list, list) { 232 if (!option->per_port) 233 continue; 234 err = __team_option_inst_add(team, option, port); 235 if (err) 236 goto inst_del_port; 237 } 238 return 0; 239 240 inst_del_port: 241 __team_option_inst_del_port(team, port); 242 return err; 243 } 244 245 static void __team_option_inst_mark_removed_port(struct team *team, 246 struct team_port *port) 247 { 248 struct team_option_inst *opt_inst; 249 250 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 251 if (opt_inst->info.port == port) { 252 opt_inst->changed = true; 253 opt_inst->removed = true; 254 } 255 } 256 } 257 258 static int __team_options_register(struct team *team, 259 const struct team_option *option, 260 size_t option_count) 261 { 262 int i; 263 struct team_option **dst_opts; 264 int err; 265 266 dst_opts = kzalloc(sizeof(struct team_option *) * option_count, 267 GFP_KERNEL); 268 if (!dst_opts) 269 return -ENOMEM; 270 for (i = 0; i < option_count; i++, option++) { 271 if (__team_find_option(team, option->name)) { 272 err = -EEXIST; 273 goto alloc_rollback; 274 } 275 dst_opts[i] = kmemdup(option, sizeof(*option), GFP_KERNEL); 276 if (!dst_opts[i]) { 277 err = -ENOMEM; 278 goto alloc_rollback; 279 } 280 } 281 282 for (i = 0; i < option_count; i++) { 283 err = __team_option_inst_add_option(team, dst_opts[i]); 284 if (err) 285 goto inst_rollback; 286 list_add_tail(&dst_opts[i]->list, &team->option_list); 287 } 288 289 kfree(dst_opts); 290 return 0; 291 292 inst_rollback: 293 for (i--; i >= 0; i--) 294 __team_option_inst_del_option(team, dst_opts[i]); 295 296 i = option_count - 1; 297 alloc_rollback: 298 for (i--; i >= 0; i--) 299 kfree(dst_opts[i]); 300 301 kfree(dst_opts); 302 return err; 303 } 304 305 static void __team_options_mark_removed(struct team *team, 306 const struct team_option *option, 307 size_t option_count) 308 { 309 int i; 310 311 for (i = 0; i < option_count; i++, option++) { 312 struct team_option *del_opt; 313 314 del_opt = __team_find_option(team, option->name); 315 if (del_opt) 316 __team_option_inst_mark_removed_option(team, del_opt); 317 } 318 } 319 320 static void __team_options_unregister(struct team *team, 321 const struct team_option *option, 322 size_t option_count) 323 { 324 int i; 325 326 for (i = 0; i < option_count; i++, option++) { 327 struct team_option *del_opt; 328 329 del_opt = __team_find_option(team, option->name); 330 if (del_opt) { 331 __team_option_inst_del_option(team, del_opt); 332 list_del(&del_opt->list); 333 kfree(del_opt); 334 } 335 } 336 } 337 338 static void __team_options_change_check(struct team *team); 339 340 int team_options_register(struct team *team, 341 const struct team_option *option, 342 size_t option_count) 343 { 344 int err; 345 346 err = __team_options_register(team, option, option_count); 347 if (err) 348 return err; 349 __team_options_change_check(team); 350 return 0; 351 } 352 EXPORT_SYMBOL(team_options_register); 353 354 void team_options_unregister(struct team *team, 355 const struct team_option *option, 356 size_t option_count) 357 { 358 __team_options_mark_removed(team, option, option_count); 359 __team_options_change_check(team); 360 __team_options_unregister(team, option, option_count); 361 } 362 EXPORT_SYMBOL(team_options_unregister); 363 364 static int team_option_get(struct team *team, 365 struct team_option_inst *opt_inst, 366 struct team_gsetter_ctx *ctx) 367 { 368 if (!opt_inst->option->getter) 369 return -EOPNOTSUPP; 370 return opt_inst->option->getter(team, ctx); 371 } 372 373 static int team_option_set(struct team *team, 374 struct team_option_inst *opt_inst, 375 struct team_gsetter_ctx *ctx) 376 { 377 if (!opt_inst->option->setter) 378 return -EOPNOTSUPP; 379 return opt_inst->option->setter(team, ctx); 380 } 381 382 void team_option_inst_set_change(struct team_option_inst_info *opt_inst_info) 383 { 384 struct team_option_inst *opt_inst; 385 386 opt_inst = container_of(opt_inst_info, struct team_option_inst, info); 387 opt_inst->changed = true; 388 } 389 EXPORT_SYMBOL(team_option_inst_set_change); 390 391 void team_options_change_check(struct team *team) 392 { 393 __team_options_change_check(team); 394 } 395 EXPORT_SYMBOL(team_options_change_check); 396 397 398 /**************** 399 * Mode handling 400 ****************/ 401 402 static LIST_HEAD(mode_list); 403 static DEFINE_SPINLOCK(mode_list_lock); 404 405 struct team_mode_item { 406 struct list_head list; 407 const struct team_mode *mode; 408 }; 409 410 static struct team_mode_item *__find_mode(const char *kind) 411 { 412 struct team_mode_item *mitem; 413 414 list_for_each_entry(mitem, &mode_list, list) { 415 if (strcmp(mitem->mode->kind, kind) == 0) 416 return mitem; 417 } 418 return NULL; 419 } 420 421 static bool is_good_mode_name(const char *name) 422 { 423 while (*name != '\0') { 424 if (!isalpha(*name) && !isdigit(*name) && *name != '_') 425 return false; 426 name++; 427 } 428 return true; 429 } 430 431 int team_mode_register(const struct team_mode *mode) 432 { 433 int err = 0; 434 struct team_mode_item *mitem; 435 436 if (!is_good_mode_name(mode->kind) || 437 mode->priv_size > TEAM_MODE_PRIV_SIZE) 438 return -EINVAL; 439 440 mitem = kmalloc(sizeof(*mitem), GFP_KERNEL); 441 if (!mitem) 442 return -ENOMEM; 443 444 spin_lock(&mode_list_lock); 445 if (__find_mode(mode->kind)) { 446 err = -EEXIST; 447 kfree(mitem); 448 goto unlock; 449 } 450 mitem->mode = mode; 451 list_add_tail(&mitem->list, &mode_list); 452 unlock: 453 spin_unlock(&mode_list_lock); 454 return err; 455 } 456 EXPORT_SYMBOL(team_mode_register); 457 458 void team_mode_unregister(const struct team_mode *mode) 459 { 460 struct team_mode_item *mitem; 461 462 spin_lock(&mode_list_lock); 463 mitem = __find_mode(mode->kind); 464 if (mitem) { 465 list_del_init(&mitem->list); 466 kfree(mitem); 467 } 468 spin_unlock(&mode_list_lock); 469 } 470 EXPORT_SYMBOL(team_mode_unregister); 471 472 static const struct team_mode *team_mode_get(const char *kind) 473 { 474 struct team_mode_item *mitem; 475 const struct team_mode *mode = NULL; 476 477 spin_lock(&mode_list_lock); 478 mitem = __find_mode(kind); 479 if (!mitem) { 480 spin_unlock(&mode_list_lock); 481 request_module("team-mode-%s", kind); 482 spin_lock(&mode_list_lock); 483 mitem = __find_mode(kind); 484 } 485 if (mitem) { 486 mode = mitem->mode; 487 if (!try_module_get(mode->owner)) 488 mode = NULL; 489 } 490 491 spin_unlock(&mode_list_lock); 492 return mode; 493 } 494 495 static void team_mode_put(const struct team_mode *mode) 496 { 497 module_put(mode->owner); 498 } 499 500 static bool team_dummy_transmit(struct team *team, struct sk_buff *skb) 501 { 502 dev_kfree_skb_any(skb); 503 return false; 504 } 505 506 static rx_handler_result_t team_dummy_receive(struct team *team, 507 struct team_port *port, 508 struct sk_buff *skb) 509 { 510 return RX_HANDLER_ANOTHER; 511 } 512 513 static const struct team_mode __team_no_mode = { 514 .kind = "*NOMODE*", 515 }; 516 517 static bool team_is_mode_set(struct team *team) 518 { 519 return team->mode != &__team_no_mode; 520 } 521 522 static void team_set_no_mode(struct team *team) 523 { 524 team->user_carrier_enabled = false; 525 team->mode = &__team_no_mode; 526 } 527 528 static void team_adjust_ops(struct team *team) 529 { 530 /* 531 * To avoid checks in rx/tx skb paths, ensure here that non-null and 532 * correct ops are always set. 533 */ 534 535 if (!team->en_port_count || !team_is_mode_set(team) || 536 !team->mode->ops->transmit) 537 team->ops.transmit = team_dummy_transmit; 538 else 539 team->ops.transmit = team->mode->ops->transmit; 540 541 if (!team->en_port_count || !team_is_mode_set(team) || 542 !team->mode->ops->receive) 543 team->ops.receive = team_dummy_receive; 544 else 545 team->ops.receive = team->mode->ops->receive; 546 } 547 548 /* 549 * We can benefit from the fact that it's ensured no port is present 550 * at the time of mode change. Therefore no packets are in fly so there's no 551 * need to set mode operations in any special way. 552 */ 553 static int __team_change_mode(struct team *team, 554 const struct team_mode *new_mode) 555 { 556 /* Check if mode was previously set and do cleanup if so */ 557 if (team_is_mode_set(team)) { 558 void (*exit_op)(struct team *team) = team->ops.exit; 559 560 /* Clear ops area so no callback is called any longer */ 561 memset(&team->ops, 0, sizeof(struct team_mode_ops)); 562 team_adjust_ops(team); 563 564 if (exit_op) 565 exit_op(team); 566 team_mode_put(team->mode); 567 team_set_no_mode(team); 568 /* zero private data area */ 569 memset(&team->mode_priv, 0, 570 sizeof(struct team) - offsetof(struct team, mode_priv)); 571 } 572 573 if (!new_mode) 574 return 0; 575 576 if (new_mode->ops->init) { 577 int err; 578 579 err = new_mode->ops->init(team); 580 if (err) 581 return err; 582 } 583 584 team->mode = new_mode; 585 memcpy(&team->ops, new_mode->ops, sizeof(struct team_mode_ops)); 586 team_adjust_ops(team); 587 588 return 0; 589 } 590 591 static int team_change_mode(struct team *team, const char *kind) 592 { 593 const struct team_mode *new_mode; 594 struct net_device *dev = team->dev; 595 int err; 596 597 if (!list_empty(&team->port_list)) { 598 netdev_err(dev, "No ports can be present during mode change\n"); 599 return -EBUSY; 600 } 601 602 if (team_is_mode_set(team) && strcmp(team->mode->kind, kind) == 0) { 603 netdev_err(dev, "Unable to change to the same mode the team is in\n"); 604 return -EINVAL; 605 } 606 607 new_mode = team_mode_get(kind); 608 if (!new_mode) { 609 netdev_err(dev, "Mode \"%s\" not found\n", kind); 610 return -EINVAL; 611 } 612 613 err = __team_change_mode(team, new_mode); 614 if (err) { 615 netdev_err(dev, "Failed to change to mode \"%s\"\n", kind); 616 team_mode_put(new_mode); 617 return err; 618 } 619 620 netdev_info(dev, "Mode changed to \"%s\"\n", kind); 621 return 0; 622 } 623 624 625 /********************* 626 * Peers notification 627 *********************/ 628 629 static void team_notify_peers_work(struct work_struct *work) 630 { 631 struct team *team; 632 int val; 633 634 team = container_of(work, struct team, notify_peers.dw.work); 635 636 if (!rtnl_trylock()) { 637 schedule_delayed_work(&team->notify_peers.dw, 0); 638 return; 639 } 640 val = atomic_dec_if_positive(&team->notify_peers.count_pending); 641 if (val < 0) { 642 rtnl_unlock(); 643 return; 644 } 645 call_netdevice_notifiers(NETDEV_NOTIFY_PEERS, team->dev); 646 rtnl_unlock(); 647 if (val) 648 schedule_delayed_work(&team->notify_peers.dw, 649 msecs_to_jiffies(team->notify_peers.interval)); 650 } 651 652 static void team_notify_peers(struct team *team) 653 { 654 if (!team->notify_peers.count || !netif_running(team->dev)) 655 return; 656 atomic_add(team->notify_peers.count, &team->notify_peers.count_pending); 657 schedule_delayed_work(&team->notify_peers.dw, 0); 658 } 659 660 static void team_notify_peers_init(struct team *team) 661 { 662 INIT_DELAYED_WORK(&team->notify_peers.dw, team_notify_peers_work); 663 } 664 665 static void team_notify_peers_fini(struct team *team) 666 { 667 cancel_delayed_work_sync(&team->notify_peers.dw); 668 } 669 670 671 /******************************* 672 * Send multicast group rejoins 673 *******************************/ 674 675 static void team_mcast_rejoin_work(struct work_struct *work) 676 { 677 struct team *team; 678 int val; 679 680 team = container_of(work, struct team, mcast_rejoin.dw.work); 681 682 if (!rtnl_trylock()) { 683 schedule_delayed_work(&team->mcast_rejoin.dw, 0); 684 return; 685 } 686 val = atomic_dec_if_positive(&team->mcast_rejoin.count_pending); 687 if (val < 0) { 688 rtnl_unlock(); 689 return; 690 } 691 call_netdevice_notifiers(NETDEV_RESEND_IGMP, team->dev); 692 rtnl_unlock(); 693 if (val) 694 schedule_delayed_work(&team->mcast_rejoin.dw, 695 msecs_to_jiffies(team->mcast_rejoin.interval)); 696 } 697 698 static void team_mcast_rejoin(struct team *team) 699 { 700 if (!team->mcast_rejoin.count || !netif_running(team->dev)) 701 return; 702 atomic_add(team->mcast_rejoin.count, &team->mcast_rejoin.count_pending); 703 schedule_delayed_work(&team->mcast_rejoin.dw, 0); 704 } 705 706 static void team_mcast_rejoin_init(struct team *team) 707 { 708 INIT_DELAYED_WORK(&team->mcast_rejoin.dw, team_mcast_rejoin_work); 709 } 710 711 static void team_mcast_rejoin_fini(struct team *team) 712 { 713 cancel_delayed_work_sync(&team->mcast_rejoin.dw); 714 } 715 716 717 /************************ 718 * Rx path frame handler 719 ************************/ 720 721 /* note: already called with rcu_read_lock */ 722 static rx_handler_result_t team_handle_frame(struct sk_buff **pskb) 723 { 724 struct sk_buff *skb = *pskb; 725 struct team_port *port; 726 struct team *team; 727 rx_handler_result_t res; 728 729 skb = skb_share_check(skb, GFP_ATOMIC); 730 if (!skb) 731 return RX_HANDLER_CONSUMED; 732 733 *pskb = skb; 734 735 port = team_port_get_rcu(skb->dev); 736 team = port->team; 737 if (!team_port_enabled(port)) { 738 /* allow exact match delivery for disabled ports */ 739 res = RX_HANDLER_EXACT; 740 } else { 741 res = team->ops.receive(team, port, skb); 742 } 743 if (res == RX_HANDLER_ANOTHER) { 744 struct team_pcpu_stats *pcpu_stats; 745 746 pcpu_stats = this_cpu_ptr(team->pcpu_stats); 747 u64_stats_update_begin(&pcpu_stats->syncp); 748 pcpu_stats->rx_packets++; 749 pcpu_stats->rx_bytes += skb->len; 750 if (skb->pkt_type == PACKET_MULTICAST) 751 pcpu_stats->rx_multicast++; 752 u64_stats_update_end(&pcpu_stats->syncp); 753 754 skb->dev = team->dev; 755 } else { 756 this_cpu_inc(team->pcpu_stats->rx_dropped); 757 } 758 759 return res; 760 } 761 762 763 /************************************* 764 * Multiqueue Tx port select override 765 *************************************/ 766 767 static int team_queue_override_init(struct team *team) 768 { 769 struct list_head *listarr; 770 unsigned int queue_cnt = team->dev->num_tx_queues - 1; 771 unsigned int i; 772 773 if (!queue_cnt) 774 return 0; 775 listarr = kmalloc(sizeof(struct list_head) * queue_cnt, GFP_KERNEL); 776 if (!listarr) 777 return -ENOMEM; 778 team->qom_lists = listarr; 779 for (i = 0; i < queue_cnt; i++) 780 INIT_LIST_HEAD(listarr++); 781 return 0; 782 } 783 784 static void team_queue_override_fini(struct team *team) 785 { 786 kfree(team->qom_lists); 787 } 788 789 static struct list_head *__team_get_qom_list(struct team *team, u16 queue_id) 790 { 791 return &team->qom_lists[queue_id - 1]; 792 } 793 794 /* 795 * note: already called with rcu_read_lock 796 */ 797 static bool team_queue_override_transmit(struct team *team, struct sk_buff *skb) 798 { 799 struct list_head *qom_list; 800 struct team_port *port; 801 802 if (!team->queue_override_enabled || !skb->queue_mapping) 803 return false; 804 qom_list = __team_get_qom_list(team, skb->queue_mapping); 805 list_for_each_entry_rcu(port, qom_list, qom_list) { 806 if (!team_dev_queue_xmit(team, port, skb)) 807 return true; 808 } 809 return false; 810 } 811 812 static void __team_queue_override_port_del(struct team *team, 813 struct team_port *port) 814 { 815 if (!port->queue_id) 816 return; 817 list_del_rcu(&port->qom_list); 818 } 819 820 static bool team_queue_override_port_has_gt_prio_than(struct team_port *port, 821 struct team_port *cur) 822 { 823 if (port->priority < cur->priority) 824 return true; 825 if (port->priority > cur->priority) 826 return false; 827 if (port->index < cur->index) 828 return true; 829 return false; 830 } 831 832 static void __team_queue_override_port_add(struct team *team, 833 struct team_port *port) 834 { 835 struct team_port *cur; 836 struct list_head *qom_list; 837 struct list_head *node; 838 839 if (!port->queue_id) 840 return; 841 qom_list = __team_get_qom_list(team, port->queue_id); 842 node = qom_list; 843 list_for_each_entry(cur, qom_list, qom_list) { 844 if (team_queue_override_port_has_gt_prio_than(port, cur)) 845 break; 846 node = &cur->qom_list; 847 } 848 list_add_tail_rcu(&port->qom_list, node); 849 } 850 851 static void __team_queue_override_enabled_check(struct team *team) 852 { 853 struct team_port *port; 854 bool enabled = false; 855 856 list_for_each_entry(port, &team->port_list, list) { 857 if (port->queue_id) { 858 enabled = true; 859 break; 860 } 861 } 862 if (enabled == team->queue_override_enabled) 863 return; 864 netdev_dbg(team->dev, "%s queue override\n", 865 enabled ? "Enabling" : "Disabling"); 866 team->queue_override_enabled = enabled; 867 } 868 869 static void team_queue_override_port_prio_changed(struct team *team, 870 struct team_port *port) 871 { 872 if (!port->queue_id || team_port_enabled(port)) 873 return; 874 __team_queue_override_port_del(team, port); 875 __team_queue_override_port_add(team, port); 876 __team_queue_override_enabled_check(team); 877 } 878 879 static void team_queue_override_port_change_queue_id(struct team *team, 880 struct team_port *port, 881 u16 new_queue_id) 882 { 883 if (team_port_enabled(port)) { 884 __team_queue_override_port_del(team, port); 885 port->queue_id = new_queue_id; 886 __team_queue_override_port_add(team, port); 887 __team_queue_override_enabled_check(team); 888 } else { 889 port->queue_id = new_queue_id; 890 } 891 } 892 893 static void team_queue_override_port_add(struct team *team, 894 struct team_port *port) 895 { 896 __team_queue_override_port_add(team, port); 897 __team_queue_override_enabled_check(team); 898 } 899 900 static void team_queue_override_port_del(struct team *team, 901 struct team_port *port) 902 { 903 __team_queue_override_port_del(team, port); 904 __team_queue_override_enabled_check(team); 905 } 906 907 908 /**************** 909 * Port handling 910 ****************/ 911 912 static bool team_port_find(const struct team *team, 913 const struct team_port *port) 914 { 915 struct team_port *cur; 916 917 list_for_each_entry(cur, &team->port_list, list) 918 if (cur == port) 919 return true; 920 return false; 921 } 922 923 /* 924 * Enable/disable port by adding to enabled port hashlist and setting 925 * port->index (Might be racy so reader could see incorrect ifindex when 926 * processing a flying packet, but that is not a problem). Write guarded 927 * by team->lock. 928 */ 929 static void team_port_enable(struct team *team, 930 struct team_port *port) 931 { 932 if (team_port_enabled(port)) 933 return; 934 port->index = team->en_port_count++; 935 hlist_add_head_rcu(&port->hlist, 936 team_port_index_hash(team, port->index)); 937 team_adjust_ops(team); 938 team_queue_override_port_add(team, port); 939 if (team->ops.port_enabled) 940 team->ops.port_enabled(team, port); 941 team_notify_peers(team); 942 team_mcast_rejoin(team); 943 } 944 945 static void __reconstruct_port_hlist(struct team *team, int rm_index) 946 { 947 int i; 948 struct team_port *port; 949 950 for (i = rm_index + 1; i < team->en_port_count; i++) { 951 port = team_get_port_by_index(team, i); 952 hlist_del_rcu(&port->hlist); 953 port->index--; 954 hlist_add_head_rcu(&port->hlist, 955 team_port_index_hash(team, port->index)); 956 } 957 } 958 959 static void team_port_disable(struct team *team, 960 struct team_port *port) 961 { 962 if (!team_port_enabled(port)) 963 return; 964 if (team->ops.port_disabled) 965 team->ops.port_disabled(team, port); 966 hlist_del_rcu(&port->hlist); 967 __reconstruct_port_hlist(team, port->index); 968 port->index = -1; 969 team->en_port_count--; 970 team_queue_override_port_del(team, port); 971 team_adjust_ops(team); 972 team_notify_peers(team); 973 team_mcast_rejoin(team); 974 } 975 976 #define TEAM_VLAN_FEATURES (NETIF_F_ALL_CSUM | NETIF_F_SG | \ 977 NETIF_F_FRAGLIST | NETIF_F_ALL_TSO | \ 978 NETIF_F_HIGHDMA | NETIF_F_LRO) 979 980 static void __team_compute_features(struct team *team) 981 { 982 struct team_port *port; 983 u32 vlan_features = TEAM_VLAN_FEATURES & NETIF_F_ALL_FOR_ALL; 984 unsigned short max_hard_header_len = ETH_HLEN; 985 unsigned int dst_release_flag = IFF_XMIT_DST_RELEASE | 986 IFF_XMIT_DST_RELEASE_PERM; 987 988 list_for_each_entry(port, &team->port_list, list) { 989 vlan_features = netdev_increment_features(vlan_features, 990 port->dev->vlan_features, 991 TEAM_VLAN_FEATURES); 992 993 dst_release_flag &= port->dev->priv_flags; 994 if (port->dev->hard_header_len > max_hard_header_len) 995 max_hard_header_len = port->dev->hard_header_len; 996 } 997 998 team->dev->vlan_features = vlan_features; 999 team->dev->hard_header_len = max_hard_header_len; 1000 1001 team->dev->priv_flags &= ~IFF_XMIT_DST_RELEASE; 1002 if (dst_release_flag == (IFF_XMIT_DST_RELEASE | IFF_XMIT_DST_RELEASE_PERM)) 1003 team->dev->priv_flags |= IFF_XMIT_DST_RELEASE; 1004 1005 netdev_change_features(team->dev); 1006 } 1007 1008 static void team_compute_features(struct team *team) 1009 { 1010 mutex_lock(&team->lock); 1011 __team_compute_features(team); 1012 mutex_unlock(&team->lock); 1013 } 1014 1015 static int team_port_enter(struct team *team, struct team_port *port) 1016 { 1017 int err = 0; 1018 1019 dev_hold(team->dev); 1020 if (team->ops.port_enter) { 1021 err = team->ops.port_enter(team, port); 1022 if (err) { 1023 netdev_err(team->dev, "Device %s failed to enter team mode\n", 1024 port->dev->name); 1025 goto err_port_enter; 1026 } 1027 } 1028 1029 return 0; 1030 1031 err_port_enter: 1032 dev_put(team->dev); 1033 1034 return err; 1035 } 1036 1037 static void team_port_leave(struct team *team, struct team_port *port) 1038 { 1039 if (team->ops.port_leave) 1040 team->ops.port_leave(team, port); 1041 dev_put(team->dev); 1042 } 1043 1044 #ifdef CONFIG_NET_POLL_CONTROLLER 1045 static int team_port_enable_netpoll(struct team *team, struct team_port *port) 1046 { 1047 struct netpoll *np; 1048 int err; 1049 1050 if (!team->dev->npinfo) 1051 return 0; 1052 1053 np = kzalloc(sizeof(*np), GFP_KERNEL); 1054 if (!np) 1055 return -ENOMEM; 1056 1057 err = __netpoll_setup(np, port->dev); 1058 if (err) { 1059 kfree(np); 1060 return err; 1061 } 1062 port->np = np; 1063 return err; 1064 } 1065 1066 static void team_port_disable_netpoll(struct team_port *port) 1067 { 1068 struct netpoll *np = port->np; 1069 1070 if (!np) 1071 return; 1072 port->np = NULL; 1073 1074 /* Wait for transmitting packets to finish before freeing. */ 1075 synchronize_rcu_bh(); 1076 __netpoll_cleanup(np); 1077 kfree(np); 1078 } 1079 #else 1080 static int team_port_enable_netpoll(struct team *team, struct team_port *port) 1081 { 1082 return 0; 1083 } 1084 static void team_port_disable_netpoll(struct team_port *port) 1085 { 1086 } 1087 #endif 1088 1089 static int team_upper_dev_link(struct net_device *dev, 1090 struct net_device *port_dev) 1091 { 1092 int err; 1093 1094 err = netdev_master_upper_dev_link(port_dev, dev); 1095 if (err) 1096 return err; 1097 port_dev->priv_flags |= IFF_TEAM_PORT; 1098 return 0; 1099 } 1100 1101 static void team_upper_dev_unlink(struct net_device *dev, 1102 struct net_device *port_dev) 1103 { 1104 netdev_upper_dev_unlink(port_dev, dev); 1105 port_dev->priv_flags &= ~IFF_TEAM_PORT; 1106 } 1107 1108 static void __team_port_change_port_added(struct team_port *port, bool linkup); 1109 static int team_dev_type_check_change(struct net_device *dev, 1110 struct net_device *port_dev); 1111 1112 static int team_port_add(struct team *team, struct net_device *port_dev) 1113 { 1114 struct net_device *dev = team->dev; 1115 struct team_port *port; 1116 char *portname = port_dev->name; 1117 int err; 1118 1119 if (port_dev->flags & IFF_LOOPBACK) { 1120 netdev_err(dev, "Device %s is loopback device. Loopback devices can't be added as a team port\n", 1121 portname); 1122 return -EINVAL; 1123 } 1124 1125 if (team_port_exists(port_dev)) { 1126 netdev_err(dev, "Device %s is already a port " 1127 "of a team device\n", portname); 1128 return -EBUSY; 1129 } 1130 1131 if (port_dev->features & NETIF_F_VLAN_CHALLENGED && 1132 vlan_uses_dev(dev)) { 1133 netdev_err(dev, "Device %s is VLAN challenged and team device has VLAN set up\n", 1134 portname); 1135 return -EPERM; 1136 } 1137 1138 err = team_dev_type_check_change(dev, port_dev); 1139 if (err) 1140 return err; 1141 1142 if (port_dev->flags & IFF_UP) { 1143 netdev_err(dev, "Device %s is up. Set it down before adding it as a team port\n", 1144 portname); 1145 return -EBUSY; 1146 } 1147 1148 port = kzalloc(sizeof(struct team_port) + team->mode->port_priv_size, 1149 GFP_KERNEL); 1150 if (!port) 1151 return -ENOMEM; 1152 1153 port->dev = port_dev; 1154 port->team = team; 1155 INIT_LIST_HEAD(&port->qom_list); 1156 1157 port->orig.mtu = port_dev->mtu; 1158 err = dev_set_mtu(port_dev, dev->mtu); 1159 if (err) { 1160 netdev_dbg(dev, "Error %d calling dev_set_mtu\n", err); 1161 goto err_set_mtu; 1162 } 1163 1164 memcpy(port->orig.dev_addr, port_dev->dev_addr, port_dev->addr_len); 1165 1166 err = team_port_enter(team, port); 1167 if (err) { 1168 netdev_err(dev, "Device %s failed to enter team mode\n", 1169 portname); 1170 goto err_port_enter; 1171 } 1172 1173 err = dev_open(port_dev); 1174 if (err) { 1175 netdev_dbg(dev, "Device %s opening failed\n", 1176 portname); 1177 goto err_dev_open; 1178 } 1179 1180 err = vlan_vids_add_by_dev(port_dev, dev); 1181 if (err) { 1182 netdev_err(dev, "Failed to add vlan ids to device %s\n", 1183 portname); 1184 goto err_vids_add; 1185 } 1186 1187 err = team_port_enable_netpoll(team, port); 1188 if (err) { 1189 netdev_err(dev, "Failed to enable netpoll on device %s\n", 1190 portname); 1191 goto err_enable_netpoll; 1192 } 1193 1194 if (!(dev->features & NETIF_F_LRO)) 1195 dev_disable_lro(port_dev); 1196 1197 err = netdev_rx_handler_register(port_dev, team_handle_frame, 1198 port); 1199 if (err) { 1200 netdev_err(dev, "Device %s failed to register rx_handler\n", 1201 portname); 1202 goto err_handler_register; 1203 } 1204 1205 err = team_upper_dev_link(dev, port_dev); 1206 if (err) { 1207 netdev_err(dev, "Device %s failed to set upper link\n", 1208 portname); 1209 goto err_set_upper_link; 1210 } 1211 1212 err = __team_option_inst_add_port(team, port); 1213 if (err) { 1214 netdev_err(dev, "Device %s failed to add per-port options\n", 1215 portname); 1216 goto err_option_port_add; 1217 } 1218 1219 port->index = -1; 1220 list_add_tail_rcu(&port->list, &team->port_list); 1221 team_port_enable(team, port); 1222 __team_compute_features(team); 1223 __team_port_change_port_added(port, !!netif_carrier_ok(port_dev)); 1224 __team_options_change_check(team); 1225 1226 netdev_info(dev, "Port device %s added\n", portname); 1227 1228 return 0; 1229 1230 err_option_port_add: 1231 team_upper_dev_unlink(dev, port_dev); 1232 1233 err_set_upper_link: 1234 netdev_rx_handler_unregister(port_dev); 1235 1236 err_handler_register: 1237 team_port_disable_netpoll(port); 1238 1239 err_enable_netpoll: 1240 vlan_vids_del_by_dev(port_dev, dev); 1241 1242 err_vids_add: 1243 dev_close(port_dev); 1244 1245 err_dev_open: 1246 team_port_leave(team, port); 1247 team_port_set_orig_dev_addr(port); 1248 1249 err_port_enter: 1250 dev_set_mtu(port_dev, port->orig.mtu); 1251 1252 err_set_mtu: 1253 kfree(port); 1254 1255 return err; 1256 } 1257 1258 static void __team_port_change_port_removed(struct team_port *port); 1259 1260 static int team_port_del(struct team *team, struct net_device *port_dev) 1261 { 1262 struct net_device *dev = team->dev; 1263 struct team_port *port; 1264 char *portname = port_dev->name; 1265 1266 port = team_port_get_rtnl(port_dev); 1267 if (!port || !team_port_find(team, port)) { 1268 netdev_err(dev, "Device %s does not act as a port of this team\n", 1269 portname); 1270 return -ENOENT; 1271 } 1272 1273 team_port_disable(team, port); 1274 list_del_rcu(&port->list); 1275 team_upper_dev_unlink(dev, port_dev); 1276 netdev_rx_handler_unregister(port_dev); 1277 team_port_disable_netpoll(port); 1278 vlan_vids_del_by_dev(port_dev, dev); 1279 dev_uc_unsync(port_dev, dev); 1280 dev_mc_unsync(port_dev, dev); 1281 dev_close(port_dev); 1282 team_port_leave(team, port); 1283 1284 __team_option_inst_mark_removed_port(team, port); 1285 __team_options_change_check(team); 1286 __team_option_inst_del_port(team, port); 1287 __team_port_change_port_removed(port); 1288 1289 team_port_set_orig_dev_addr(port); 1290 dev_set_mtu(port_dev, port->orig.mtu); 1291 kfree_rcu(port, rcu); 1292 netdev_info(dev, "Port device %s removed\n", portname); 1293 __team_compute_features(team); 1294 1295 return 0; 1296 } 1297 1298 1299 /***************** 1300 * Net device ops 1301 *****************/ 1302 1303 static int team_mode_option_get(struct team *team, struct team_gsetter_ctx *ctx) 1304 { 1305 ctx->data.str_val = team->mode->kind; 1306 return 0; 1307 } 1308 1309 static int team_mode_option_set(struct team *team, struct team_gsetter_ctx *ctx) 1310 { 1311 return team_change_mode(team, ctx->data.str_val); 1312 } 1313 1314 static int team_notify_peers_count_get(struct team *team, 1315 struct team_gsetter_ctx *ctx) 1316 { 1317 ctx->data.u32_val = team->notify_peers.count; 1318 return 0; 1319 } 1320 1321 static int team_notify_peers_count_set(struct team *team, 1322 struct team_gsetter_ctx *ctx) 1323 { 1324 team->notify_peers.count = ctx->data.u32_val; 1325 return 0; 1326 } 1327 1328 static int team_notify_peers_interval_get(struct team *team, 1329 struct team_gsetter_ctx *ctx) 1330 { 1331 ctx->data.u32_val = team->notify_peers.interval; 1332 return 0; 1333 } 1334 1335 static int team_notify_peers_interval_set(struct team *team, 1336 struct team_gsetter_ctx *ctx) 1337 { 1338 team->notify_peers.interval = ctx->data.u32_val; 1339 return 0; 1340 } 1341 1342 static int team_mcast_rejoin_count_get(struct team *team, 1343 struct team_gsetter_ctx *ctx) 1344 { 1345 ctx->data.u32_val = team->mcast_rejoin.count; 1346 return 0; 1347 } 1348 1349 static int team_mcast_rejoin_count_set(struct team *team, 1350 struct team_gsetter_ctx *ctx) 1351 { 1352 team->mcast_rejoin.count = ctx->data.u32_val; 1353 return 0; 1354 } 1355 1356 static int team_mcast_rejoin_interval_get(struct team *team, 1357 struct team_gsetter_ctx *ctx) 1358 { 1359 ctx->data.u32_val = team->mcast_rejoin.interval; 1360 return 0; 1361 } 1362 1363 static int team_mcast_rejoin_interval_set(struct team *team, 1364 struct team_gsetter_ctx *ctx) 1365 { 1366 team->mcast_rejoin.interval = ctx->data.u32_val; 1367 return 0; 1368 } 1369 1370 static int team_port_en_option_get(struct team *team, 1371 struct team_gsetter_ctx *ctx) 1372 { 1373 struct team_port *port = ctx->info->port; 1374 1375 ctx->data.bool_val = team_port_enabled(port); 1376 return 0; 1377 } 1378 1379 static int team_port_en_option_set(struct team *team, 1380 struct team_gsetter_ctx *ctx) 1381 { 1382 struct team_port *port = ctx->info->port; 1383 1384 if (ctx->data.bool_val) 1385 team_port_enable(team, port); 1386 else 1387 team_port_disable(team, port); 1388 return 0; 1389 } 1390 1391 static int team_user_linkup_option_get(struct team *team, 1392 struct team_gsetter_ctx *ctx) 1393 { 1394 struct team_port *port = ctx->info->port; 1395 1396 ctx->data.bool_val = port->user.linkup; 1397 return 0; 1398 } 1399 1400 static void __team_carrier_check(struct team *team); 1401 1402 static int team_user_linkup_option_set(struct team *team, 1403 struct team_gsetter_ctx *ctx) 1404 { 1405 struct team_port *port = ctx->info->port; 1406 1407 port->user.linkup = ctx->data.bool_val; 1408 team_refresh_port_linkup(port); 1409 __team_carrier_check(port->team); 1410 return 0; 1411 } 1412 1413 static int team_user_linkup_en_option_get(struct team *team, 1414 struct team_gsetter_ctx *ctx) 1415 { 1416 struct team_port *port = ctx->info->port; 1417 1418 ctx->data.bool_val = port->user.linkup_enabled; 1419 return 0; 1420 } 1421 1422 static int team_user_linkup_en_option_set(struct team *team, 1423 struct team_gsetter_ctx *ctx) 1424 { 1425 struct team_port *port = ctx->info->port; 1426 1427 port->user.linkup_enabled = ctx->data.bool_val; 1428 team_refresh_port_linkup(port); 1429 __team_carrier_check(port->team); 1430 return 0; 1431 } 1432 1433 static int team_priority_option_get(struct team *team, 1434 struct team_gsetter_ctx *ctx) 1435 { 1436 struct team_port *port = ctx->info->port; 1437 1438 ctx->data.s32_val = port->priority; 1439 return 0; 1440 } 1441 1442 static int team_priority_option_set(struct team *team, 1443 struct team_gsetter_ctx *ctx) 1444 { 1445 struct team_port *port = ctx->info->port; 1446 s32 priority = ctx->data.s32_val; 1447 1448 if (port->priority == priority) 1449 return 0; 1450 port->priority = priority; 1451 team_queue_override_port_prio_changed(team, port); 1452 return 0; 1453 } 1454 1455 static int team_queue_id_option_get(struct team *team, 1456 struct team_gsetter_ctx *ctx) 1457 { 1458 struct team_port *port = ctx->info->port; 1459 1460 ctx->data.u32_val = port->queue_id; 1461 return 0; 1462 } 1463 1464 static int team_queue_id_option_set(struct team *team, 1465 struct team_gsetter_ctx *ctx) 1466 { 1467 struct team_port *port = ctx->info->port; 1468 u16 new_queue_id = ctx->data.u32_val; 1469 1470 if (port->queue_id == new_queue_id) 1471 return 0; 1472 if (new_queue_id >= team->dev->real_num_tx_queues) 1473 return -EINVAL; 1474 team_queue_override_port_change_queue_id(team, port, new_queue_id); 1475 return 0; 1476 } 1477 1478 static const struct team_option team_options[] = { 1479 { 1480 .name = "mode", 1481 .type = TEAM_OPTION_TYPE_STRING, 1482 .getter = team_mode_option_get, 1483 .setter = team_mode_option_set, 1484 }, 1485 { 1486 .name = "notify_peers_count", 1487 .type = TEAM_OPTION_TYPE_U32, 1488 .getter = team_notify_peers_count_get, 1489 .setter = team_notify_peers_count_set, 1490 }, 1491 { 1492 .name = "notify_peers_interval", 1493 .type = TEAM_OPTION_TYPE_U32, 1494 .getter = team_notify_peers_interval_get, 1495 .setter = team_notify_peers_interval_set, 1496 }, 1497 { 1498 .name = "mcast_rejoin_count", 1499 .type = TEAM_OPTION_TYPE_U32, 1500 .getter = team_mcast_rejoin_count_get, 1501 .setter = team_mcast_rejoin_count_set, 1502 }, 1503 { 1504 .name = "mcast_rejoin_interval", 1505 .type = TEAM_OPTION_TYPE_U32, 1506 .getter = team_mcast_rejoin_interval_get, 1507 .setter = team_mcast_rejoin_interval_set, 1508 }, 1509 { 1510 .name = "enabled", 1511 .type = TEAM_OPTION_TYPE_BOOL, 1512 .per_port = true, 1513 .getter = team_port_en_option_get, 1514 .setter = team_port_en_option_set, 1515 }, 1516 { 1517 .name = "user_linkup", 1518 .type = TEAM_OPTION_TYPE_BOOL, 1519 .per_port = true, 1520 .getter = team_user_linkup_option_get, 1521 .setter = team_user_linkup_option_set, 1522 }, 1523 { 1524 .name = "user_linkup_enabled", 1525 .type = TEAM_OPTION_TYPE_BOOL, 1526 .per_port = true, 1527 .getter = team_user_linkup_en_option_get, 1528 .setter = team_user_linkup_en_option_set, 1529 }, 1530 { 1531 .name = "priority", 1532 .type = TEAM_OPTION_TYPE_S32, 1533 .per_port = true, 1534 .getter = team_priority_option_get, 1535 .setter = team_priority_option_set, 1536 }, 1537 { 1538 .name = "queue_id", 1539 .type = TEAM_OPTION_TYPE_U32, 1540 .per_port = true, 1541 .getter = team_queue_id_option_get, 1542 .setter = team_queue_id_option_set, 1543 }, 1544 }; 1545 1546 static struct lock_class_key team_netdev_xmit_lock_key; 1547 static struct lock_class_key team_netdev_addr_lock_key; 1548 static struct lock_class_key team_tx_busylock_key; 1549 1550 static void team_set_lockdep_class_one(struct net_device *dev, 1551 struct netdev_queue *txq, 1552 void *unused) 1553 { 1554 lockdep_set_class(&txq->_xmit_lock, &team_netdev_xmit_lock_key); 1555 } 1556 1557 static void team_set_lockdep_class(struct net_device *dev) 1558 { 1559 lockdep_set_class(&dev->addr_list_lock, &team_netdev_addr_lock_key); 1560 netdev_for_each_tx_queue(dev, team_set_lockdep_class_one, NULL); 1561 dev->qdisc_tx_busylock = &team_tx_busylock_key; 1562 } 1563 1564 static int team_init(struct net_device *dev) 1565 { 1566 struct team *team = netdev_priv(dev); 1567 int i; 1568 int err; 1569 1570 team->dev = dev; 1571 mutex_init(&team->lock); 1572 team_set_no_mode(team); 1573 1574 team->pcpu_stats = netdev_alloc_pcpu_stats(struct team_pcpu_stats); 1575 if (!team->pcpu_stats) 1576 return -ENOMEM; 1577 1578 for (i = 0; i < TEAM_PORT_HASHENTRIES; i++) 1579 INIT_HLIST_HEAD(&team->en_port_hlist[i]); 1580 INIT_LIST_HEAD(&team->port_list); 1581 err = team_queue_override_init(team); 1582 if (err) 1583 goto err_team_queue_override_init; 1584 1585 team_adjust_ops(team); 1586 1587 INIT_LIST_HEAD(&team->option_list); 1588 INIT_LIST_HEAD(&team->option_inst_list); 1589 1590 team_notify_peers_init(team); 1591 team_mcast_rejoin_init(team); 1592 1593 err = team_options_register(team, team_options, ARRAY_SIZE(team_options)); 1594 if (err) 1595 goto err_options_register; 1596 netif_carrier_off(dev); 1597 1598 team_set_lockdep_class(dev); 1599 1600 return 0; 1601 1602 err_options_register: 1603 team_mcast_rejoin_fini(team); 1604 team_notify_peers_fini(team); 1605 team_queue_override_fini(team); 1606 err_team_queue_override_init: 1607 free_percpu(team->pcpu_stats); 1608 1609 return err; 1610 } 1611 1612 static void team_uninit(struct net_device *dev) 1613 { 1614 struct team *team = netdev_priv(dev); 1615 struct team_port *port; 1616 struct team_port *tmp; 1617 1618 mutex_lock(&team->lock); 1619 list_for_each_entry_safe(port, tmp, &team->port_list, list) 1620 team_port_del(team, port->dev); 1621 1622 __team_change_mode(team, NULL); /* cleanup */ 1623 __team_options_unregister(team, team_options, ARRAY_SIZE(team_options)); 1624 team_mcast_rejoin_fini(team); 1625 team_notify_peers_fini(team); 1626 team_queue_override_fini(team); 1627 mutex_unlock(&team->lock); 1628 } 1629 1630 static void team_destructor(struct net_device *dev) 1631 { 1632 struct team *team = netdev_priv(dev); 1633 1634 free_percpu(team->pcpu_stats); 1635 free_netdev(dev); 1636 } 1637 1638 static int team_open(struct net_device *dev) 1639 { 1640 return 0; 1641 } 1642 1643 static int team_close(struct net_device *dev) 1644 { 1645 return 0; 1646 } 1647 1648 /* 1649 * note: already called with rcu_read_lock 1650 */ 1651 static netdev_tx_t team_xmit(struct sk_buff *skb, struct net_device *dev) 1652 { 1653 struct team *team = netdev_priv(dev); 1654 bool tx_success; 1655 unsigned int len = skb->len; 1656 1657 tx_success = team_queue_override_transmit(team, skb); 1658 if (!tx_success) 1659 tx_success = team->ops.transmit(team, skb); 1660 if (tx_success) { 1661 struct team_pcpu_stats *pcpu_stats; 1662 1663 pcpu_stats = this_cpu_ptr(team->pcpu_stats); 1664 u64_stats_update_begin(&pcpu_stats->syncp); 1665 pcpu_stats->tx_packets++; 1666 pcpu_stats->tx_bytes += len; 1667 u64_stats_update_end(&pcpu_stats->syncp); 1668 } else { 1669 this_cpu_inc(team->pcpu_stats->tx_dropped); 1670 } 1671 1672 return NETDEV_TX_OK; 1673 } 1674 1675 static u16 team_select_queue(struct net_device *dev, struct sk_buff *skb, 1676 void *accel_priv, select_queue_fallback_t fallback) 1677 { 1678 /* 1679 * This helper function exists to help dev_pick_tx get the correct 1680 * destination queue. Using a helper function skips a call to 1681 * skb_tx_hash and will put the skbs in the queue we expect on their 1682 * way down to the team driver. 1683 */ 1684 u16 txq = skb_rx_queue_recorded(skb) ? skb_get_rx_queue(skb) : 0; 1685 1686 /* 1687 * Save the original txq to restore before passing to the driver 1688 */ 1689 qdisc_skb_cb(skb)->slave_dev_queue_mapping = skb->queue_mapping; 1690 1691 if (unlikely(txq >= dev->real_num_tx_queues)) { 1692 do { 1693 txq -= dev->real_num_tx_queues; 1694 } while (txq >= dev->real_num_tx_queues); 1695 } 1696 return txq; 1697 } 1698 1699 static void team_change_rx_flags(struct net_device *dev, int change) 1700 { 1701 struct team *team = netdev_priv(dev); 1702 struct team_port *port; 1703 int inc; 1704 1705 rcu_read_lock(); 1706 list_for_each_entry_rcu(port, &team->port_list, list) { 1707 if (change & IFF_PROMISC) { 1708 inc = dev->flags & IFF_PROMISC ? 1 : -1; 1709 dev_set_promiscuity(port->dev, inc); 1710 } 1711 if (change & IFF_ALLMULTI) { 1712 inc = dev->flags & IFF_ALLMULTI ? 1 : -1; 1713 dev_set_allmulti(port->dev, inc); 1714 } 1715 } 1716 rcu_read_unlock(); 1717 } 1718 1719 static void team_set_rx_mode(struct net_device *dev) 1720 { 1721 struct team *team = netdev_priv(dev); 1722 struct team_port *port; 1723 1724 rcu_read_lock(); 1725 list_for_each_entry_rcu(port, &team->port_list, list) { 1726 dev_uc_sync_multiple(port->dev, dev); 1727 dev_mc_sync_multiple(port->dev, dev); 1728 } 1729 rcu_read_unlock(); 1730 } 1731 1732 static int team_set_mac_address(struct net_device *dev, void *p) 1733 { 1734 struct sockaddr *addr = p; 1735 struct team *team = netdev_priv(dev); 1736 struct team_port *port; 1737 1738 if (dev->type == ARPHRD_ETHER && !is_valid_ether_addr(addr->sa_data)) 1739 return -EADDRNOTAVAIL; 1740 memcpy(dev->dev_addr, addr->sa_data, dev->addr_len); 1741 rcu_read_lock(); 1742 list_for_each_entry_rcu(port, &team->port_list, list) 1743 if (team->ops.port_change_dev_addr) 1744 team->ops.port_change_dev_addr(team, port); 1745 rcu_read_unlock(); 1746 return 0; 1747 } 1748 1749 static int team_change_mtu(struct net_device *dev, int new_mtu) 1750 { 1751 struct team *team = netdev_priv(dev); 1752 struct team_port *port; 1753 int err; 1754 1755 /* 1756 * Alhough this is reader, it's guarded by team lock. It's not possible 1757 * to traverse list in reverse under rcu_read_lock 1758 */ 1759 mutex_lock(&team->lock); 1760 team->port_mtu_change_allowed = true; 1761 list_for_each_entry(port, &team->port_list, list) { 1762 err = dev_set_mtu(port->dev, new_mtu); 1763 if (err) { 1764 netdev_err(dev, "Device %s failed to change mtu", 1765 port->dev->name); 1766 goto unwind; 1767 } 1768 } 1769 team->port_mtu_change_allowed = false; 1770 mutex_unlock(&team->lock); 1771 1772 dev->mtu = new_mtu; 1773 1774 return 0; 1775 1776 unwind: 1777 list_for_each_entry_continue_reverse(port, &team->port_list, list) 1778 dev_set_mtu(port->dev, dev->mtu); 1779 team->port_mtu_change_allowed = false; 1780 mutex_unlock(&team->lock); 1781 1782 return err; 1783 } 1784 1785 static struct rtnl_link_stats64 * 1786 team_get_stats64(struct net_device *dev, struct rtnl_link_stats64 *stats) 1787 { 1788 struct team *team = netdev_priv(dev); 1789 struct team_pcpu_stats *p; 1790 u64 rx_packets, rx_bytes, rx_multicast, tx_packets, tx_bytes; 1791 u32 rx_dropped = 0, tx_dropped = 0; 1792 unsigned int start; 1793 int i; 1794 1795 for_each_possible_cpu(i) { 1796 p = per_cpu_ptr(team->pcpu_stats, i); 1797 do { 1798 start = u64_stats_fetch_begin_irq(&p->syncp); 1799 rx_packets = p->rx_packets; 1800 rx_bytes = p->rx_bytes; 1801 rx_multicast = p->rx_multicast; 1802 tx_packets = p->tx_packets; 1803 tx_bytes = p->tx_bytes; 1804 } while (u64_stats_fetch_retry_irq(&p->syncp, start)); 1805 1806 stats->rx_packets += rx_packets; 1807 stats->rx_bytes += rx_bytes; 1808 stats->multicast += rx_multicast; 1809 stats->tx_packets += tx_packets; 1810 stats->tx_bytes += tx_bytes; 1811 /* 1812 * rx_dropped & tx_dropped are u32, updated 1813 * without syncp protection. 1814 */ 1815 rx_dropped += p->rx_dropped; 1816 tx_dropped += p->tx_dropped; 1817 } 1818 stats->rx_dropped = rx_dropped; 1819 stats->tx_dropped = tx_dropped; 1820 return stats; 1821 } 1822 1823 static int team_vlan_rx_add_vid(struct net_device *dev, __be16 proto, u16 vid) 1824 { 1825 struct team *team = netdev_priv(dev); 1826 struct team_port *port; 1827 int err; 1828 1829 /* 1830 * Alhough this is reader, it's guarded by team lock. It's not possible 1831 * to traverse list in reverse under rcu_read_lock 1832 */ 1833 mutex_lock(&team->lock); 1834 list_for_each_entry(port, &team->port_list, list) { 1835 err = vlan_vid_add(port->dev, proto, vid); 1836 if (err) 1837 goto unwind; 1838 } 1839 mutex_unlock(&team->lock); 1840 1841 return 0; 1842 1843 unwind: 1844 list_for_each_entry_continue_reverse(port, &team->port_list, list) 1845 vlan_vid_del(port->dev, proto, vid); 1846 mutex_unlock(&team->lock); 1847 1848 return err; 1849 } 1850 1851 static int team_vlan_rx_kill_vid(struct net_device *dev, __be16 proto, u16 vid) 1852 { 1853 struct team *team = netdev_priv(dev); 1854 struct team_port *port; 1855 1856 rcu_read_lock(); 1857 list_for_each_entry_rcu(port, &team->port_list, list) 1858 vlan_vid_del(port->dev, proto, vid); 1859 rcu_read_unlock(); 1860 1861 return 0; 1862 } 1863 1864 #ifdef CONFIG_NET_POLL_CONTROLLER 1865 static void team_poll_controller(struct net_device *dev) 1866 { 1867 } 1868 1869 static void __team_netpoll_cleanup(struct team *team) 1870 { 1871 struct team_port *port; 1872 1873 list_for_each_entry(port, &team->port_list, list) 1874 team_port_disable_netpoll(port); 1875 } 1876 1877 static void team_netpoll_cleanup(struct net_device *dev) 1878 { 1879 struct team *team = netdev_priv(dev); 1880 1881 mutex_lock(&team->lock); 1882 __team_netpoll_cleanup(team); 1883 mutex_unlock(&team->lock); 1884 } 1885 1886 static int team_netpoll_setup(struct net_device *dev, 1887 struct netpoll_info *npifo) 1888 { 1889 struct team *team = netdev_priv(dev); 1890 struct team_port *port; 1891 int err = 0; 1892 1893 mutex_lock(&team->lock); 1894 list_for_each_entry(port, &team->port_list, list) { 1895 err = team_port_enable_netpoll(team, port); 1896 if (err) { 1897 __team_netpoll_cleanup(team); 1898 break; 1899 } 1900 } 1901 mutex_unlock(&team->lock); 1902 return err; 1903 } 1904 #endif 1905 1906 static int team_add_slave(struct net_device *dev, struct net_device *port_dev) 1907 { 1908 struct team *team = netdev_priv(dev); 1909 int err; 1910 1911 mutex_lock(&team->lock); 1912 err = team_port_add(team, port_dev); 1913 mutex_unlock(&team->lock); 1914 return err; 1915 } 1916 1917 static int team_del_slave(struct net_device *dev, struct net_device *port_dev) 1918 { 1919 struct team *team = netdev_priv(dev); 1920 int err; 1921 1922 mutex_lock(&team->lock); 1923 err = team_port_del(team, port_dev); 1924 mutex_unlock(&team->lock); 1925 return err; 1926 } 1927 1928 static netdev_features_t team_fix_features(struct net_device *dev, 1929 netdev_features_t features) 1930 { 1931 struct team_port *port; 1932 struct team *team = netdev_priv(dev); 1933 netdev_features_t mask; 1934 1935 mask = features; 1936 features &= ~NETIF_F_ONE_FOR_ALL; 1937 features |= NETIF_F_ALL_FOR_ALL; 1938 1939 rcu_read_lock(); 1940 list_for_each_entry_rcu(port, &team->port_list, list) { 1941 features = netdev_increment_features(features, 1942 port->dev->features, 1943 mask); 1944 } 1945 rcu_read_unlock(); 1946 return features; 1947 } 1948 1949 static int team_change_carrier(struct net_device *dev, bool new_carrier) 1950 { 1951 struct team *team = netdev_priv(dev); 1952 1953 team->user_carrier_enabled = true; 1954 1955 if (new_carrier) 1956 netif_carrier_on(dev); 1957 else 1958 netif_carrier_off(dev); 1959 return 0; 1960 } 1961 1962 static const struct net_device_ops team_netdev_ops = { 1963 .ndo_init = team_init, 1964 .ndo_uninit = team_uninit, 1965 .ndo_open = team_open, 1966 .ndo_stop = team_close, 1967 .ndo_start_xmit = team_xmit, 1968 .ndo_select_queue = team_select_queue, 1969 .ndo_change_rx_flags = team_change_rx_flags, 1970 .ndo_set_rx_mode = team_set_rx_mode, 1971 .ndo_set_mac_address = team_set_mac_address, 1972 .ndo_change_mtu = team_change_mtu, 1973 .ndo_get_stats64 = team_get_stats64, 1974 .ndo_vlan_rx_add_vid = team_vlan_rx_add_vid, 1975 .ndo_vlan_rx_kill_vid = team_vlan_rx_kill_vid, 1976 #ifdef CONFIG_NET_POLL_CONTROLLER 1977 .ndo_poll_controller = team_poll_controller, 1978 .ndo_netpoll_setup = team_netpoll_setup, 1979 .ndo_netpoll_cleanup = team_netpoll_cleanup, 1980 #endif 1981 .ndo_add_slave = team_add_slave, 1982 .ndo_del_slave = team_del_slave, 1983 .ndo_fix_features = team_fix_features, 1984 .ndo_change_carrier = team_change_carrier, 1985 }; 1986 1987 /*********************** 1988 * ethtool interface 1989 ***********************/ 1990 1991 static void team_ethtool_get_drvinfo(struct net_device *dev, 1992 struct ethtool_drvinfo *drvinfo) 1993 { 1994 strlcpy(drvinfo->driver, DRV_NAME, sizeof(drvinfo->driver)); 1995 strlcpy(drvinfo->version, UTS_RELEASE, sizeof(drvinfo->version)); 1996 } 1997 1998 static const struct ethtool_ops team_ethtool_ops = { 1999 .get_drvinfo = team_ethtool_get_drvinfo, 2000 .get_link = ethtool_op_get_link, 2001 }; 2002 2003 /*********************** 2004 * rt netlink interface 2005 ***********************/ 2006 2007 static void team_setup_by_port(struct net_device *dev, 2008 struct net_device *port_dev) 2009 { 2010 dev->header_ops = port_dev->header_ops; 2011 dev->type = port_dev->type; 2012 dev->hard_header_len = port_dev->hard_header_len; 2013 dev->addr_len = port_dev->addr_len; 2014 dev->mtu = port_dev->mtu; 2015 memcpy(dev->broadcast, port_dev->broadcast, port_dev->addr_len); 2016 eth_hw_addr_inherit(dev, port_dev); 2017 } 2018 2019 static int team_dev_type_check_change(struct net_device *dev, 2020 struct net_device *port_dev) 2021 { 2022 struct team *team = netdev_priv(dev); 2023 char *portname = port_dev->name; 2024 int err; 2025 2026 if (dev->type == port_dev->type) 2027 return 0; 2028 if (!list_empty(&team->port_list)) { 2029 netdev_err(dev, "Device %s is of different type\n", portname); 2030 return -EBUSY; 2031 } 2032 err = call_netdevice_notifiers(NETDEV_PRE_TYPE_CHANGE, dev); 2033 err = notifier_to_errno(err); 2034 if (err) { 2035 netdev_err(dev, "Refused to change device type\n"); 2036 return err; 2037 } 2038 dev_uc_flush(dev); 2039 dev_mc_flush(dev); 2040 team_setup_by_port(dev, port_dev); 2041 call_netdevice_notifiers(NETDEV_POST_TYPE_CHANGE, dev); 2042 return 0; 2043 } 2044 2045 static void team_setup(struct net_device *dev) 2046 { 2047 ether_setup(dev); 2048 2049 dev->netdev_ops = &team_netdev_ops; 2050 dev->ethtool_ops = &team_ethtool_ops; 2051 dev->destructor = team_destructor; 2052 dev->tx_queue_len = 0; 2053 dev->flags |= IFF_MULTICAST; 2054 dev->priv_flags &= ~(IFF_XMIT_DST_RELEASE | IFF_TX_SKB_SHARING); 2055 2056 /* 2057 * Indicate we support unicast address filtering. That way core won't 2058 * bring us to promisc mode in case a unicast addr is added. 2059 * Let this up to underlay drivers. 2060 */ 2061 dev->priv_flags |= IFF_UNICAST_FLT | IFF_LIVE_ADDR_CHANGE; 2062 2063 dev->features |= NETIF_F_LLTX; 2064 dev->features |= NETIF_F_GRO; 2065 2066 /* Don't allow team devices to change network namespaces. */ 2067 dev->features |= NETIF_F_NETNS_LOCAL; 2068 2069 dev->hw_features = TEAM_VLAN_FEATURES | 2070 NETIF_F_HW_VLAN_CTAG_TX | 2071 NETIF_F_HW_VLAN_CTAG_RX | 2072 NETIF_F_HW_VLAN_CTAG_FILTER; 2073 2074 dev->hw_features &= ~(NETIF_F_ALL_CSUM & ~NETIF_F_HW_CSUM); 2075 dev->features |= dev->hw_features; 2076 } 2077 2078 static int team_newlink(struct net *src_net, struct net_device *dev, 2079 struct nlattr *tb[], struct nlattr *data[]) 2080 { 2081 if (tb[IFLA_ADDRESS] == NULL) 2082 eth_hw_addr_random(dev); 2083 2084 return register_netdevice(dev); 2085 } 2086 2087 static int team_validate(struct nlattr *tb[], struct nlattr *data[]) 2088 { 2089 if (tb[IFLA_ADDRESS]) { 2090 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN) 2091 return -EINVAL; 2092 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS]))) 2093 return -EADDRNOTAVAIL; 2094 } 2095 return 0; 2096 } 2097 2098 static unsigned int team_get_num_tx_queues(void) 2099 { 2100 return TEAM_DEFAULT_NUM_TX_QUEUES; 2101 } 2102 2103 static unsigned int team_get_num_rx_queues(void) 2104 { 2105 return TEAM_DEFAULT_NUM_RX_QUEUES; 2106 } 2107 2108 static struct rtnl_link_ops team_link_ops __read_mostly = { 2109 .kind = DRV_NAME, 2110 .priv_size = sizeof(struct team), 2111 .setup = team_setup, 2112 .newlink = team_newlink, 2113 .validate = team_validate, 2114 .get_num_tx_queues = team_get_num_tx_queues, 2115 .get_num_rx_queues = team_get_num_rx_queues, 2116 }; 2117 2118 2119 /*********************************** 2120 * Generic netlink custom interface 2121 ***********************************/ 2122 2123 static struct genl_family team_nl_family = { 2124 .id = GENL_ID_GENERATE, 2125 .name = TEAM_GENL_NAME, 2126 .version = TEAM_GENL_VERSION, 2127 .maxattr = TEAM_ATTR_MAX, 2128 .netnsok = true, 2129 }; 2130 2131 static const struct nla_policy team_nl_policy[TEAM_ATTR_MAX + 1] = { 2132 [TEAM_ATTR_UNSPEC] = { .type = NLA_UNSPEC, }, 2133 [TEAM_ATTR_TEAM_IFINDEX] = { .type = NLA_U32 }, 2134 [TEAM_ATTR_LIST_OPTION] = { .type = NLA_NESTED }, 2135 [TEAM_ATTR_LIST_PORT] = { .type = NLA_NESTED }, 2136 }; 2137 2138 static const struct nla_policy 2139 team_nl_option_policy[TEAM_ATTR_OPTION_MAX + 1] = { 2140 [TEAM_ATTR_OPTION_UNSPEC] = { .type = NLA_UNSPEC, }, 2141 [TEAM_ATTR_OPTION_NAME] = { 2142 .type = NLA_STRING, 2143 .len = TEAM_STRING_MAX_LEN, 2144 }, 2145 [TEAM_ATTR_OPTION_CHANGED] = { .type = NLA_FLAG }, 2146 [TEAM_ATTR_OPTION_TYPE] = { .type = NLA_U8 }, 2147 [TEAM_ATTR_OPTION_DATA] = { .type = NLA_BINARY }, 2148 }; 2149 2150 static int team_nl_cmd_noop(struct sk_buff *skb, struct genl_info *info) 2151 { 2152 struct sk_buff *msg; 2153 void *hdr; 2154 int err; 2155 2156 msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL); 2157 if (!msg) 2158 return -ENOMEM; 2159 2160 hdr = genlmsg_put(msg, info->snd_portid, info->snd_seq, 2161 &team_nl_family, 0, TEAM_CMD_NOOP); 2162 if (!hdr) { 2163 err = -EMSGSIZE; 2164 goto err_msg_put; 2165 } 2166 2167 genlmsg_end(msg, hdr); 2168 2169 return genlmsg_unicast(genl_info_net(info), msg, info->snd_portid); 2170 2171 err_msg_put: 2172 nlmsg_free(msg); 2173 2174 return err; 2175 } 2176 2177 /* 2178 * Netlink cmd functions should be locked by following two functions. 2179 * Since dev gets held here, that ensures dev won't disappear in between. 2180 */ 2181 static struct team *team_nl_team_get(struct genl_info *info) 2182 { 2183 struct net *net = genl_info_net(info); 2184 int ifindex; 2185 struct net_device *dev; 2186 struct team *team; 2187 2188 if (!info->attrs[TEAM_ATTR_TEAM_IFINDEX]) 2189 return NULL; 2190 2191 ifindex = nla_get_u32(info->attrs[TEAM_ATTR_TEAM_IFINDEX]); 2192 dev = dev_get_by_index(net, ifindex); 2193 if (!dev || dev->netdev_ops != &team_netdev_ops) { 2194 if (dev) 2195 dev_put(dev); 2196 return NULL; 2197 } 2198 2199 team = netdev_priv(dev); 2200 mutex_lock(&team->lock); 2201 return team; 2202 } 2203 2204 static void team_nl_team_put(struct team *team) 2205 { 2206 mutex_unlock(&team->lock); 2207 dev_put(team->dev); 2208 } 2209 2210 typedef int team_nl_send_func_t(struct sk_buff *skb, 2211 struct team *team, u32 portid); 2212 2213 static int team_nl_send_unicast(struct sk_buff *skb, struct team *team, u32 portid) 2214 { 2215 return genlmsg_unicast(dev_net(team->dev), skb, portid); 2216 } 2217 2218 static int team_nl_fill_one_option_get(struct sk_buff *skb, struct team *team, 2219 struct team_option_inst *opt_inst) 2220 { 2221 struct nlattr *option_item; 2222 struct team_option *option = opt_inst->option; 2223 struct team_option_inst_info *opt_inst_info = &opt_inst->info; 2224 struct team_gsetter_ctx ctx; 2225 int err; 2226 2227 ctx.info = opt_inst_info; 2228 err = team_option_get(team, opt_inst, &ctx); 2229 if (err) 2230 return err; 2231 2232 option_item = nla_nest_start(skb, TEAM_ATTR_ITEM_OPTION); 2233 if (!option_item) 2234 return -EMSGSIZE; 2235 2236 if (nla_put_string(skb, TEAM_ATTR_OPTION_NAME, option->name)) 2237 goto nest_cancel; 2238 if (opt_inst_info->port && 2239 nla_put_u32(skb, TEAM_ATTR_OPTION_PORT_IFINDEX, 2240 opt_inst_info->port->dev->ifindex)) 2241 goto nest_cancel; 2242 if (opt_inst->option->array_size && 2243 nla_put_u32(skb, TEAM_ATTR_OPTION_ARRAY_INDEX, 2244 opt_inst_info->array_index)) 2245 goto nest_cancel; 2246 2247 switch (option->type) { 2248 case TEAM_OPTION_TYPE_U32: 2249 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_U32)) 2250 goto nest_cancel; 2251 if (nla_put_u32(skb, TEAM_ATTR_OPTION_DATA, ctx.data.u32_val)) 2252 goto nest_cancel; 2253 break; 2254 case TEAM_OPTION_TYPE_STRING: 2255 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_STRING)) 2256 goto nest_cancel; 2257 if (nla_put_string(skb, TEAM_ATTR_OPTION_DATA, 2258 ctx.data.str_val)) 2259 goto nest_cancel; 2260 break; 2261 case TEAM_OPTION_TYPE_BINARY: 2262 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_BINARY)) 2263 goto nest_cancel; 2264 if (nla_put(skb, TEAM_ATTR_OPTION_DATA, ctx.data.bin_val.len, 2265 ctx.data.bin_val.ptr)) 2266 goto nest_cancel; 2267 break; 2268 case TEAM_OPTION_TYPE_BOOL: 2269 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_FLAG)) 2270 goto nest_cancel; 2271 if (ctx.data.bool_val && 2272 nla_put_flag(skb, TEAM_ATTR_OPTION_DATA)) 2273 goto nest_cancel; 2274 break; 2275 case TEAM_OPTION_TYPE_S32: 2276 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_S32)) 2277 goto nest_cancel; 2278 if (nla_put_s32(skb, TEAM_ATTR_OPTION_DATA, ctx.data.s32_val)) 2279 goto nest_cancel; 2280 break; 2281 default: 2282 BUG(); 2283 } 2284 if (opt_inst->removed && nla_put_flag(skb, TEAM_ATTR_OPTION_REMOVED)) 2285 goto nest_cancel; 2286 if (opt_inst->changed) { 2287 if (nla_put_flag(skb, TEAM_ATTR_OPTION_CHANGED)) 2288 goto nest_cancel; 2289 opt_inst->changed = false; 2290 } 2291 nla_nest_end(skb, option_item); 2292 return 0; 2293 2294 nest_cancel: 2295 nla_nest_cancel(skb, option_item); 2296 return -EMSGSIZE; 2297 } 2298 2299 static int __send_and_alloc_skb(struct sk_buff **pskb, 2300 struct team *team, u32 portid, 2301 team_nl_send_func_t *send_func) 2302 { 2303 int err; 2304 2305 if (*pskb) { 2306 err = send_func(*pskb, team, portid); 2307 if (err) 2308 return err; 2309 } 2310 *pskb = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL); 2311 if (!*pskb) 2312 return -ENOMEM; 2313 return 0; 2314 } 2315 2316 static int team_nl_send_options_get(struct team *team, u32 portid, u32 seq, 2317 int flags, team_nl_send_func_t *send_func, 2318 struct list_head *sel_opt_inst_list) 2319 { 2320 struct nlattr *option_list; 2321 struct nlmsghdr *nlh; 2322 void *hdr; 2323 struct team_option_inst *opt_inst; 2324 int err; 2325 struct sk_buff *skb = NULL; 2326 bool incomplete; 2327 int i; 2328 2329 opt_inst = list_first_entry(sel_opt_inst_list, 2330 struct team_option_inst, tmp_list); 2331 2332 start_again: 2333 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2334 if (err) 2335 return err; 2336 2337 hdr = genlmsg_put(skb, portid, seq, &team_nl_family, flags | NLM_F_MULTI, 2338 TEAM_CMD_OPTIONS_GET); 2339 if (!hdr) 2340 return -EMSGSIZE; 2341 2342 if (nla_put_u32(skb, TEAM_ATTR_TEAM_IFINDEX, team->dev->ifindex)) 2343 goto nla_put_failure; 2344 option_list = nla_nest_start(skb, TEAM_ATTR_LIST_OPTION); 2345 if (!option_list) 2346 goto nla_put_failure; 2347 2348 i = 0; 2349 incomplete = false; 2350 list_for_each_entry_from(opt_inst, sel_opt_inst_list, tmp_list) { 2351 err = team_nl_fill_one_option_get(skb, team, opt_inst); 2352 if (err) { 2353 if (err == -EMSGSIZE) { 2354 if (!i) 2355 goto errout; 2356 incomplete = true; 2357 break; 2358 } 2359 goto errout; 2360 } 2361 i++; 2362 } 2363 2364 nla_nest_end(skb, option_list); 2365 genlmsg_end(skb, hdr); 2366 if (incomplete) 2367 goto start_again; 2368 2369 send_done: 2370 nlh = nlmsg_put(skb, portid, seq, NLMSG_DONE, 0, flags | NLM_F_MULTI); 2371 if (!nlh) { 2372 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2373 if (err) 2374 goto errout; 2375 goto send_done; 2376 } 2377 2378 return send_func(skb, team, portid); 2379 2380 nla_put_failure: 2381 err = -EMSGSIZE; 2382 errout: 2383 genlmsg_cancel(skb, hdr); 2384 nlmsg_free(skb); 2385 return err; 2386 } 2387 2388 static int team_nl_cmd_options_get(struct sk_buff *skb, struct genl_info *info) 2389 { 2390 struct team *team; 2391 struct team_option_inst *opt_inst; 2392 int err; 2393 LIST_HEAD(sel_opt_inst_list); 2394 2395 team = team_nl_team_get(info); 2396 if (!team) 2397 return -EINVAL; 2398 2399 list_for_each_entry(opt_inst, &team->option_inst_list, list) 2400 list_add_tail(&opt_inst->tmp_list, &sel_opt_inst_list); 2401 err = team_nl_send_options_get(team, info->snd_portid, info->snd_seq, 2402 NLM_F_ACK, team_nl_send_unicast, 2403 &sel_opt_inst_list); 2404 2405 team_nl_team_put(team); 2406 2407 return err; 2408 } 2409 2410 static int team_nl_send_event_options_get(struct team *team, 2411 struct list_head *sel_opt_inst_list); 2412 2413 static int team_nl_cmd_options_set(struct sk_buff *skb, struct genl_info *info) 2414 { 2415 struct team *team; 2416 int err = 0; 2417 int i; 2418 struct nlattr *nl_option; 2419 LIST_HEAD(opt_inst_list); 2420 2421 team = team_nl_team_get(info); 2422 if (!team) 2423 return -EINVAL; 2424 2425 err = -EINVAL; 2426 if (!info->attrs[TEAM_ATTR_LIST_OPTION]) { 2427 err = -EINVAL; 2428 goto team_put; 2429 } 2430 2431 nla_for_each_nested(nl_option, info->attrs[TEAM_ATTR_LIST_OPTION], i) { 2432 struct nlattr *opt_attrs[TEAM_ATTR_OPTION_MAX + 1]; 2433 struct nlattr *attr; 2434 struct nlattr *attr_data; 2435 enum team_option_type opt_type; 2436 int opt_port_ifindex = 0; /* != 0 for per-port options */ 2437 u32 opt_array_index = 0; 2438 bool opt_is_array = false; 2439 struct team_option_inst *opt_inst; 2440 char *opt_name; 2441 bool opt_found = false; 2442 2443 if (nla_type(nl_option) != TEAM_ATTR_ITEM_OPTION) { 2444 err = -EINVAL; 2445 goto team_put; 2446 } 2447 err = nla_parse_nested(opt_attrs, TEAM_ATTR_OPTION_MAX, 2448 nl_option, team_nl_option_policy); 2449 if (err) 2450 goto team_put; 2451 if (!opt_attrs[TEAM_ATTR_OPTION_NAME] || 2452 !opt_attrs[TEAM_ATTR_OPTION_TYPE]) { 2453 err = -EINVAL; 2454 goto team_put; 2455 } 2456 switch (nla_get_u8(opt_attrs[TEAM_ATTR_OPTION_TYPE])) { 2457 case NLA_U32: 2458 opt_type = TEAM_OPTION_TYPE_U32; 2459 break; 2460 case NLA_STRING: 2461 opt_type = TEAM_OPTION_TYPE_STRING; 2462 break; 2463 case NLA_BINARY: 2464 opt_type = TEAM_OPTION_TYPE_BINARY; 2465 break; 2466 case NLA_FLAG: 2467 opt_type = TEAM_OPTION_TYPE_BOOL; 2468 break; 2469 case NLA_S32: 2470 opt_type = TEAM_OPTION_TYPE_S32; 2471 break; 2472 default: 2473 goto team_put; 2474 } 2475 2476 attr_data = opt_attrs[TEAM_ATTR_OPTION_DATA]; 2477 if (opt_type != TEAM_OPTION_TYPE_BOOL && !attr_data) { 2478 err = -EINVAL; 2479 goto team_put; 2480 } 2481 2482 opt_name = nla_data(opt_attrs[TEAM_ATTR_OPTION_NAME]); 2483 attr = opt_attrs[TEAM_ATTR_OPTION_PORT_IFINDEX]; 2484 if (attr) 2485 opt_port_ifindex = nla_get_u32(attr); 2486 2487 attr = opt_attrs[TEAM_ATTR_OPTION_ARRAY_INDEX]; 2488 if (attr) { 2489 opt_is_array = true; 2490 opt_array_index = nla_get_u32(attr); 2491 } 2492 2493 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 2494 struct team_option *option = opt_inst->option; 2495 struct team_gsetter_ctx ctx; 2496 struct team_option_inst_info *opt_inst_info; 2497 int tmp_ifindex; 2498 2499 opt_inst_info = &opt_inst->info; 2500 tmp_ifindex = opt_inst_info->port ? 2501 opt_inst_info->port->dev->ifindex : 0; 2502 if (option->type != opt_type || 2503 strcmp(option->name, opt_name) || 2504 tmp_ifindex != opt_port_ifindex || 2505 (option->array_size && !opt_is_array) || 2506 opt_inst_info->array_index != opt_array_index) 2507 continue; 2508 opt_found = true; 2509 ctx.info = opt_inst_info; 2510 switch (opt_type) { 2511 case TEAM_OPTION_TYPE_U32: 2512 ctx.data.u32_val = nla_get_u32(attr_data); 2513 break; 2514 case TEAM_OPTION_TYPE_STRING: 2515 if (nla_len(attr_data) > TEAM_STRING_MAX_LEN) { 2516 err = -EINVAL; 2517 goto team_put; 2518 } 2519 ctx.data.str_val = nla_data(attr_data); 2520 break; 2521 case TEAM_OPTION_TYPE_BINARY: 2522 ctx.data.bin_val.len = nla_len(attr_data); 2523 ctx.data.bin_val.ptr = nla_data(attr_data); 2524 break; 2525 case TEAM_OPTION_TYPE_BOOL: 2526 ctx.data.bool_val = attr_data ? true : false; 2527 break; 2528 case TEAM_OPTION_TYPE_S32: 2529 ctx.data.s32_val = nla_get_s32(attr_data); 2530 break; 2531 default: 2532 BUG(); 2533 } 2534 err = team_option_set(team, opt_inst, &ctx); 2535 if (err) 2536 goto team_put; 2537 opt_inst->changed = true; 2538 list_add(&opt_inst->tmp_list, &opt_inst_list); 2539 } 2540 if (!opt_found) { 2541 err = -ENOENT; 2542 goto team_put; 2543 } 2544 } 2545 2546 err = team_nl_send_event_options_get(team, &opt_inst_list); 2547 2548 team_put: 2549 team_nl_team_put(team); 2550 2551 return err; 2552 } 2553 2554 static int team_nl_fill_one_port_get(struct sk_buff *skb, 2555 struct team_port *port) 2556 { 2557 struct nlattr *port_item; 2558 2559 port_item = nla_nest_start(skb, TEAM_ATTR_ITEM_PORT); 2560 if (!port_item) 2561 goto nest_cancel; 2562 if (nla_put_u32(skb, TEAM_ATTR_PORT_IFINDEX, port->dev->ifindex)) 2563 goto nest_cancel; 2564 if (port->changed) { 2565 if (nla_put_flag(skb, TEAM_ATTR_PORT_CHANGED)) 2566 goto nest_cancel; 2567 port->changed = false; 2568 } 2569 if ((port->removed && 2570 nla_put_flag(skb, TEAM_ATTR_PORT_REMOVED)) || 2571 (port->state.linkup && 2572 nla_put_flag(skb, TEAM_ATTR_PORT_LINKUP)) || 2573 nla_put_u32(skb, TEAM_ATTR_PORT_SPEED, port->state.speed) || 2574 nla_put_u8(skb, TEAM_ATTR_PORT_DUPLEX, port->state.duplex)) 2575 goto nest_cancel; 2576 nla_nest_end(skb, port_item); 2577 return 0; 2578 2579 nest_cancel: 2580 nla_nest_cancel(skb, port_item); 2581 return -EMSGSIZE; 2582 } 2583 2584 static int team_nl_send_port_list_get(struct team *team, u32 portid, u32 seq, 2585 int flags, team_nl_send_func_t *send_func, 2586 struct team_port *one_port) 2587 { 2588 struct nlattr *port_list; 2589 struct nlmsghdr *nlh; 2590 void *hdr; 2591 struct team_port *port; 2592 int err; 2593 struct sk_buff *skb = NULL; 2594 bool incomplete; 2595 int i; 2596 2597 port = list_first_entry_or_null(&team->port_list, 2598 struct team_port, list); 2599 2600 start_again: 2601 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2602 if (err) 2603 return err; 2604 2605 hdr = genlmsg_put(skb, portid, seq, &team_nl_family, flags | NLM_F_MULTI, 2606 TEAM_CMD_PORT_LIST_GET); 2607 if (!hdr) 2608 return -EMSGSIZE; 2609 2610 if (nla_put_u32(skb, TEAM_ATTR_TEAM_IFINDEX, team->dev->ifindex)) 2611 goto nla_put_failure; 2612 port_list = nla_nest_start(skb, TEAM_ATTR_LIST_PORT); 2613 if (!port_list) 2614 goto nla_put_failure; 2615 2616 i = 0; 2617 incomplete = false; 2618 2619 /* If one port is selected, called wants to send port list containing 2620 * only this port. Otherwise go through all listed ports and send all 2621 */ 2622 if (one_port) { 2623 err = team_nl_fill_one_port_get(skb, one_port); 2624 if (err) 2625 goto errout; 2626 } else if (port) { 2627 list_for_each_entry_from(port, &team->port_list, list) { 2628 err = team_nl_fill_one_port_get(skb, port); 2629 if (err) { 2630 if (err == -EMSGSIZE) { 2631 if (!i) 2632 goto errout; 2633 incomplete = true; 2634 break; 2635 } 2636 goto errout; 2637 } 2638 i++; 2639 } 2640 } 2641 2642 nla_nest_end(skb, port_list); 2643 genlmsg_end(skb, hdr); 2644 if (incomplete) 2645 goto start_again; 2646 2647 send_done: 2648 nlh = nlmsg_put(skb, portid, seq, NLMSG_DONE, 0, flags | NLM_F_MULTI); 2649 if (!nlh) { 2650 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2651 if (err) 2652 goto errout; 2653 goto send_done; 2654 } 2655 2656 return send_func(skb, team, portid); 2657 2658 nla_put_failure: 2659 err = -EMSGSIZE; 2660 errout: 2661 genlmsg_cancel(skb, hdr); 2662 nlmsg_free(skb); 2663 return err; 2664 } 2665 2666 static int team_nl_cmd_port_list_get(struct sk_buff *skb, 2667 struct genl_info *info) 2668 { 2669 struct team *team; 2670 int err; 2671 2672 team = team_nl_team_get(info); 2673 if (!team) 2674 return -EINVAL; 2675 2676 err = team_nl_send_port_list_get(team, info->snd_portid, info->snd_seq, 2677 NLM_F_ACK, team_nl_send_unicast, NULL); 2678 2679 team_nl_team_put(team); 2680 2681 return err; 2682 } 2683 2684 static const struct genl_ops team_nl_ops[] = { 2685 { 2686 .cmd = TEAM_CMD_NOOP, 2687 .doit = team_nl_cmd_noop, 2688 .policy = team_nl_policy, 2689 }, 2690 { 2691 .cmd = TEAM_CMD_OPTIONS_SET, 2692 .doit = team_nl_cmd_options_set, 2693 .policy = team_nl_policy, 2694 .flags = GENL_ADMIN_PERM, 2695 }, 2696 { 2697 .cmd = TEAM_CMD_OPTIONS_GET, 2698 .doit = team_nl_cmd_options_get, 2699 .policy = team_nl_policy, 2700 .flags = GENL_ADMIN_PERM, 2701 }, 2702 { 2703 .cmd = TEAM_CMD_PORT_LIST_GET, 2704 .doit = team_nl_cmd_port_list_get, 2705 .policy = team_nl_policy, 2706 .flags = GENL_ADMIN_PERM, 2707 }, 2708 }; 2709 2710 static const struct genl_multicast_group team_nl_mcgrps[] = { 2711 { .name = TEAM_GENL_CHANGE_EVENT_MC_GRP_NAME, }, 2712 }; 2713 2714 static int team_nl_send_multicast(struct sk_buff *skb, 2715 struct team *team, u32 portid) 2716 { 2717 return genlmsg_multicast_netns(&team_nl_family, dev_net(team->dev), 2718 skb, 0, 0, GFP_KERNEL); 2719 } 2720 2721 static int team_nl_send_event_options_get(struct team *team, 2722 struct list_head *sel_opt_inst_list) 2723 { 2724 return team_nl_send_options_get(team, 0, 0, 0, team_nl_send_multicast, 2725 sel_opt_inst_list); 2726 } 2727 2728 static int team_nl_send_event_port_get(struct team *team, 2729 struct team_port *port) 2730 { 2731 return team_nl_send_port_list_get(team, 0, 0, 0, team_nl_send_multicast, 2732 port); 2733 } 2734 2735 static int team_nl_init(void) 2736 { 2737 return genl_register_family_with_ops_groups(&team_nl_family, team_nl_ops, 2738 team_nl_mcgrps); 2739 } 2740 2741 static void team_nl_fini(void) 2742 { 2743 genl_unregister_family(&team_nl_family); 2744 } 2745 2746 2747 /****************** 2748 * Change checkers 2749 ******************/ 2750 2751 static void __team_options_change_check(struct team *team) 2752 { 2753 int err; 2754 struct team_option_inst *opt_inst; 2755 LIST_HEAD(sel_opt_inst_list); 2756 2757 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 2758 if (opt_inst->changed) 2759 list_add_tail(&opt_inst->tmp_list, &sel_opt_inst_list); 2760 } 2761 err = team_nl_send_event_options_get(team, &sel_opt_inst_list); 2762 if (err && err != -ESRCH) 2763 netdev_warn(team->dev, "Failed to send options change via netlink (err %d)\n", 2764 err); 2765 } 2766 2767 /* rtnl lock is held */ 2768 2769 static void __team_port_change_send(struct team_port *port, bool linkup) 2770 { 2771 int err; 2772 2773 port->changed = true; 2774 port->state.linkup = linkup; 2775 team_refresh_port_linkup(port); 2776 if (linkup) { 2777 struct ethtool_cmd ecmd; 2778 2779 err = __ethtool_get_settings(port->dev, &ecmd); 2780 if (!err) { 2781 port->state.speed = ethtool_cmd_speed(&ecmd); 2782 port->state.duplex = ecmd.duplex; 2783 goto send_event; 2784 } 2785 } 2786 port->state.speed = 0; 2787 port->state.duplex = 0; 2788 2789 send_event: 2790 err = team_nl_send_event_port_get(port->team, port); 2791 if (err && err != -ESRCH) 2792 netdev_warn(port->team->dev, "Failed to send port change of device %s via netlink (err %d)\n", 2793 port->dev->name, err); 2794 2795 } 2796 2797 static void __team_carrier_check(struct team *team) 2798 { 2799 struct team_port *port; 2800 bool team_linkup; 2801 2802 if (team->user_carrier_enabled) 2803 return; 2804 2805 team_linkup = false; 2806 list_for_each_entry(port, &team->port_list, list) { 2807 if (port->linkup) { 2808 team_linkup = true; 2809 break; 2810 } 2811 } 2812 2813 if (team_linkup) 2814 netif_carrier_on(team->dev); 2815 else 2816 netif_carrier_off(team->dev); 2817 } 2818 2819 static void __team_port_change_check(struct team_port *port, bool linkup) 2820 { 2821 if (port->state.linkup != linkup) 2822 __team_port_change_send(port, linkup); 2823 __team_carrier_check(port->team); 2824 } 2825 2826 static void __team_port_change_port_added(struct team_port *port, bool linkup) 2827 { 2828 __team_port_change_send(port, linkup); 2829 __team_carrier_check(port->team); 2830 } 2831 2832 static void __team_port_change_port_removed(struct team_port *port) 2833 { 2834 port->removed = true; 2835 __team_port_change_send(port, false); 2836 __team_carrier_check(port->team); 2837 } 2838 2839 static void team_port_change_check(struct team_port *port, bool linkup) 2840 { 2841 struct team *team = port->team; 2842 2843 mutex_lock(&team->lock); 2844 __team_port_change_check(port, linkup); 2845 mutex_unlock(&team->lock); 2846 } 2847 2848 2849 /************************************ 2850 * Net device notifier event handler 2851 ************************************/ 2852 2853 static int team_device_event(struct notifier_block *unused, 2854 unsigned long event, void *ptr) 2855 { 2856 struct net_device *dev = netdev_notifier_info_to_dev(ptr); 2857 struct team_port *port; 2858 2859 port = team_port_get_rtnl(dev); 2860 if (!port) 2861 return NOTIFY_DONE; 2862 2863 switch (event) { 2864 case NETDEV_UP: 2865 if (netif_carrier_ok(dev)) 2866 team_port_change_check(port, true); 2867 break; 2868 case NETDEV_DOWN: 2869 team_port_change_check(port, false); 2870 break; 2871 case NETDEV_CHANGE: 2872 if (netif_running(port->dev)) 2873 team_port_change_check(port, 2874 !!netif_carrier_ok(port->dev)); 2875 break; 2876 case NETDEV_UNREGISTER: 2877 team_del_slave(port->team->dev, dev); 2878 break; 2879 case NETDEV_FEAT_CHANGE: 2880 team_compute_features(port->team); 2881 break; 2882 case NETDEV_PRECHANGEMTU: 2883 /* Forbid to change mtu of underlaying device */ 2884 if (!port->team->port_mtu_change_allowed) 2885 return NOTIFY_BAD; 2886 break; 2887 case NETDEV_PRE_TYPE_CHANGE: 2888 /* Forbid to change type of underlaying device */ 2889 return NOTIFY_BAD; 2890 case NETDEV_RESEND_IGMP: 2891 /* Propagate to master device */ 2892 call_netdevice_notifiers(event, port->team->dev); 2893 break; 2894 } 2895 return NOTIFY_DONE; 2896 } 2897 2898 static struct notifier_block team_notifier_block __read_mostly = { 2899 .notifier_call = team_device_event, 2900 }; 2901 2902 2903 /*********************** 2904 * Module init and exit 2905 ***********************/ 2906 2907 static int __init team_module_init(void) 2908 { 2909 int err; 2910 2911 register_netdevice_notifier(&team_notifier_block); 2912 2913 err = rtnl_link_register(&team_link_ops); 2914 if (err) 2915 goto err_rtnl_reg; 2916 2917 err = team_nl_init(); 2918 if (err) 2919 goto err_nl_init; 2920 2921 return 0; 2922 2923 err_nl_init: 2924 rtnl_link_unregister(&team_link_ops); 2925 2926 err_rtnl_reg: 2927 unregister_netdevice_notifier(&team_notifier_block); 2928 2929 return err; 2930 } 2931 2932 static void __exit team_module_exit(void) 2933 { 2934 team_nl_fini(); 2935 rtnl_link_unregister(&team_link_ops); 2936 unregister_netdevice_notifier(&team_notifier_block); 2937 } 2938 2939 module_init(team_module_init); 2940 module_exit(team_module_exit); 2941 2942 MODULE_LICENSE("GPL v2"); 2943 MODULE_AUTHOR("Jiri Pirko <jpirko@redhat.com>"); 2944 MODULE_DESCRIPTION("Ethernet team device driver"); 2945 MODULE_ALIAS_RTNL_LINK(DRV_NAME); 2946