1 /* 2 * drivers/net/team/team.c - Network team device driver 3 * Copyright (c) 2011 Jiri Pirko <jpirko@redhat.com> 4 * 5 * This program is free software; you can redistribute it and/or modify 6 * it under the terms of the GNU General Public License as published by 7 * the Free Software Foundation; either version 2 of the License, or 8 * (at your option) any later version. 9 */ 10 11 #include <linux/kernel.h> 12 #include <linux/types.h> 13 #include <linux/module.h> 14 #include <linux/init.h> 15 #include <linux/slab.h> 16 #include <linux/rcupdate.h> 17 #include <linux/errno.h> 18 #include <linux/ctype.h> 19 #include <linux/notifier.h> 20 #include <linux/netdevice.h> 21 #include <linux/netpoll.h> 22 #include <linux/if_vlan.h> 23 #include <linux/if_arp.h> 24 #include <linux/socket.h> 25 #include <linux/etherdevice.h> 26 #include <linux/rtnetlink.h> 27 #include <net/rtnetlink.h> 28 #include <net/genetlink.h> 29 #include <net/netlink.h> 30 #include <net/sch_generic.h> 31 #include <generated/utsrelease.h> 32 #include <linux/if_team.h> 33 34 #define DRV_NAME "team" 35 36 37 /********** 38 * Helpers 39 **********/ 40 41 #define team_port_exists(dev) (dev->priv_flags & IFF_TEAM_PORT) 42 43 static struct team_port *team_port_get_rcu(const struct net_device *dev) 44 { 45 struct team_port *port = rcu_dereference(dev->rx_handler_data); 46 47 return team_port_exists(dev) ? port : NULL; 48 } 49 50 static struct team_port *team_port_get_rtnl(const struct net_device *dev) 51 { 52 struct team_port *port = rtnl_dereference(dev->rx_handler_data); 53 54 return team_port_exists(dev) ? port : NULL; 55 } 56 57 /* 58 * Since the ability to change device address for open port device is tested in 59 * team_port_add, this function can be called without control of return value 60 */ 61 static int __set_port_dev_addr(struct net_device *port_dev, 62 const unsigned char *dev_addr) 63 { 64 struct sockaddr addr; 65 66 memcpy(addr.sa_data, dev_addr, port_dev->addr_len); 67 addr.sa_family = port_dev->type; 68 return dev_set_mac_address(port_dev, &addr); 69 } 70 71 static int team_port_set_orig_dev_addr(struct team_port *port) 72 { 73 return __set_port_dev_addr(port->dev, port->orig.dev_addr); 74 } 75 76 static int team_port_set_team_dev_addr(struct team *team, 77 struct team_port *port) 78 { 79 return __set_port_dev_addr(port->dev, team->dev->dev_addr); 80 } 81 82 int team_modeop_port_enter(struct team *team, struct team_port *port) 83 { 84 return team_port_set_team_dev_addr(team, port); 85 } 86 EXPORT_SYMBOL(team_modeop_port_enter); 87 88 void team_modeop_port_change_dev_addr(struct team *team, 89 struct team_port *port) 90 { 91 team_port_set_team_dev_addr(team, port); 92 } 93 EXPORT_SYMBOL(team_modeop_port_change_dev_addr); 94 95 static void team_refresh_port_linkup(struct team_port *port) 96 { 97 port->linkup = port->user.linkup_enabled ? port->user.linkup : 98 port->state.linkup; 99 } 100 101 102 /******************* 103 * Options handling 104 *******************/ 105 106 struct team_option_inst { /* One for each option instance */ 107 struct list_head list; 108 struct list_head tmp_list; 109 struct team_option *option; 110 struct team_option_inst_info info; 111 bool changed; 112 bool removed; 113 }; 114 115 static struct team_option *__team_find_option(struct team *team, 116 const char *opt_name) 117 { 118 struct team_option *option; 119 120 list_for_each_entry(option, &team->option_list, list) { 121 if (strcmp(option->name, opt_name) == 0) 122 return option; 123 } 124 return NULL; 125 } 126 127 static void __team_option_inst_del(struct team_option_inst *opt_inst) 128 { 129 list_del(&opt_inst->list); 130 kfree(opt_inst); 131 } 132 133 static void __team_option_inst_del_option(struct team *team, 134 struct team_option *option) 135 { 136 struct team_option_inst *opt_inst, *tmp; 137 138 list_for_each_entry_safe(opt_inst, tmp, &team->option_inst_list, list) { 139 if (opt_inst->option == option) 140 __team_option_inst_del(opt_inst); 141 } 142 } 143 144 static int __team_option_inst_add(struct team *team, struct team_option *option, 145 struct team_port *port) 146 { 147 struct team_option_inst *opt_inst; 148 unsigned int array_size; 149 unsigned int i; 150 int err; 151 152 array_size = option->array_size; 153 if (!array_size) 154 array_size = 1; /* No array but still need one instance */ 155 156 for (i = 0; i < array_size; i++) { 157 opt_inst = kmalloc(sizeof(*opt_inst), GFP_KERNEL); 158 if (!opt_inst) 159 return -ENOMEM; 160 opt_inst->option = option; 161 opt_inst->info.port = port; 162 opt_inst->info.array_index = i; 163 opt_inst->changed = true; 164 opt_inst->removed = false; 165 list_add_tail(&opt_inst->list, &team->option_inst_list); 166 if (option->init) { 167 err = option->init(team, &opt_inst->info); 168 if (err) 169 return err; 170 } 171 172 } 173 return 0; 174 } 175 176 static int __team_option_inst_add_option(struct team *team, 177 struct team_option *option) 178 { 179 struct team_port *port; 180 int err; 181 182 if (!option->per_port) { 183 err = __team_option_inst_add(team, option, NULL); 184 if (err) 185 goto inst_del_option; 186 } 187 188 list_for_each_entry(port, &team->port_list, list) { 189 err = __team_option_inst_add(team, option, port); 190 if (err) 191 goto inst_del_option; 192 } 193 return 0; 194 195 inst_del_option: 196 __team_option_inst_del_option(team, option); 197 return err; 198 } 199 200 static void __team_option_inst_mark_removed_option(struct team *team, 201 struct team_option *option) 202 { 203 struct team_option_inst *opt_inst; 204 205 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 206 if (opt_inst->option == option) { 207 opt_inst->changed = true; 208 opt_inst->removed = true; 209 } 210 } 211 } 212 213 static void __team_option_inst_del_port(struct team *team, 214 struct team_port *port) 215 { 216 struct team_option_inst *opt_inst, *tmp; 217 218 list_for_each_entry_safe(opt_inst, tmp, &team->option_inst_list, list) { 219 if (opt_inst->option->per_port && 220 opt_inst->info.port == port) 221 __team_option_inst_del(opt_inst); 222 } 223 } 224 225 static int __team_option_inst_add_port(struct team *team, 226 struct team_port *port) 227 { 228 struct team_option *option; 229 int err; 230 231 list_for_each_entry(option, &team->option_list, list) { 232 if (!option->per_port) 233 continue; 234 err = __team_option_inst_add(team, option, port); 235 if (err) 236 goto inst_del_port; 237 } 238 return 0; 239 240 inst_del_port: 241 __team_option_inst_del_port(team, port); 242 return err; 243 } 244 245 static void __team_option_inst_mark_removed_port(struct team *team, 246 struct team_port *port) 247 { 248 struct team_option_inst *opt_inst; 249 250 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 251 if (opt_inst->info.port == port) { 252 opt_inst->changed = true; 253 opt_inst->removed = true; 254 } 255 } 256 } 257 258 static int __team_options_register(struct team *team, 259 const struct team_option *option, 260 size_t option_count) 261 { 262 int i; 263 struct team_option **dst_opts; 264 int err; 265 266 dst_opts = kzalloc(sizeof(struct team_option *) * option_count, 267 GFP_KERNEL); 268 if (!dst_opts) 269 return -ENOMEM; 270 for (i = 0; i < option_count; i++, option++) { 271 if (__team_find_option(team, option->name)) { 272 err = -EEXIST; 273 goto alloc_rollback; 274 } 275 dst_opts[i] = kmemdup(option, sizeof(*option), GFP_KERNEL); 276 if (!dst_opts[i]) { 277 err = -ENOMEM; 278 goto alloc_rollback; 279 } 280 } 281 282 for (i = 0; i < option_count; i++) { 283 err = __team_option_inst_add_option(team, dst_opts[i]); 284 if (err) 285 goto inst_rollback; 286 list_add_tail(&dst_opts[i]->list, &team->option_list); 287 } 288 289 kfree(dst_opts); 290 return 0; 291 292 inst_rollback: 293 for (i--; i >= 0; i--) 294 __team_option_inst_del_option(team, dst_opts[i]); 295 296 i = option_count - 1; 297 alloc_rollback: 298 for (i--; i >= 0; i--) 299 kfree(dst_opts[i]); 300 301 kfree(dst_opts); 302 return err; 303 } 304 305 static void __team_options_mark_removed(struct team *team, 306 const struct team_option *option, 307 size_t option_count) 308 { 309 int i; 310 311 for (i = 0; i < option_count; i++, option++) { 312 struct team_option *del_opt; 313 314 del_opt = __team_find_option(team, option->name); 315 if (del_opt) 316 __team_option_inst_mark_removed_option(team, del_opt); 317 } 318 } 319 320 static void __team_options_unregister(struct team *team, 321 const struct team_option *option, 322 size_t option_count) 323 { 324 int i; 325 326 for (i = 0; i < option_count; i++, option++) { 327 struct team_option *del_opt; 328 329 del_opt = __team_find_option(team, option->name); 330 if (del_opt) { 331 __team_option_inst_del_option(team, del_opt); 332 list_del(&del_opt->list); 333 kfree(del_opt); 334 } 335 } 336 } 337 338 static void __team_options_change_check(struct team *team); 339 340 int team_options_register(struct team *team, 341 const struct team_option *option, 342 size_t option_count) 343 { 344 int err; 345 346 err = __team_options_register(team, option, option_count); 347 if (err) 348 return err; 349 __team_options_change_check(team); 350 return 0; 351 } 352 EXPORT_SYMBOL(team_options_register); 353 354 void team_options_unregister(struct team *team, 355 const struct team_option *option, 356 size_t option_count) 357 { 358 __team_options_mark_removed(team, option, option_count); 359 __team_options_change_check(team); 360 __team_options_unregister(team, option, option_count); 361 } 362 EXPORT_SYMBOL(team_options_unregister); 363 364 static int team_option_get(struct team *team, 365 struct team_option_inst *opt_inst, 366 struct team_gsetter_ctx *ctx) 367 { 368 if (!opt_inst->option->getter) 369 return -EOPNOTSUPP; 370 return opt_inst->option->getter(team, ctx); 371 } 372 373 static int team_option_set(struct team *team, 374 struct team_option_inst *opt_inst, 375 struct team_gsetter_ctx *ctx) 376 { 377 if (!opt_inst->option->setter) 378 return -EOPNOTSUPP; 379 return opt_inst->option->setter(team, ctx); 380 } 381 382 void team_option_inst_set_change(struct team_option_inst_info *opt_inst_info) 383 { 384 struct team_option_inst *opt_inst; 385 386 opt_inst = container_of(opt_inst_info, struct team_option_inst, info); 387 opt_inst->changed = true; 388 } 389 EXPORT_SYMBOL(team_option_inst_set_change); 390 391 void team_options_change_check(struct team *team) 392 { 393 __team_options_change_check(team); 394 } 395 EXPORT_SYMBOL(team_options_change_check); 396 397 398 /**************** 399 * Mode handling 400 ****************/ 401 402 static LIST_HEAD(mode_list); 403 static DEFINE_SPINLOCK(mode_list_lock); 404 405 struct team_mode_item { 406 struct list_head list; 407 const struct team_mode *mode; 408 }; 409 410 static struct team_mode_item *__find_mode(const char *kind) 411 { 412 struct team_mode_item *mitem; 413 414 list_for_each_entry(mitem, &mode_list, list) { 415 if (strcmp(mitem->mode->kind, kind) == 0) 416 return mitem; 417 } 418 return NULL; 419 } 420 421 static bool is_good_mode_name(const char *name) 422 { 423 while (*name != '\0') { 424 if (!isalpha(*name) && !isdigit(*name) && *name != '_') 425 return false; 426 name++; 427 } 428 return true; 429 } 430 431 int team_mode_register(const struct team_mode *mode) 432 { 433 int err = 0; 434 struct team_mode_item *mitem; 435 436 if (!is_good_mode_name(mode->kind) || 437 mode->priv_size > TEAM_MODE_PRIV_SIZE) 438 return -EINVAL; 439 440 mitem = kmalloc(sizeof(*mitem), GFP_KERNEL); 441 if (!mitem) 442 return -ENOMEM; 443 444 spin_lock(&mode_list_lock); 445 if (__find_mode(mode->kind)) { 446 err = -EEXIST; 447 kfree(mitem); 448 goto unlock; 449 } 450 mitem->mode = mode; 451 list_add_tail(&mitem->list, &mode_list); 452 unlock: 453 spin_unlock(&mode_list_lock); 454 return err; 455 } 456 EXPORT_SYMBOL(team_mode_register); 457 458 void team_mode_unregister(const struct team_mode *mode) 459 { 460 struct team_mode_item *mitem; 461 462 spin_lock(&mode_list_lock); 463 mitem = __find_mode(mode->kind); 464 if (mitem) { 465 list_del_init(&mitem->list); 466 kfree(mitem); 467 } 468 spin_unlock(&mode_list_lock); 469 } 470 EXPORT_SYMBOL(team_mode_unregister); 471 472 static const struct team_mode *team_mode_get(const char *kind) 473 { 474 struct team_mode_item *mitem; 475 const struct team_mode *mode = NULL; 476 477 spin_lock(&mode_list_lock); 478 mitem = __find_mode(kind); 479 if (!mitem) { 480 spin_unlock(&mode_list_lock); 481 request_module("team-mode-%s", kind); 482 spin_lock(&mode_list_lock); 483 mitem = __find_mode(kind); 484 } 485 if (mitem) { 486 mode = mitem->mode; 487 if (!try_module_get(mode->owner)) 488 mode = NULL; 489 } 490 491 spin_unlock(&mode_list_lock); 492 return mode; 493 } 494 495 static void team_mode_put(const struct team_mode *mode) 496 { 497 module_put(mode->owner); 498 } 499 500 static bool team_dummy_transmit(struct team *team, struct sk_buff *skb) 501 { 502 dev_kfree_skb_any(skb); 503 return false; 504 } 505 506 static rx_handler_result_t team_dummy_receive(struct team *team, 507 struct team_port *port, 508 struct sk_buff *skb) 509 { 510 return RX_HANDLER_ANOTHER; 511 } 512 513 static const struct team_mode __team_no_mode = { 514 .kind = "*NOMODE*", 515 }; 516 517 static bool team_is_mode_set(struct team *team) 518 { 519 return team->mode != &__team_no_mode; 520 } 521 522 static void team_set_no_mode(struct team *team) 523 { 524 team->user_carrier_enabled = false; 525 team->mode = &__team_no_mode; 526 } 527 528 static void team_adjust_ops(struct team *team) 529 { 530 /* 531 * To avoid checks in rx/tx skb paths, ensure here that non-null and 532 * correct ops are always set. 533 */ 534 535 if (!team->en_port_count || !team_is_mode_set(team) || 536 !team->mode->ops->transmit) 537 team->ops.transmit = team_dummy_transmit; 538 else 539 team->ops.transmit = team->mode->ops->transmit; 540 541 if (!team->en_port_count || !team_is_mode_set(team) || 542 !team->mode->ops->receive) 543 team->ops.receive = team_dummy_receive; 544 else 545 team->ops.receive = team->mode->ops->receive; 546 } 547 548 /* 549 * We can benefit from the fact that it's ensured no port is present 550 * at the time of mode change. Therefore no packets are in fly so there's no 551 * need to set mode operations in any special way. 552 */ 553 static int __team_change_mode(struct team *team, 554 const struct team_mode *new_mode) 555 { 556 /* Check if mode was previously set and do cleanup if so */ 557 if (team_is_mode_set(team)) { 558 void (*exit_op)(struct team *team) = team->ops.exit; 559 560 /* Clear ops area so no callback is called any longer */ 561 memset(&team->ops, 0, sizeof(struct team_mode_ops)); 562 team_adjust_ops(team); 563 564 if (exit_op) 565 exit_op(team); 566 team_mode_put(team->mode); 567 team_set_no_mode(team); 568 /* zero private data area */ 569 memset(&team->mode_priv, 0, 570 sizeof(struct team) - offsetof(struct team, mode_priv)); 571 } 572 573 if (!new_mode) 574 return 0; 575 576 if (new_mode->ops->init) { 577 int err; 578 579 err = new_mode->ops->init(team); 580 if (err) 581 return err; 582 } 583 584 team->mode = new_mode; 585 memcpy(&team->ops, new_mode->ops, sizeof(struct team_mode_ops)); 586 team_adjust_ops(team); 587 588 return 0; 589 } 590 591 static int team_change_mode(struct team *team, const char *kind) 592 { 593 const struct team_mode *new_mode; 594 struct net_device *dev = team->dev; 595 int err; 596 597 if (!list_empty(&team->port_list)) { 598 netdev_err(dev, "No ports can be present during mode change\n"); 599 return -EBUSY; 600 } 601 602 if (team_is_mode_set(team) && strcmp(team->mode->kind, kind) == 0) { 603 netdev_err(dev, "Unable to change to the same mode the team is in\n"); 604 return -EINVAL; 605 } 606 607 new_mode = team_mode_get(kind); 608 if (!new_mode) { 609 netdev_err(dev, "Mode \"%s\" not found\n", kind); 610 return -EINVAL; 611 } 612 613 err = __team_change_mode(team, new_mode); 614 if (err) { 615 netdev_err(dev, "Failed to change to mode \"%s\"\n", kind); 616 team_mode_put(new_mode); 617 return err; 618 } 619 620 netdev_info(dev, "Mode changed to \"%s\"\n", kind); 621 return 0; 622 } 623 624 625 /********************* 626 * Peers notification 627 *********************/ 628 629 static void team_notify_peers_work(struct work_struct *work) 630 { 631 struct team *team; 632 633 team = container_of(work, struct team, notify_peers.dw.work); 634 635 if (!rtnl_trylock()) { 636 schedule_delayed_work(&team->notify_peers.dw, 0); 637 return; 638 } 639 call_netdevice_notifiers(NETDEV_NOTIFY_PEERS, team->dev); 640 rtnl_unlock(); 641 if (!atomic_dec_and_test(&team->notify_peers.count_pending)) 642 schedule_delayed_work(&team->notify_peers.dw, 643 msecs_to_jiffies(team->notify_peers.interval)); 644 } 645 646 static void team_notify_peers(struct team *team) 647 { 648 if (!team->notify_peers.count || !netif_running(team->dev)) 649 return; 650 atomic_add(team->notify_peers.count, &team->notify_peers.count_pending); 651 schedule_delayed_work(&team->notify_peers.dw, 0); 652 } 653 654 static void team_notify_peers_init(struct team *team) 655 { 656 INIT_DELAYED_WORK(&team->notify_peers.dw, team_notify_peers_work); 657 } 658 659 static void team_notify_peers_fini(struct team *team) 660 { 661 cancel_delayed_work_sync(&team->notify_peers.dw); 662 } 663 664 665 /******************************* 666 * Send multicast group rejoins 667 *******************************/ 668 669 static void team_mcast_rejoin_work(struct work_struct *work) 670 { 671 struct team *team; 672 673 team = container_of(work, struct team, mcast_rejoin.dw.work); 674 675 if (!rtnl_trylock()) { 676 schedule_delayed_work(&team->mcast_rejoin.dw, 0); 677 return; 678 } 679 call_netdevice_notifiers(NETDEV_RESEND_IGMP, team->dev); 680 rtnl_unlock(); 681 if (!atomic_dec_and_test(&team->mcast_rejoin.count_pending)) 682 schedule_delayed_work(&team->mcast_rejoin.dw, 683 msecs_to_jiffies(team->mcast_rejoin.interval)); 684 } 685 686 static void team_mcast_rejoin(struct team *team) 687 { 688 if (!team->mcast_rejoin.count || !netif_running(team->dev)) 689 return; 690 atomic_add(team->mcast_rejoin.count, &team->mcast_rejoin.count_pending); 691 schedule_delayed_work(&team->mcast_rejoin.dw, 0); 692 } 693 694 static void team_mcast_rejoin_init(struct team *team) 695 { 696 INIT_DELAYED_WORK(&team->mcast_rejoin.dw, team_mcast_rejoin_work); 697 } 698 699 static void team_mcast_rejoin_fini(struct team *team) 700 { 701 cancel_delayed_work_sync(&team->mcast_rejoin.dw); 702 } 703 704 705 /************************ 706 * Rx path frame handler 707 ************************/ 708 709 /* note: already called with rcu_read_lock */ 710 static rx_handler_result_t team_handle_frame(struct sk_buff **pskb) 711 { 712 struct sk_buff *skb = *pskb; 713 struct team_port *port; 714 struct team *team; 715 rx_handler_result_t res; 716 717 skb = skb_share_check(skb, GFP_ATOMIC); 718 if (!skb) 719 return RX_HANDLER_CONSUMED; 720 721 *pskb = skb; 722 723 port = team_port_get_rcu(skb->dev); 724 team = port->team; 725 if (!team_port_enabled(port)) { 726 /* allow exact match delivery for disabled ports */ 727 res = RX_HANDLER_EXACT; 728 } else { 729 res = team->ops.receive(team, port, skb); 730 } 731 if (res == RX_HANDLER_ANOTHER) { 732 struct team_pcpu_stats *pcpu_stats; 733 734 pcpu_stats = this_cpu_ptr(team->pcpu_stats); 735 u64_stats_update_begin(&pcpu_stats->syncp); 736 pcpu_stats->rx_packets++; 737 pcpu_stats->rx_bytes += skb->len; 738 if (skb->pkt_type == PACKET_MULTICAST) 739 pcpu_stats->rx_multicast++; 740 u64_stats_update_end(&pcpu_stats->syncp); 741 742 skb->dev = team->dev; 743 } else { 744 this_cpu_inc(team->pcpu_stats->rx_dropped); 745 } 746 747 return res; 748 } 749 750 751 /************************************* 752 * Multiqueue Tx port select override 753 *************************************/ 754 755 static int team_queue_override_init(struct team *team) 756 { 757 struct list_head *listarr; 758 unsigned int queue_cnt = team->dev->num_tx_queues - 1; 759 unsigned int i; 760 761 if (!queue_cnt) 762 return 0; 763 listarr = kmalloc(sizeof(struct list_head) * queue_cnt, GFP_KERNEL); 764 if (!listarr) 765 return -ENOMEM; 766 team->qom_lists = listarr; 767 for (i = 0; i < queue_cnt; i++) 768 INIT_LIST_HEAD(listarr++); 769 return 0; 770 } 771 772 static void team_queue_override_fini(struct team *team) 773 { 774 kfree(team->qom_lists); 775 } 776 777 static struct list_head *__team_get_qom_list(struct team *team, u16 queue_id) 778 { 779 return &team->qom_lists[queue_id - 1]; 780 } 781 782 /* 783 * note: already called with rcu_read_lock 784 */ 785 static bool team_queue_override_transmit(struct team *team, struct sk_buff *skb) 786 { 787 struct list_head *qom_list; 788 struct team_port *port; 789 790 if (!team->queue_override_enabled || !skb->queue_mapping) 791 return false; 792 qom_list = __team_get_qom_list(team, skb->queue_mapping); 793 list_for_each_entry_rcu(port, qom_list, qom_list) { 794 if (!team_dev_queue_xmit(team, port, skb)) 795 return true; 796 } 797 return false; 798 } 799 800 static void __team_queue_override_port_del(struct team *team, 801 struct team_port *port) 802 { 803 if (!port->queue_id) 804 return; 805 list_del_rcu(&port->qom_list); 806 } 807 808 static bool team_queue_override_port_has_gt_prio_than(struct team_port *port, 809 struct team_port *cur) 810 { 811 if (port->priority < cur->priority) 812 return true; 813 if (port->priority > cur->priority) 814 return false; 815 if (port->index < cur->index) 816 return true; 817 return false; 818 } 819 820 static void __team_queue_override_port_add(struct team *team, 821 struct team_port *port) 822 { 823 struct team_port *cur; 824 struct list_head *qom_list; 825 struct list_head *node; 826 827 if (!port->queue_id) 828 return; 829 qom_list = __team_get_qom_list(team, port->queue_id); 830 node = qom_list; 831 list_for_each_entry(cur, qom_list, qom_list) { 832 if (team_queue_override_port_has_gt_prio_than(port, cur)) 833 break; 834 node = &cur->qom_list; 835 } 836 list_add_tail_rcu(&port->qom_list, node); 837 } 838 839 static void __team_queue_override_enabled_check(struct team *team) 840 { 841 struct team_port *port; 842 bool enabled = false; 843 844 list_for_each_entry(port, &team->port_list, list) { 845 if (port->queue_id) { 846 enabled = true; 847 break; 848 } 849 } 850 if (enabled == team->queue_override_enabled) 851 return; 852 netdev_dbg(team->dev, "%s queue override\n", 853 enabled ? "Enabling" : "Disabling"); 854 team->queue_override_enabled = enabled; 855 } 856 857 static void team_queue_override_port_prio_changed(struct team *team, 858 struct team_port *port) 859 { 860 if (!port->queue_id || team_port_enabled(port)) 861 return; 862 __team_queue_override_port_del(team, port); 863 __team_queue_override_port_add(team, port); 864 __team_queue_override_enabled_check(team); 865 } 866 867 static void team_queue_override_port_change_queue_id(struct team *team, 868 struct team_port *port, 869 u16 new_queue_id) 870 { 871 if (team_port_enabled(port)) { 872 __team_queue_override_port_del(team, port); 873 port->queue_id = new_queue_id; 874 __team_queue_override_port_add(team, port); 875 __team_queue_override_enabled_check(team); 876 } else { 877 port->queue_id = new_queue_id; 878 } 879 } 880 881 static void team_queue_override_port_add(struct team *team, 882 struct team_port *port) 883 { 884 __team_queue_override_port_add(team, port); 885 __team_queue_override_enabled_check(team); 886 } 887 888 static void team_queue_override_port_del(struct team *team, 889 struct team_port *port) 890 { 891 __team_queue_override_port_del(team, port); 892 __team_queue_override_enabled_check(team); 893 } 894 895 896 /**************** 897 * Port handling 898 ****************/ 899 900 static bool team_port_find(const struct team *team, 901 const struct team_port *port) 902 { 903 struct team_port *cur; 904 905 list_for_each_entry(cur, &team->port_list, list) 906 if (cur == port) 907 return true; 908 return false; 909 } 910 911 /* 912 * Enable/disable port by adding to enabled port hashlist and setting 913 * port->index (Might be racy so reader could see incorrect ifindex when 914 * processing a flying packet, but that is not a problem). Write guarded 915 * by team->lock. 916 */ 917 static void team_port_enable(struct team *team, 918 struct team_port *port) 919 { 920 if (team_port_enabled(port)) 921 return; 922 port->index = team->en_port_count++; 923 hlist_add_head_rcu(&port->hlist, 924 team_port_index_hash(team, port->index)); 925 team_adjust_ops(team); 926 team_queue_override_port_add(team, port); 927 if (team->ops.port_enabled) 928 team->ops.port_enabled(team, port); 929 team_notify_peers(team); 930 team_mcast_rejoin(team); 931 } 932 933 static void __reconstruct_port_hlist(struct team *team, int rm_index) 934 { 935 int i; 936 struct team_port *port; 937 938 for (i = rm_index + 1; i < team->en_port_count; i++) { 939 port = team_get_port_by_index(team, i); 940 hlist_del_rcu(&port->hlist); 941 port->index--; 942 hlist_add_head_rcu(&port->hlist, 943 team_port_index_hash(team, port->index)); 944 } 945 } 946 947 static void team_port_disable(struct team *team, 948 struct team_port *port) 949 { 950 if (!team_port_enabled(port)) 951 return; 952 if (team->ops.port_disabled) 953 team->ops.port_disabled(team, port); 954 hlist_del_rcu(&port->hlist); 955 __reconstruct_port_hlist(team, port->index); 956 port->index = -1; 957 team->en_port_count--; 958 team_queue_override_port_del(team, port); 959 team_adjust_ops(team); 960 team_notify_peers(team); 961 team_mcast_rejoin(team); 962 } 963 964 #define TEAM_VLAN_FEATURES (NETIF_F_ALL_CSUM | NETIF_F_SG | \ 965 NETIF_F_FRAGLIST | NETIF_F_ALL_TSO | \ 966 NETIF_F_HIGHDMA | NETIF_F_LRO) 967 968 static void __team_compute_features(struct team *team) 969 { 970 struct team_port *port; 971 u32 vlan_features = TEAM_VLAN_FEATURES & NETIF_F_ALL_FOR_ALL; 972 unsigned short max_hard_header_len = ETH_HLEN; 973 unsigned int dst_release_flag = IFF_XMIT_DST_RELEASE | 974 IFF_XMIT_DST_RELEASE_PERM; 975 976 list_for_each_entry(port, &team->port_list, list) { 977 vlan_features = netdev_increment_features(vlan_features, 978 port->dev->vlan_features, 979 TEAM_VLAN_FEATURES); 980 981 dst_release_flag &= port->dev->priv_flags; 982 if (port->dev->hard_header_len > max_hard_header_len) 983 max_hard_header_len = port->dev->hard_header_len; 984 } 985 986 team->dev->vlan_features = vlan_features; 987 team->dev->hard_header_len = max_hard_header_len; 988 989 team->dev->priv_flags &= ~IFF_XMIT_DST_RELEASE; 990 if (dst_release_flag == (IFF_XMIT_DST_RELEASE | IFF_XMIT_DST_RELEASE_PERM)) 991 team->dev->priv_flags |= IFF_XMIT_DST_RELEASE; 992 993 netdev_change_features(team->dev); 994 } 995 996 static void team_compute_features(struct team *team) 997 { 998 mutex_lock(&team->lock); 999 __team_compute_features(team); 1000 mutex_unlock(&team->lock); 1001 } 1002 1003 static int team_port_enter(struct team *team, struct team_port *port) 1004 { 1005 int err = 0; 1006 1007 dev_hold(team->dev); 1008 if (team->ops.port_enter) { 1009 err = team->ops.port_enter(team, port); 1010 if (err) { 1011 netdev_err(team->dev, "Device %s failed to enter team mode\n", 1012 port->dev->name); 1013 goto err_port_enter; 1014 } 1015 } 1016 1017 return 0; 1018 1019 err_port_enter: 1020 dev_put(team->dev); 1021 1022 return err; 1023 } 1024 1025 static void team_port_leave(struct team *team, struct team_port *port) 1026 { 1027 if (team->ops.port_leave) 1028 team->ops.port_leave(team, port); 1029 dev_put(team->dev); 1030 } 1031 1032 #ifdef CONFIG_NET_POLL_CONTROLLER 1033 static int team_port_enable_netpoll(struct team *team, struct team_port *port) 1034 { 1035 struct netpoll *np; 1036 int err; 1037 1038 if (!team->dev->npinfo) 1039 return 0; 1040 1041 np = kzalloc(sizeof(*np), GFP_KERNEL); 1042 if (!np) 1043 return -ENOMEM; 1044 1045 err = __netpoll_setup(np, port->dev); 1046 if (err) { 1047 kfree(np); 1048 return err; 1049 } 1050 port->np = np; 1051 return err; 1052 } 1053 1054 static void team_port_disable_netpoll(struct team_port *port) 1055 { 1056 struct netpoll *np = port->np; 1057 1058 if (!np) 1059 return; 1060 port->np = NULL; 1061 1062 /* Wait for transmitting packets to finish before freeing. */ 1063 synchronize_rcu_bh(); 1064 __netpoll_cleanup(np); 1065 kfree(np); 1066 } 1067 #else 1068 static int team_port_enable_netpoll(struct team *team, struct team_port *port) 1069 { 1070 return 0; 1071 } 1072 static void team_port_disable_netpoll(struct team_port *port) 1073 { 1074 } 1075 #endif 1076 1077 static int team_upper_dev_link(struct net_device *dev, 1078 struct net_device *port_dev) 1079 { 1080 int err; 1081 1082 err = netdev_master_upper_dev_link(port_dev, dev); 1083 if (err) 1084 return err; 1085 port_dev->priv_flags |= IFF_TEAM_PORT; 1086 return 0; 1087 } 1088 1089 static void team_upper_dev_unlink(struct net_device *dev, 1090 struct net_device *port_dev) 1091 { 1092 netdev_upper_dev_unlink(port_dev, dev); 1093 port_dev->priv_flags &= ~IFF_TEAM_PORT; 1094 } 1095 1096 static void __team_port_change_port_added(struct team_port *port, bool linkup); 1097 static int team_dev_type_check_change(struct net_device *dev, 1098 struct net_device *port_dev); 1099 1100 static int team_port_add(struct team *team, struct net_device *port_dev) 1101 { 1102 struct net_device *dev = team->dev; 1103 struct team_port *port; 1104 char *portname = port_dev->name; 1105 int err; 1106 1107 if (port_dev->flags & IFF_LOOPBACK) { 1108 netdev_err(dev, "Device %s is loopback device. Loopback devices can't be added as a team port\n", 1109 portname); 1110 return -EINVAL; 1111 } 1112 1113 if (team_port_exists(port_dev)) { 1114 netdev_err(dev, "Device %s is already a port " 1115 "of a team device\n", portname); 1116 return -EBUSY; 1117 } 1118 1119 if (port_dev->features & NETIF_F_VLAN_CHALLENGED && 1120 vlan_uses_dev(dev)) { 1121 netdev_err(dev, "Device %s is VLAN challenged and team device has VLAN set up\n", 1122 portname); 1123 return -EPERM; 1124 } 1125 1126 err = team_dev_type_check_change(dev, port_dev); 1127 if (err) 1128 return err; 1129 1130 if (port_dev->flags & IFF_UP) { 1131 netdev_err(dev, "Device %s is up. Set it down before adding it as a team port\n", 1132 portname); 1133 return -EBUSY; 1134 } 1135 1136 port = kzalloc(sizeof(struct team_port) + team->mode->port_priv_size, 1137 GFP_KERNEL); 1138 if (!port) 1139 return -ENOMEM; 1140 1141 port->dev = port_dev; 1142 port->team = team; 1143 INIT_LIST_HEAD(&port->qom_list); 1144 1145 port->orig.mtu = port_dev->mtu; 1146 err = dev_set_mtu(port_dev, dev->mtu); 1147 if (err) { 1148 netdev_dbg(dev, "Error %d calling dev_set_mtu\n", err); 1149 goto err_set_mtu; 1150 } 1151 1152 memcpy(port->orig.dev_addr, port_dev->dev_addr, port_dev->addr_len); 1153 1154 err = team_port_enter(team, port); 1155 if (err) { 1156 netdev_err(dev, "Device %s failed to enter team mode\n", 1157 portname); 1158 goto err_port_enter; 1159 } 1160 1161 err = dev_open(port_dev); 1162 if (err) { 1163 netdev_dbg(dev, "Device %s opening failed\n", 1164 portname); 1165 goto err_dev_open; 1166 } 1167 1168 err = vlan_vids_add_by_dev(port_dev, dev); 1169 if (err) { 1170 netdev_err(dev, "Failed to add vlan ids to device %s\n", 1171 portname); 1172 goto err_vids_add; 1173 } 1174 1175 err = team_port_enable_netpoll(team, port); 1176 if (err) { 1177 netdev_err(dev, "Failed to enable netpoll on device %s\n", 1178 portname); 1179 goto err_enable_netpoll; 1180 } 1181 1182 if (!(dev->features & NETIF_F_LRO)) 1183 dev_disable_lro(port_dev); 1184 1185 err = netdev_rx_handler_register(port_dev, team_handle_frame, 1186 port); 1187 if (err) { 1188 netdev_err(dev, "Device %s failed to register rx_handler\n", 1189 portname); 1190 goto err_handler_register; 1191 } 1192 1193 err = team_upper_dev_link(dev, port_dev); 1194 if (err) { 1195 netdev_err(dev, "Device %s failed to set upper link\n", 1196 portname); 1197 goto err_set_upper_link; 1198 } 1199 1200 err = __team_option_inst_add_port(team, port); 1201 if (err) { 1202 netdev_err(dev, "Device %s failed to add per-port options\n", 1203 portname); 1204 goto err_option_port_add; 1205 } 1206 1207 port->index = -1; 1208 list_add_tail_rcu(&port->list, &team->port_list); 1209 team_port_enable(team, port); 1210 __team_compute_features(team); 1211 __team_port_change_port_added(port, !!netif_carrier_ok(port_dev)); 1212 __team_options_change_check(team); 1213 1214 netdev_info(dev, "Port device %s added\n", portname); 1215 1216 return 0; 1217 1218 err_option_port_add: 1219 team_upper_dev_unlink(dev, port_dev); 1220 1221 err_set_upper_link: 1222 netdev_rx_handler_unregister(port_dev); 1223 1224 err_handler_register: 1225 team_port_disable_netpoll(port); 1226 1227 err_enable_netpoll: 1228 vlan_vids_del_by_dev(port_dev, dev); 1229 1230 err_vids_add: 1231 dev_close(port_dev); 1232 1233 err_dev_open: 1234 team_port_leave(team, port); 1235 team_port_set_orig_dev_addr(port); 1236 1237 err_port_enter: 1238 dev_set_mtu(port_dev, port->orig.mtu); 1239 1240 err_set_mtu: 1241 kfree(port); 1242 1243 return err; 1244 } 1245 1246 static void __team_port_change_port_removed(struct team_port *port); 1247 1248 static int team_port_del(struct team *team, struct net_device *port_dev) 1249 { 1250 struct net_device *dev = team->dev; 1251 struct team_port *port; 1252 char *portname = port_dev->name; 1253 1254 port = team_port_get_rtnl(port_dev); 1255 if (!port || !team_port_find(team, port)) { 1256 netdev_err(dev, "Device %s does not act as a port of this team\n", 1257 portname); 1258 return -ENOENT; 1259 } 1260 1261 team_port_disable(team, port); 1262 list_del_rcu(&port->list); 1263 team_upper_dev_unlink(dev, port_dev); 1264 netdev_rx_handler_unregister(port_dev); 1265 team_port_disable_netpoll(port); 1266 vlan_vids_del_by_dev(port_dev, dev); 1267 dev_uc_unsync(port_dev, dev); 1268 dev_mc_unsync(port_dev, dev); 1269 dev_close(port_dev); 1270 team_port_leave(team, port); 1271 1272 __team_option_inst_mark_removed_port(team, port); 1273 __team_options_change_check(team); 1274 __team_option_inst_del_port(team, port); 1275 __team_port_change_port_removed(port); 1276 1277 team_port_set_orig_dev_addr(port); 1278 dev_set_mtu(port_dev, port->orig.mtu); 1279 kfree_rcu(port, rcu); 1280 netdev_info(dev, "Port device %s removed\n", portname); 1281 __team_compute_features(team); 1282 1283 return 0; 1284 } 1285 1286 1287 /***************** 1288 * Net device ops 1289 *****************/ 1290 1291 static int team_mode_option_get(struct team *team, struct team_gsetter_ctx *ctx) 1292 { 1293 ctx->data.str_val = team->mode->kind; 1294 return 0; 1295 } 1296 1297 static int team_mode_option_set(struct team *team, struct team_gsetter_ctx *ctx) 1298 { 1299 return team_change_mode(team, ctx->data.str_val); 1300 } 1301 1302 static int team_notify_peers_count_get(struct team *team, 1303 struct team_gsetter_ctx *ctx) 1304 { 1305 ctx->data.u32_val = team->notify_peers.count; 1306 return 0; 1307 } 1308 1309 static int team_notify_peers_count_set(struct team *team, 1310 struct team_gsetter_ctx *ctx) 1311 { 1312 team->notify_peers.count = ctx->data.u32_val; 1313 return 0; 1314 } 1315 1316 static int team_notify_peers_interval_get(struct team *team, 1317 struct team_gsetter_ctx *ctx) 1318 { 1319 ctx->data.u32_val = team->notify_peers.interval; 1320 return 0; 1321 } 1322 1323 static int team_notify_peers_interval_set(struct team *team, 1324 struct team_gsetter_ctx *ctx) 1325 { 1326 team->notify_peers.interval = ctx->data.u32_val; 1327 return 0; 1328 } 1329 1330 static int team_mcast_rejoin_count_get(struct team *team, 1331 struct team_gsetter_ctx *ctx) 1332 { 1333 ctx->data.u32_val = team->mcast_rejoin.count; 1334 return 0; 1335 } 1336 1337 static int team_mcast_rejoin_count_set(struct team *team, 1338 struct team_gsetter_ctx *ctx) 1339 { 1340 team->mcast_rejoin.count = ctx->data.u32_val; 1341 return 0; 1342 } 1343 1344 static int team_mcast_rejoin_interval_get(struct team *team, 1345 struct team_gsetter_ctx *ctx) 1346 { 1347 ctx->data.u32_val = team->mcast_rejoin.interval; 1348 return 0; 1349 } 1350 1351 static int team_mcast_rejoin_interval_set(struct team *team, 1352 struct team_gsetter_ctx *ctx) 1353 { 1354 team->mcast_rejoin.interval = ctx->data.u32_val; 1355 return 0; 1356 } 1357 1358 static int team_port_en_option_get(struct team *team, 1359 struct team_gsetter_ctx *ctx) 1360 { 1361 struct team_port *port = ctx->info->port; 1362 1363 ctx->data.bool_val = team_port_enabled(port); 1364 return 0; 1365 } 1366 1367 static int team_port_en_option_set(struct team *team, 1368 struct team_gsetter_ctx *ctx) 1369 { 1370 struct team_port *port = ctx->info->port; 1371 1372 if (ctx->data.bool_val) 1373 team_port_enable(team, port); 1374 else 1375 team_port_disable(team, port); 1376 return 0; 1377 } 1378 1379 static int team_user_linkup_option_get(struct team *team, 1380 struct team_gsetter_ctx *ctx) 1381 { 1382 struct team_port *port = ctx->info->port; 1383 1384 ctx->data.bool_val = port->user.linkup; 1385 return 0; 1386 } 1387 1388 static void __team_carrier_check(struct team *team); 1389 1390 static int team_user_linkup_option_set(struct team *team, 1391 struct team_gsetter_ctx *ctx) 1392 { 1393 struct team_port *port = ctx->info->port; 1394 1395 port->user.linkup = ctx->data.bool_val; 1396 team_refresh_port_linkup(port); 1397 __team_carrier_check(port->team); 1398 return 0; 1399 } 1400 1401 static int team_user_linkup_en_option_get(struct team *team, 1402 struct team_gsetter_ctx *ctx) 1403 { 1404 struct team_port *port = ctx->info->port; 1405 1406 ctx->data.bool_val = port->user.linkup_enabled; 1407 return 0; 1408 } 1409 1410 static int team_user_linkup_en_option_set(struct team *team, 1411 struct team_gsetter_ctx *ctx) 1412 { 1413 struct team_port *port = ctx->info->port; 1414 1415 port->user.linkup_enabled = ctx->data.bool_val; 1416 team_refresh_port_linkup(port); 1417 __team_carrier_check(port->team); 1418 return 0; 1419 } 1420 1421 static int team_priority_option_get(struct team *team, 1422 struct team_gsetter_ctx *ctx) 1423 { 1424 struct team_port *port = ctx->info->port; 1425 1426 ctx->data.s32_val = port->priority; 1427 return 0; 1428 } 1429 1430 static int team_priority_option_set(struct team *team, 1431 struct team_gsetter_ctx *ctx) 1432 { 1433 struct team_port *port = ctx->info->port; 1434 s32 priority = ctx->data.s32_val; 1435 1436 if (port->priority == priority) 1437 return 0; 1438 port->priority = priority; 1439 team_queue_override_port_prio_changed(team, port); 1440 return 0; 1441 } 1442 1443 static int team_queue_id_option_get(struct team *team, 1444 struct team_gsetter_ctx *ctx) 1445 { 1446 struct team_port *port = ctx->info->port; 1447 1448 ctx->data.u32_val = port->queue_id; 1449 return 0; 1450 } 1451 1452 static int team_queue_id_option_set(struct team *team, 1453 struct team_gsetter_ctx *ctx) 1454 { 1455 struct team_port *port = ctx->info->port; 1456 u16 new_queue_id = ctx->data.u32_val; 1457 1458 if (port->queue_id == new_queue_id) 1459 return 0; 1460 if (new_queue_id >= team->dev->real_num_tx_queues) 1461 return -EINVAL; 1462 team_queue_override_port_change_queue_id(team, port, new_queue_id); 1463 return 0; 1464 } 1465 1466 static const struct team_option team_options[] = { 1467 { 1468 .name = "mode", 1469 .type = TEAM_OPTION_TYPE_STRING, 1470 .getter = team_mode_option_get, 1471 .setter = team_mode_option_set, 1472 }, 1473 { 1474 .name = "notify_peers_count", 1475 .type = TEAM_OPTION_TYPE_U32, 1476 .getter = team_notify_peers_count_get, 1477 .setter = team_notify_peers_count_set, 1478 }, 1479 { 1480 .name = "notify_peers_interval", 1481 .type = TEAM_OPTION_TYPE_U32, 1482 .getter = team_notify_peers_interval_get, 1483 .setter = team_notify_peers_interval_set, 1484 }, 1485 { 1486 .name = "mcast_rejoin_count", 1487 .type = TEAM_OPTION_TYPE_U32, 1488 .getter = team_mcast_rejoin_count_get, 1489 .setter = team_mcast_rejoin_count_set, 1490 }, 1491 { 1492 .name = "mcast_rejoin_interval", 1493 .type = TEAM_OPTION_TYPE_U32, 1494 .getter = team_mcast_rejoin_interval_get, 1495 .setter = team_mcast_rejoin_interval_set, 1496 }, 1497 { 1498 .name = "enabled", 1499 .type = TEAM_OPTION_TYPE_BOOL, 1500 .per_port = true, 1501 .getter = team_port_en_option_get, 1502 .setter = team_port_en_option_set, 1503 }, 1504 { 1505 .name = "user_linkup", 1506 .type = TEAM_OPTION_TYPE_BOOL, 1507 .per_port = true, 1508 .getter = team_user_linkup_option_get, 1509 .setter = team_user_linkup_option_set, 1510 }, 1511 { 1512 .name = "user_linkup_enabled", 1513 .type = TEAM_OPTION_TYPE_BOOL, 1514 .per_port = true, 1515 .getter = team_user_linkup_en_option_get, 1516 .setter = team_user_linkup_en_option_set, 1517 }, 1518 { 1519 .name = "priority", 1520 .type = TEAM_OPTION_TYPE_S32, 1521 .per_port = true, 1522 .getter = team_priority_option_get, 1523 .setter = team_priority_option_set, 1524 }, 1525 { 1526 .name = "queue_id", 1527 .type = TEAM_OPTION_TYPE_U32, 1528 .per_port = true, 1529 .getter = team_queue_id_option_get, 1530 .setter = team_queue_id_option_set, 1531 }, 1532 }; 1533 1534 static struct lock_class_key team_netdev_xmit_lock_key; 1535 static struct lock_class_key team_netdev_addr_lock_key; 1536 static struct lock_class_key team_tx_busylock_key; 1537 1538 static void team_set_lockdep_class_one(struct net_device *dev, 1539 struct netdev_queue *txq, 1540 void *unused) 1541 { 1542 lockdep_set_class(&txq->_xmit_lock, &team_netdev_xmit_lock_key); 1543 } 1544 1545 static void team_set_lockdep_class(struct net_device *dev) 1546 { 1547 lockdep_set_class(&dev->addr_list_lock, &team_netdev_addr_lock_key); 1548 netdev_for_each_tx_queue(dev, team_set_lockdep_class_one, NULL); 1549 dev->qdisc_tx_busylock = &team_tx_busylock_key; 1550 } 1551 1552 static int team_init(struct net_device *dev) 1553 { 1554 struct team *team = netdev_priv(dev); 1555 int i; 1556 int err; 1557 1558 team->dev = dev; 1559 mutex_init(&team->lock); 1560 team_set_no_mode(team); 1561 1562 team->pcpu_stats = netdev_alloc_pcpu_stats(struct team_pcpu_stats); 1563 if (!team->pcpu_stats) 1564 return -ENOMEM; 1565 1566 for (i = 0; i < TEAM_PORT_HASHENTRIES; i++) 1567 INIT_HLIST_HEAD(&team->en_port_hlist[i]); 1568 INIT_LIST_HEAD(&team->port_list); 1569 err = team_queue_override_init(team); 1570 if (err) 1571 goto err_team_queue_override_init; 1572 1573 team_adjust_ops(team); 1574 1575 INIT_LIST_HEAD(&team->option_list); 1576 INIT_LIST_HEAD(&team->option_inst_list); 1577 1578 team_notify_peers_init(team); 1579 team_mcast_rejoin_init(team); 1580 1581 err = team_options_register(team, team_options, ARRAY_SIZE(team_options)); 1582 if (err) 1583 goto err_options_register; 1584 netif_carrier_off(dev); 1585 1586 team_set_lockdep_class(dev); 1587 1588 return 0; 1589 1590 err_options_register: 1591 team_mcast_rejoin_fini(team); 1592 team_notify_peers_fini(team); 1593 team_queue_override_fini(team); 1594 err_team_queue_override_init: 1595 free_percpu(team->pcpu_stats); 1596 1597 return err; 1598 } 1599 1600 static void team_uninit(struct net_device *dev) 1601 { 1602 struct team *team = netdev_priv(dev); 1603 struct team_port *port; 1604 struct team_port *tmp; 1605 1606 mutex_lock(&team->lock); 1607 list_for_each_entry_safe(port, tmp, &team->port_list, list) 1608 team_port_del(team, port->dev); 1609 1610 __team_change_mode(team, NULL); /* cleanup */ 1611 __team_options_unregister(team, team_options, ARRAY_SIZE(team_options)); 1612 team_mcast_rejoin_fini(team); 1613 team_notify_peers_fini(team); 1614 team_queue_override_fini(team); 1615 mutex_unlock(&team->lock); 1616 } 1617 1618 static void team_destructor(struct net_device *dev) 1619 { 1620 struct team *team = netdev_priv(dev); 1621 1622 free_percpu(team->pcpu_stats); 1623 free_netdev(dev); 1624 } 1625 1626 static int team_open(struct net_device *dev) 1627 { 1628 return 0; 1629 } 1630 1631 static int team_close(struct net_device *dev) 1632 { 1633 return 0; 1634 } 1635 1636 /* 1637 * note: already called with rcu_read_lock 1638 */ 1639 static netdev_tx_t team_xmit(struct sk_buff *skb, struct net_device *dev) 1640 { 1641 struct team *team = netdev_priv(dev); 1642 bool tx_success; 1643 unsigned int len = skb->len; 1644 1645 tx_success = team_queue_override_transmit(team, skb); 1646 if (!tx_success) 1647 tx_success = team->ops.transmit(team, skb); 1648 if (tx_success) { 1649 struct team_pcpu_stats *pcpu_stats; 1650 1651 pcpu_stats = this_cpu_ptr(team->pcpu_stats); 1652 u64_stats_update_begin(&pcpu_stats->syncp); 1653 pcpu_stats->tx_packets++; 1654 pcpu_stats->tx_bytes += len; 1655 u64_stats_update_end(&pcpu_stats->syncp); 1656 } else { 1657 this_cpu_inc(team->pcpu_stats->tx_dropped); 1658 } 1659 1660 return NETDEV_TX_OK; 1661 } 1662 1663 static u16 team_select_queue(struct net_device *dev, struct sk_buff *skb, 1664 void *accel_priv, select_queue_fallback_t fallback) 1665 { 1666 /* 1667 * This helper function exists to help dev_pick_tx get the correct 1668 * destination queue. Using a helper function skips a call to 1669 * skb_tx_hash and will put the skbs in the queue we expect on their 1670 * way down to the team driver. 1671 */ 1672 u16 txq = skb_rx_queue_recorded(skb) ? skb_get_rx_queue(skb) : 0; 1673 1674 /* 1675 * Save the original txq to restore before passing to the driver 1676 */ 1677 qdisc_skb_cb(skb)->slave_dev_queue_mapping = skb->queue_mapping; 1678 1679 if (unlikely(txq >= dev->real_num_tx_queues)) { 1680 do { 1681 txq -= dev->real_num_tx_queues; 1682 } while (txq >= dev->real_num_tx_queues); 1683 } 1684 return txq; 1685 } 1686 1687 static void team_change_rx_flags(struct net_device *dev, int change) 1688 { 1689 struct team *team = netdev_priv(dev); 1690 struct team_port *port; 1691 int inc; 1692 1693 rcu_read_lock(); 1694 list_for_each_entry_rcu(port, &team->port_list, list) { 1695 if (change & IFF_PROMISC) { 1696 inc = dev->flags & IFF_PROMISC ? 1 : -1; 1697 dev_set_promiscuity(port->dev, inc); 1698 } 1699 if (change & IFF_ALLMULTI) { 1700 inc = dev->flags & IFF_ALLMULTI ? 1 : -1; 1701 dev_set_allmulti(port->dev, inc); 1702 } 1703 } 1704 rcu_read_unlock(); 1705 } 1706 1707 static void team_set_rx_mode(struct net_device *dev) 1708 { 1709 struct team *team = netdev_priv(dev); 1710 struct team_port *port; 1711 1712 rcu_read_lock(); 1713 list_for_each_entry_rcu(port, &team->port_list, list) { 1714 dev_uc_sync_multiple(port->dev, dev); 1715 dev_mc_sync_multiple(port->dev, dev); 1716 } 1717 rcu_read_unlock(); 1718 } 1719 1720 static int team_set_mac_address(struct net_device *dev, void *p) 1721 { 1722 struct sockaddr *addr = p; 1723 struct team *team = netdev_priv(dev); 1724 struct team_port *port; 1725 1726 if (dev->type == ARPHRD_ETHER && !is_valid_ether_addr(addr->sa_data)) 1727 return -EADDRNOTAVAIL; 1728 memcpy(dev->dev_addr, addr->sa_data, dev->addr_len); 1729 rcu_read_lock(); 1730 list_for_each_entry_rcu(port, &team->port_list, list) 1731 if (team->ops.port_change_dev_addr) 1732 team->ops.port_change_dev_addr(team, port); 1733 rcu_read_unlock(); 1734 return 0; 1735 } 1736 1737 static int team_change_mtu(struct net_device *dev, int new_mtu) 1738 { 1739 struct team *team = netdev_priv(dev); 1740 struct team_port *port; 1741 int err; 1742 1743 /* 1744 * Alhough this is reader, it's guarded by team lock. It's not possible 1745 * to traverse list in reverse under rcu_read_lock 1746 */ 1747 mutex_lock(&team->lock); 1748 team->port_mtu_change_allowed = true; 1749 list_for_each_entry(port, &team->port_list, list) { 1750 err = dev_set_mtu(port->dev, new_mtu); 1751 if (err) { 1752 netdev_err(dev, "Device %s failed to change mtu", 1753 port->dev->name); 1754 goto unwind; 1755 } 1756 } 1757 team->port_mtu_change_allowed = false; 1758 mutex_unlock(&team->lock); 1759 1760 dev->mtu = new_mtu; 1761 1762 return 0; 1763 1764 unwind: 1765 list_for_each_entry_continue_reverse(port, &team->port_list, list) 1766 dev_set_mtu(port->dev, dev->mtu); 1767 team->port_mtu_change_allowed = false; 1768 mutex_unlock(&team->lock); 1769 1770 return err; 1771 } 1772 1773 static struct rtnl_link_stats64 * 1774 team_get_stats64(struct net_device *dev, struct rtnl_link_stats64 *stats) 1775 { 1776 struct team *team = netdev_priv(dev); 1777 struct team_pcpu_stats *p; 1778 u64 rx_packets, rx_bytes, rx_multicast, tx_packets, tx_bytes; 1779 u32 rx_dropped = 0, tx_dropped = 0; 1780 unsigned int start; 1781 int i; 1782 1783 for_each_possible_cpu(i) { 1784 p = per_cpu_ptr(team->pcpu_stats, i); 1785 do { 1786 start = u64_stats_fetch_begin_irq(&p->syncp); 1787 rx_packets = p->rx_packets; 1788 rx_bytes = p->rx_bytes; 1789 rx_multicast = p->rx_multicast; 1790 tx_packets = p->tx_packets; 1791 tx_bytes = p->tx_bytes; 1792 } while (u64_stats_fetch_retry_irq(&p->syncp, start)); 1793 1794 stats->rx_packets += rx_packets; 1795 stats->rx_bytes += rx_bytes; 1796 stats->multicast += rx_multicast; 1797 stats->tx_packets += tx_packets; 1798 stats->tx_bytes += tx_bytes; 1799 /* 1800 * rx_dropped & tx_dropped are u32, updated 1801 * without syncp protection. 1802 */ 1803 rx_dropped += p->rx_dropped; 1804 tx_dropped += p->tx_dropped; 1805 } 1806 stats->rx_dropped = rx_dropped; 1807 stats->tx_dropped = tx_dropped; 1808 return stats; 1809 } 1810 1811 static int team_vlan_rx_add_vid(struct net_device *dev, __be16 proto, u16 vid) 1812 { 1813 struct team *team = netdev_priv(dev); 1814 struct team_port *port; 1815 int err; 1816 1817 /* 1818 * Alhough this is reader, it's guarded by team lock. It's not possible 1819 * to traverse list in reverse under rcu_read_lock 1820 */ 1821 mutex_lock(&team->lock); 1822 list_for_each_entry(port, &team->port_list, list) { 1823 err = vlan_vid_add(port->dev, proto, vid); 1824 if (err) 1825 goto unwind; 1826 } 1827 mutex_unlock(&team->lock); 1828 1829 return 0; 1830 1831 unwind: 1832 list_for_each_entry_continue_reverse(port, &team->port_list, list) 1833 vlan_vid_del(port->dev, proto, vid); 1834 mutex_unlock(&team->lock); 1835 1836 return err; 1837 } 1838 1839 static int team_vlan_rx_kill_vid(struct net_device *dev, __be16 proto, u16 vid) 1840 { 1841 struct team *team = netdev_priv(dev); 1842 struct team_port *port; 1843 1844 rcu_read_lock(); 1845 list_for_each_entry_rcu(port, &team->port_list, list) 1846 vlan_vid_del(port->dev, proto, vid); 1847 rcu_read_unlock(); 1848 1849 return 0; 1850 } 1851 1852 #ifdef CONFIG_NET_POLL_CONTROLLER 1853 static void team_poll_controller(struct net_device *dev) 1854 { 1855 } 1856 1857 static void __team_netpoll_cleanup(struct team *team) 1858 { 1859 struct team_port *port; 1860 1861 list_for_each_entry(port, &team->port_list, list) 1862 team_port_disable_netpoll(port); 1863 } 1864 1865 static void team_netpoll_cleanup(struct net_device *dev) 1866 { 1867 struct team *team = netdev_priv(dev); 1868 1869 mutex_lock(&team->lock); 1870 __team_netpoll_cleanup(team); 1871 mutex_unlock(&team->lock); 1872 } 1873 1874 static int team_netpoll_setup(struct net_device *dev, 1875 struct netpoll_info *npifo) 1876 { 1877 struct team *team = netdev_priv(dev); 1878 struct team_port *port; 1879 int err = 0; 1880 1881 mutex_lock(&team->lock); 1882 list_for_each_entry(port, &team->port_list, list) { 1883 err = team_port_enable_netpoll(team, port); 1884 if (err) { 1885 __team_netpoll_cleanup(team); 1886 break; 1887 } 1888 } 1889 mutex_unlock(&team->lock); 1890 return err; 1891 } 1892 #endif 1893 1894 static int team_add_slave(struct net_device *dev, struct net_device *port_dev) 1895 { 1896 struct team *team = netdev_priv(dev); 1897 int err; 1898 1899 mutex_lock(&team->lock); 1900 err = team_port_add(team, port_dev); 1901 mutex_unlock(&team->lock); 1902 return err; 1903 } 1904 1905 static int team_del_slave(struct net_device *dev, struct net_device *port_dev) 1906 { 1907 struct team *team = netdev_priv(dev); 1908 int err; 1909 1910 mutex_lock(&team->lock); 1911 err = team_port_del(team, port_dev); 1912 mutex_unlock(&team->lock); 1913 return err; 1914 } 1915 1916 static netdev_features_t team_fix_features(struct net_device *dev, 1917 netdev_features_t features) 1918 { 1919 struct team_port *port; 1920 struct team *team = netdev_priv(dev); 1921 netdev_features_t mask; 1922 1923 mask = features; 1924 features &= ~NETIF_F_ONE_FOR_ALL; 1925 features |= NETIF_F_ALL_FOR_ALL; 1926 1927 rcu_read_lock(); 1928 list_for_each_entry_rcu(port, &team->port_list, list) { 1929 features = netdev_increment_features(features, 1930 port->dev->features, 1931 mask); 1932 } 1933 rcu_read_unlock(); 1934 return features; 1935 } 1936 1937 static int team_change_carrier(struct net_device *dev, bool new_carrier) 1938 { 1939 struct team *team = netdev_priv(dev); 1940 1941 team->user_carrier_enabled = true; 1942 1943 if (new_carrier) 1944 netif_carrier_on(dev); 1945 else 1946 netif_carrier_off(dev); 1947 return 0; 1948 } 1949 1950 static const struct net_device_ops team_netdev_ops = { 1951 .ndo_init = team_init, 1952 .ndo_uninit = team_uninit, 1953 .ndo_open = team_open, 1954 .ndo_stop = team_close, 1955 .ndo_start_xmit = team_xmit, 1956 .ndo_select_queue = team_select_queue, 1957 .ndo_change_rx_flags = team_change_rx_flags, 1958 .ndo_set_rx_mode = team_set_rx_mode, 1959 .ndo_set_mac_address = team_set_mac_address, 1960 .ndo_change_mtu = team_change_mtu, 1961 .ndo_get_stats64 = team_get_stats64, 1962 .ndo_vlan_rx_add_vid = team_vlan_rx_add_vid, 1963 .ndo_vlan_rx_kill_vid = team_vlan_rx_kill_vid, 1964 #ifdef CONFIG_NET_POLL_CONTROLLER 1965 .ndo_poll_controller = team_poll_controller, 1966 .ndo_netpoll_setup = team_netpoll_setup, 1967 .ndo_netpoll_cleanup = team_netpoll_cleanup, 1968 #endif 1969 .ndo_add_slave = team_add_slave, 1970 .ndo_del_slave = team_del_slave, 1971 .ndo_fix_features = team_fix_features, 1972 .ndo_change_carrier = team_change_carrier, 1973 }; 1974 1975 /*********************** 1976 * ethtool interface 1977 ***********************/ 1978 1979 static void team_ethtool_get_drvinfo(struct net_device *dev, 1980 struct ethtool_drvinfo *drvinfo) 1981 { 1982 strlcpy(drvinfo->driver, DRV_NAME, sizeof(drvinfo->driver)); 1983 strlcpy(drvinfo->version, UTS_RELEASE, sizeof(drvinfo->version)); 1984 } 1985 1986 static const struct ethtool_ops team_ethtool_ops = { 1987 .get_drvinfo = team_ethtool_get_drvinfo, 1988 .get_link = ethtool_op_get_link, 1989 }; 1990 1991 /*********************** 1992 * rt netlink interface 1993 ***********************/ 1994 1995 static void team_setup_by_port(struct net_device *dev, 1996 struct net_device *port_dev) 1997 { 1998 dev->header_ops = port_dev->header_ops; 1999 dev->type = port_dev->type; 2000 dev->hard_header_len = port_dev->hard_header_len; 2001 dev->addr_len = port_dev->addr_len; 2002 dev->mtu = port_dev->mtu; 2003 memcpy(dev->broadcast, port_dev->broadcast, port_dev->addr_len); 2004 eth_hw_addr_inherit(dev, port_dev); 2005 } 2006 2007 static int team_dev_type_check_change(struct net_device *dev, 2008 struct net_device *port_dev) 2009 { 2010 struct team *team = netdev_priv(dev); 2011 char *portname = port_dev->name; 2012 int err; 2013 2014 if (dev->type == port_dev->type) 2015 return 0; 2016 if (!list_empty(&team->port_list)) { 2017 netdev_err(dev, "Device %s is of different type\n", portname); 2018 return -EBUSY; 2019 } 2020 err = call_netdevice_notifiers(NETDEV_PRE_TYPE_CHANGE, dev); 2021 err = notifier_to_errno(err); 2022 if (err) { 2023 netdev_err(dev, "Refused to change device type\n"); 2024 return err; 2025 } 2026 dev_uc_flush(dev); 2027 dev_mc_flush(dev); 2028 team_setup_by_port(dev, port_dev); 2029 call_netdevice_notifiers(NETDEV_POST_TYPE_CHANGE, dev); 2030 return 0; 2031 } 2032 2033 static void team_setup(struct net_device *dev) 2034 { 2035 ether_setup(dev); 2036 2037 dev->netdev_ops = &team_netdev_ops; 2038 dev->ethtool_ops = &team_ethtool_ops; 2039 dev->destructor = team_destructor; 2040 dev->tx_queue_len = 0; 2041 dev->flags |= IFF_MULTICAST; 2042 dev->priv_flags &= ~(IFF_XMIT_DST_RELEASE | IFF_TX_SKB_SHARING); 2043 2044 /* 2045 * Indicate we support unicast address filtering. That way core won't 2046 * bring us to promisc mode in case a unicast addr is added. 2047 * Let this up to underlay drivers. 2048 */ 2049 dev->priv_flags |= IFF_UNICAST_FLT | IFF_LIVE_ADDR_CHANGE; 2050 2051 dev->features |= NETIF_F_LLTX; 2052 dev->features |= NETIF_F_GRO; 2053 2054 /* Don't allow team devices to change network namespaces. */ 2055 dev->features |= NETIF_F_NETNS_LOCAL; 2056 2057 dev->hw_features = TEAM_VLAN_FEATURES | 2058 NETIF_F_HW_VLAN_CTAG_TX | 2059 NETIF_F_HW_VLAN_CTAG_RX | 2060 NETIF_F_HW_VLAN_CTAG_FILTER; 2061 2062 dev->hw_features &= ~(NETIF_F_ALL_CSUM & ~NETIF_F_HW_CSUM); 2063 dev->features |= dev->hw_features; 2064 } 2065 2066 static int team_newlink(struct net *src_net, struct net_device *dev, 2067 struct nlattr *tb[], struct nlattr *data[]) 2068 { 2069 if (tb[IFLA_ADDRESS] == NULL) 2070 eth_hw_addr_random(dev); 2071 2072 return register_netdevice(dev); 2073 } 2074 2075 static int team_validate(struct nlattr *tb[], struct nlattr *data[]) 2076 { 2077 if (tb[IFLA_ADDRESS]) { 2078 if (nla_len(tb[IFLA_ADDRESS]) != ETH_ALEN) 2079 return -EINVAL; 2080 if (!is_valid_ether_addr(nla_data(tb[IFLA_ADDRESS]))) 2081 return -EADDRNOTAVAIL; 2082 } 2083 return 0; 2084 } 2085 2086 static unsigned int team_get_num_tx_queues(void) 2087 { 2088 return TEAM_DEFAULT_NUM_TX_QUEUES; 2089 } 2090 2091 static unsigned int team_get_num_rx_queues(void) 2092 { 2093 return TEAM_DEFAULT_NUM_RX_QUEUES; 2094 } 2095 2096 static struct rtnl_link_ops team_link_ops __read_mostly = { 2097 .kind = DRV_NAME, 2098 .priv_size = sizeof(struct team), 2099 .setup = team_setup, 2100 .newlink = team_newlink, 2101 .validate = team_validate, 2102 .get_num_tx_queues = team_get_num_tx_queues, 2103 .get_num_rx_queues = team_get_num_rx_queues, 2104 }; 2105 2106 2107 /*********************************** 2108 * Generic netlink custom interface 2109 ***********************************/ 2110 2111 static struct genl_family team_nl_family = { 2112 .id = GENL_ID_GENERATE, 2113 .name = TEAM_GENL_NAME, 2114 .version = TEAM_GENL_VERSION, 2115 .maxattr = TEAM_ATTR_MAX, 2116 .netnsok = true, 2117 }; 2118 2119 static const struct nla_policy team_nl_policy[TEAM_ATTR_MAX + 1] = { 2120 [TEAM_ATTR_UNSPEC] = { .type = NLA_UNSPEC, }, 2121 [TEAM_ATTR_TEAM_IFINDEX] = { .type = NLA_U32 }, 2122 [TEAM_ATTR_LIST_OPTION] = { .type = NLA_NESTED }, 2123 [TEAM_ATTR_LIST_PORT] = { .type = NLA_NESTED }, 2124 }; 2125 2126 static const struct nla_policy 2127 team_nl_option_policy[TEAM_ATTR_OPTION_MAX + 1] = { 2128 [TEAM_ATTR_OPTION_UNSPEC] = { .type = NLA_UNSPEC, }, 2129 [TEAM_ATTR_OPTION_NAME] = { 2130 .type = NLA_STRING, 2131 .len = TEAM_STRING_MAX_LEN, 2132 }, 2133 [TEAM_ATTR_OPTION_CHANGED] = { .type = NLA_FLAG }, 2134 [TEAM_ATTR_OPTION_TYPE] = { .type = NLA_U8 }, 2135 [TEAM_ATTR_OPTION_DATA] = { .type = NLA_BINARY }, 2136 }; 2137 2138 static int team_nl_cmd_noop(struct sk_buff *skb, struct genl_info *info) 2139 { 2140 struct sk_buff *msg; 2141 void *hdr; 2142 int err; 2143 2144 msg = nlmsg_new(NLMSG_DEFAULT_SIZE, GFP_KERNEL); 2145 if (!msg) 2146 return -ENOMEM; 2147 2148 hdr = genlmsg_put(msg, info->snd_portid, info->snd_seq, 2149 &team_nl_family, 0, TEAM_CMD_NOOP); 2150 if (!hdr) { 2151 err = -EMSGSIZE; 2152 goto err_msg_put; 2153 } 2154 2155 genlmsg_end(msg, hdr); 2156 2157 return genlmsg_unicast(genl_info_net(info), msg, info->snd_portid); 2158 2159 err_msg_put: 2160 nlmsg_free(msg); 2161 2162 return err; 2163 } 2164 2165 /* 2166 * Netlink cmd functions should be locked by following two functions. 2167 * Since dev gets held here, that ensures dev won't disappear in between. 2168 */ 2169 static struct team *team_nl_team_get(struct genl_info *info) 2170 { 2171 struct net *net = genl_info_net(info); 2172 int ifindex; 2173 struct net_device *dev; 2174 struct team *team; 2175 2176 if (!info->attrs[TEAM_ATTR_TEAM_IFINDEX]) 2177 return NULL; 2178 2179 ifindex = nla_get_u32(info->attrs[TEAM_ATTR_TEAM_IFINDEX]); 2180 dev = dev_get_by_index(net, ifindex); 2181 if (!dev || dev->netdev_ops != &team_netdev_ops) { 2182 if (dev) 2183 dev_put(dev); 2184 return NULL; 2185 } 2186 2187 team = netdev_priv(dev); 2188 mutex_lock(&team->lock); 2189 return team; 2190 } 2191 2192 static void team_nl_team_put(struct team *team) 2193 { 2194 mutex_unlock(&team->lock); 2195 dev_put(team->dev); 2196 } 2197 2198 typedef int team_nl_send_func_t(struct sk_buff *skb, 2199 struct team *team, u32 portid); 2200 2201 static int team_nl_send_unicast(struct sk_buff *skb, struct team *team, u32 portid) 2202 { 2203 return genlmsg_unicast(dev_net(team->dev), skb, portid); 2204 } 2205 2206 static int team_nl_fill_one_option_get(struct sk_buff *skb, struct team *team, 2207 struct team_option_inst *opt_inst) 2208 { 2209 struct nlattr *option_item; 2210 struct team_option *option = opt_inst->option; 2211 struct team_option_inst_info *opt_inst_info = &opt_inst->info; 2212 struct team_gsetter_ctx ctx; 2213 int err; 2214 2215 ctx.info = opt_inst_info; 2216 err = team_option_get(team, opt_inst, &ctx); 2217 if (err) 2218 return err; 2219 2220 option_item = nla_nest_start(skb, TEAM_ATTR_ITEM_OPTION); 2221 if (!option_item) 2222 return -EMSGSIZE; 2223 2224 if (nla_put_string(skb, TEAM_ATTR_OPTION_NAME, option->name)) 2225 goto nest_cancel; 2226 if (opt_inst_info->port && 2227 nla_put_u32(skb, TEAM_ATTR_OPTION_PORT_IFINDEX, 2228 opt_inst_info->port->dev->ifindex)) 2229 goto nest_cancel; 2230 if (opt_inst->option->array_size && 2231 nla_put_u32(skb, TEAM_ATTR_OPTION_ARRAY_INDEX, 2232 opt_inst_info->array_index)) 2233 goto nest_cancel; 2234 2235 switch (option->type) { 2236 case TEAM_OPTION_TYPE_U32: 2237 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_U32)) 2238 goto nest_cancel; 2239 if (nla_put_u32(skb, TEAM_ATTR_OPTION_DATA, ctx.data.u32_val)) 2240 goto nest_cancel; 2241 break; 2242 case TEAM_OPTION_TYPE_STRING: 2243 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_STRING)) 2244 goto nest_cancel; 2245 if (nla_put_string(skb, TEAM_ATTR_OPTION_DATA, 2246 ctx.data.str_val)) 2247 goto nest_cancel; 2248 break; 2249 case TEAM_OPTION_TYPE_BINARY: 2250 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_BINARY)) 2251 goto nest_cancel; 2252 if (nla_put(skb, TEAM_ATTR_OPTION_DATA, ctx.data.bin_val.len, 2253 ctx.data.bin_val.ptr)) 2254 goto nest_cancel; 2255 break; 2256 case TEAM_OPTION_TYPE_BOOL: 2257 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_FLAG)) 2258 goto nest_cancel; 2259 if (ctx.data.bool_val && 2260 nla_put_flag(skb, TEAM_ATTR_OPTION_DATA)) 2261 goto nest_cancel; 2262 break; 2263 case TEAM_OPTION_TYPE_S32: 2264 if (nla_put_u8(skb, TEAM_ATTR_OPTION_TYPE, NLA_S32)) 2265 goto nest_cancel; 2266 if (nla_put_s32(skb, TEAM_ATTR_OPTION_DATA, ctx.data.s32_val)) 2267 goto nest_cancel; 2268 break; 2269 default: 2270 BUG(); 2271 } 2272 if (opt_inst->removed && nla_put_flag(skb, TEAM_ATTR_OPTION_REMOVED)) 2273 goto nest_cancel; 2274 if (opt_inst->changed) { 2275 if (nla_put_flag(skb, TEAM_ATTR_OPTION_CHANGED)) 2276 goto nest_cancel; 2277 opt_inst->changed = false; 2278 } 2279 nla_nest_end(skb, option_item); 2280 return 0; 2281 2282 nest_cancel: 2283 nla_nest_cancel(skb, option_item); 2284 return -EMSGSIZE; 2285 } 2286 2287 static int __send_and_alloc_skb(struct sk_buff **pskb, 2288 struct team *team, u32 portid, 2289 team_nl_send_func_t *send_func) 2290 { 2291 int err; 2292 2293 if (*pskb) { 2294 err = send_func(*pskb, team, portid); 2295 if (err) 2296 return err; 2297 } 2298 *pskb = genlmsg_new(GENLMSG_DEFAULT_SIZE, GFP_KERNEL); 2299 if (!*pskb) 2300 return -ENOMEM; 2301 return 0; 2302 } 2303 2304 static int team_nl_send_options_get(struct team *team, u32 portid, u32 seq, 2305 int flags, team_nl_send_func_t *send_func, 2306 struct list_head *sel_opt_inst_list) 2307 { 2308 struct nlattr *option_list; 2309 struct nlmsghdr *nlh; 2310 void *hdr; 2311 struct team_option_inst *opt_inst; 2312 int err; 2313 struct sk_buff *skb = NULL; 2314 bool incomplete; 2315 int i; 2316 2317 opt_inst = list_first_entry(sel_opt_inst_list, 2318 struct team_option_inst, tmp_list); 2319 2320 start_again: 2321 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2322 if (err) 2323 return err; 2324 2325 hdr = genlmsg_put(skb, portid, seq, &team_nl_family, flags | NLM_F_MULTI, 2326 TEAM_CMD_OPTIONS_GET); 2327 if (!hdr) 2328 return -EMSGSIZE; 2329 2330 if (nla_put_u32(skb, TEAM_ATTR_TEAM_IFINDEX, team->dev->ifindex)) 2331 goto nla_put_failure; 2332 option_list = nla_nest_start(skb, TEAM_ATTR_LIST_OPTION); 2333 if (!option_list) 2334 goto nla_put_failure; 2335 2336 i = 0; 2337 incomplete = false; 2338 list_for_each_entry_from(opt_inst, sel_opt_inst_list, tmp_list) { 2339 err = team_nl_fill_one_option_get(skb, team, opt_inst); 2340 if (err) { 2341 if (err == -EMSGSIZE) { 2342 if (!i) 2343 goto errout; 2344 incomplete = true; 2345 break; 2346 } 2347 goto errout; 2348 } 2349 i++; 2350 } 2351 2352 nla_nest_end(skb, option_list); 2353 genlmsg_end(skb, hdr); 2354 if (incomplete) 2355 goto start_again; 2356 2357 send_done: 2358 nlh = nlmsg_put(skb, portid, seq, NLMSG_DONE, 0, flags | NLM_F_MULTI); 2359 if (!nlh) { 2360 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2361 if (err) 2362 goto errout; 2363 goto send_done; 2364 } 2365 2366 return send_func(skb, team, portid); 2367 2368 nla_put_failure: 2369 err = -EMSGSIZE; 2370 errout: 2371 genlmsg_cancel(skb, hdr); 2372 nlmsg_free(skb); 2373 return err; 2374 } 2375 2376 static int team_nl_cmd_options_get(struct sk_buff *skb, struct genl_info *info) 2377 { 2378 struct team *team; 2379 struct team_option_inst *opt_inst; 2380 int err; 2381 LIST_HEAD(sel_opt_inst_list); 2382 2383 team = team_nl_team_get(info); 2384 if (!team) 2385 return -EINVAL; 2386 2387 list_for_each_entry(opt_inst, &team->option_inst_list, list) 2388 list_add_tail(&opt_inst->tmp_list, &sel_opt_inst_list); 2389 err = team_nl_send_options_get(team, info->snd_portid, info->snd_seq, 2390 NLM_F_ACK, team_nl_send_unicast, 2391 &sel_opt_inst_list); 2392 2393 team_nl_team_put(team); 2394 2395 return err; 2396 } 2397 2398 static int team_nl_send_event_options_get(struct team *team, 2399 struct list_head *sel_opt_inst_list); 2400 2401 static int team_nl_cmd_options_set(struct sk_buff *skb, struct genl_info *info) 2402 { 2403 struct team *team; 2404 int err = 0; 2405 int i; 2406 struct nlattr *nl_option; 2407 LIST_HEAD(opt_inst_list); 2408 2409 team = team_nl_team_get(info); 2410 if (!team) 2411 return -EINVAL; 2412 2413 err = -EINVAL; 2414 if (!info->attrs[TEAM_ATTR_LIST_OPTION]) { 2415 err = -EINVAL; 2416 goto team_put; 2417 } 2418 2419 nla_for_each_nested(nl_option, info->attrs[TEAM_ATTR_LIST_OPTION], i) { 2420 struct nlattr *opt_attrs[TEAM_ATTR_OPTION_MAX + 1]; 2421 struct nlattr *attr; 2422 struct nlattr *attr_data; 2423 enum team_option_type opt_type; 2424 int opt_port_ifindex = 0; /* != 0 for per-port options */ 2425 u32 opt_array_index = 0; 2426 bool opt_is_array = false; 2427 struct team_option_inst *opt_inst; 2428 char *opt_name; 2429 bool opt_found = false; 2430 2431 if (nla_type(nl_option) != TEAM_ATTR_ITEM_OPTION) { 2432 err = -EINVAL; 2433 goto team_put; 2434 } 2435 err = nla_parse_nested(opt_attrs, TEAM_ATTR_OPTION_MAX, 2436 nl_option, team_nl_option_policy); 2437 if (err) 2438 goto team_put; 2439 if (!opt_attrs[TEAM_ATTR_OPTION_NAME] || 2440 !opt_attrs[TEAM_ATTR_OPTION_TYPE]) { 2441 err = -EINVAL; 2442 goto team_put; 2443 } 2444 switch (nla_get_u8(opt_attrs[TEAM_ATTR_OPTION_TYPE])) { 2445 case NLA_U32: 2446 opt_type = TEAM_OPTION_TYPE_U32; 2447 break; 2448 case NLA_STRING: 2449 opt_type = TEAM_OPTION_TYPE_STRING; 2450 break; 2451 case NLA_BINARY: 2452 opt_type = TEAM_OPTION_TYPE_BINARY; 2453 break; 2454 case NLA_FLAG: 2455 opt_type = TEAM_OPTION_TYPE_BOOL; 2456 break; 2457 case NLA_S32: 2458 opt_type = TEAM_OPTION_TYPE_S32; 2459 break; 2460 default: 2461 goto team_put; 2462 } 2463 2464 attr_data = opt_attrs[TEAM_ATTR_OPTION_DATA]; 2465 if (opt_type != TEAM_OPTION_TYPE_BOOL && !attr_data) { 2466 err = -EINVAL; 2467 goto team_put; 2468 } 2469 2470 opt_name = nla_data(opt_attrs[TEAM_ATTR_OPTION_NAME]); 2471 attr = opt_attrs[TEAM_ATTR_OPTION_PORT_IFINDEX]; 2472 if (attr) 2473 opt_port_ifindex = nla_get_u32(attr); 2474 2475 attr = opt_attrs[TEAM_ATTR_OPTION_ARRAY_INDEX]; 2476 if (attr) { 2477 opt_is_array = true; 2478 opt_array_index = nla_get_u32(attr); 2479 } 2480 2481 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 2482 struct team_option *option = opt_inst->option; 2483 struct team_gsetter_ctx ctx; 2484 struct team_option_inst_info *opt_inst_info; 2485 int tmp_ifindex; 2486 2487 opt_inst_info = &opt_inst->info; 2488 tmp_ifindex = opt_inst_info->port ? 2489 opt_inst_info->port->dev->ifindex : 0; 2490 if (option->type != opt_type || 2491 strcmp(option->name, opt_name) || 2492 tmp_ifindex != opt_port_ifindex || 2493 (option->array_size && !opt_is_array) || 2494 opt_inst_info->array_index != opt_array_index) 2495 continue; 2496 opt_found = true; 2497 ctx.info = opt_inst_info; 2498 switch (opt_type) { 2499 case TEAM_OPTION_TYPE_U32: 2500 ctx.data.u32_val = nla_get_u32(attr_data); 2501 break; 2502 case TEAM_OPTION_TYPE_STRING: 2503 if (nla_len(attr_data) > TEAM_STRING_MAX_LEN) { 2504 err = -EINVAL; 2505 goto team_put; 2506 } 2507 ctx.data.str_val = nla_data(attr_data); 2508 break; 2509 case TEAM_OPTION_TYPE_BINARY: 2510 ctx.data.bin_val.len = nla_len(attr_data); 2511 ctx.data.bin_val.ptr = nla_data(attr_data); 2512 break; 2513 case TEAM_OPTION_TYPE_BOOL: 2514 ctx.data.bool_val = attr_data ? true : false; 2515 break; 2516 case TEAM_OPTION_TYPE_S32: 2517 ctx.data.s32_val = nla_get_s32(attr_data); 2518 break; 2519 default: 2520 BUG(); 2521 } 2522 err = team_option_set(team, opt_inst, &ctx); 2523 if (err) 2524 goto team_put; 2525 opt_inst->changed = true; 2526 list_add(&opt_inst->tmp_list, &opt_inst_list); 2527 } 2528 if (!opt_found) { 2529 err = -ENOENT; 2530 goto team_put; 2531 } 2532 } 2533 2534 err = team_nl_send_event_options_get(team, &opt_inst_list); 2535 2536 team_put: 2537 team_nl_team_put(team); 2538 2539 return err; 2540 } 2541 2542 static int team_nl_fill_one_port_get(struct sk_buff *skb, 2543 struct team_port *port) 2544 { 2545 struct nlattr *port_item; 2546 2547 port_item = nla_nest_start(skb, TEAM_ATTR_ITEM_PORT); 2548 if (!port_item) 2549 goto nest_cancel; 2550 if (nla_put_u32(skb, TEAM_ATTR_PORT_IFINDEX, port->dev->ifindex)) 2551 goto nest_cancel; 2552 if (port->changed) { 2553 if (nla_put_flag(skb, TEAM_ATTR_PORT_CHANGED)) 2554 goto nest_cancel; 2555 port->changed = false; 2556 } 2557 if ((port->removed && 2558 nla_put_flag(skb, TEAM_ATTR_PORT_REMOVED)) || 2559 (port->state.linkup && 2560 nla_put_flag(skb, TEAM_ATTR_PORT_LINKUP)) || 2561 nla_put_u32(skb, TEAM_ATTR_PORT_SPEED, port->state.speed) || 2562 nla_put_u8(skb, TEAM_ATTR_PORT_DUPLEX, port->state.duplex)) 2563 goto nest_cancel; 2564 nla_nest_end(skb, port_item); 2565 return 0; 2566 2567 nest_cancel: 2568 nla_nest_cancel(skb, port_item); 2569 return -EMSGSIZE; 2570 } 2571 2572 static int team_nl_send_port_list_get(struct team *team, u32 portid, u32 seq, 2573 int flags, team_nl_send_func_t *send_func, 2574 struct team_port *one_port) 2575 { 2576 struct nlattr *port_list; 2577 struct nlmsghdr *nlh; 2578 void *hdr; 2579 struct team_port *port; 2580 int err; 2581 struct sk_buff *skb = NULL; 2582 bool incomplete; 2583 int i; 2584 2585 port = list_first_entry_or_null(&team->port_list, 2586 struct team_port, list); 2587 2588 start_again: 2589 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2590 if (err) 2591 return err; 2592 2593 hdr = genlmsg_put(skb, portid, seq, &team_nl_family, flags | NLM_F_MULTI, 2594 TEAM_CMD_PORT_LIST_GET); 2595 if (!hdr) 2596 return -EMSGSIZE; 2597 2598 if (nla_put_u32(skb, TEAM_ATTR_TEAM_IFINDEX, team->dev->ifindex)) 2599 goto nla_put_failure; 2600 port_list = nla_nest_start(skb, TEAM_ATTR_LIST_PORT); 2601 if (!port_list) 2602 goto nla_put_failure; 2603 2604 i = 0; 2605 incomplete = false; 2606 2607 /* If one port is selected, called wants to send port list containing 2608 * only this port. Otherwise go through all listed ports and send all 2609 */ 2610 if (one_port) { 2611 err = team_nl_fill_one_port_get(skb, one_port); 2612 if (err) 2613 goto errout; 2614 } else if (port) { 2615 list_for_each_entry_from(port, &team->port_list, list) { 2616 err = team_nl_fill_one_port_get(skb, port); 2617 if (err) { 2618 if (err == -EMSGSIZE) { 2619 if (!i) 2620 goto errout; 2621 incomplete = true; 2622 break; 2623 } 2624 goto errout; 2625 } 2626 i++; 2627 } 2628 } 2629 2630 nla_nest_end(skb, port_list); 2631 genlmsg_end(skb, hdr); 2632 if (incomplete) 2633 goto start_again; 2634 2635 send_done: 2636 nlh = nlmsg_put(skb, portid, seq, NLMSG_DONE, 0, flags | NLM_F_MULTI); 2637 if (!nlh) { 2638 err = __send_and_alloc_skb(&skb, team, portid, send_func); 2639 if (err) 2640 goto errout; 2641 goto send_done; 2642 } 2643 2644 return send_func(skb, team, portid); 2645 2646 nla_put_failure: 2647 err = -EMSGSIZE; 2648 errout: 2649 genlmsg_cancel(skb, hdr); 2650 nlmsg_free(skb); 2651 return err; 2652 } 2653 2654 static int team_nl_cmd_port_list_get(struct sk_buff *skb, 2655 struct genl_info *info) 2656 { 2657 struct team *team; 2658 int err; 2659 2660 team = team_nl_team_get(info); 2661 if (!team) 2662 return -EINVAL; 2663 2664 err = team_nl_send_port_list_get(team, info->snd_portid, info->snd_seq, 2665 NLM_F_ACK, team_nl_send_unicast, NULL); 2666 2667 team_nl_team_put(team); 2668 2669 return err; 2670 } 2671 2672 static const struct genl_ops team_nl_ops[] = { 2673 { 2674 .cmd = TEAM_CMD_NOOP, 2675 .doit = team_nl_cmd_noop, 2676 .policy = team_nl_policy, 2677 }, 2678 { 2679 .cmd = TEAM_CMD_OPTIONS_SET, 2680 .doit = team_nl_cmd_options_set, 2681 .policy = team_nl_policy, 2682 .flags = GENL_ADMIN_PERM, 2683 }, 2684 { 2685 .cmd = TEAM_CMD_OPTIONS_GET, 2686 .doit = team_nl_cmd_options_get, 2687 .policy = team_nl_policy, 2688 .flags = GENL_ADMIN_PERM, 2689 }, 2690 { 2691 .cmd = TEAM_CMD_PORT_LIST_GET, 2692 .doit = team_nl_cmd_port_list_get, 2693 .policy = team_nl_policy, 2694 .flags = GENL_ADMIN_PERM, 2695 }, 2696 }; 2697 2698 static const struct genl_multicast_group team_nl_mcgrps[] = { 2699 { .name = TEAM_GENL_CHANGE_EVENT_MC_GRP_NAME, }, 2700 }; 2701 2702 static int team_nl_send_multicast(struct sk_buff *skb, 2703 struct team *team, u32 portid) 2704 { 2705 return genlmsg_multicast_netns(&team_nl_family, dev_net(team->dev), 2706 skb, 0, 0, GFP_KERNEL); 2707 } 2708 2709 static int team_nl_send_event_options_get(struct team *team, 2710 struct list_head *sel_opt_inst_list) 2711 { 2712 return team_nl_send_options_get(team, 0, 0, 0, team_nl_send_multicast, 2713 sel_opt_inst_list); 2714 } 2715 2716 static int team_nl_send_event_port_get(struct team *team, 2717 struct team_port *port) 2718 { 2719 return team_nl_send_port_list_get(team, 0, 0, 0, team_nl_send_multicast, 2720 port); 2721 } 2722 2723 static int team_nl_init(void) 2724 { 2725 return genl_register_family_with_ops_groups(&team_nl_family, team_nl_ops, 2726 team_nl_mcgrps); 2727 } 2728 2729 static void team_nl_fini(void) 2730 { 2731 genl_unregister_family(&team_nl_family); 2732 } 2733 2734 2735 /****************** 2736 * Change checkers 2737 ******************/ 2738 2739 static void __team_options_change_check(struct team *team) 2740 { 2741 int err; 2742 struct team_option_inst *opt_inst; 2743 LIST_HEAD(sel_opt_inst_list); 2744 2745 list_for_each_entry(opt_inst, &team->option_inst_list, list) { 2746 if (opt_inst->changed) 2747 list_add_tail(&opt_inst->tmp_list, &sel_opt_inst_list); 2748 } 2749 err = team_nl_send_event_options_get(team, &sel_opt_inst_list); 2750 if (err && err != -ESRCH) 2751 netdev_warn(team->dev, "Failed to send options change via netlink (err %d)\n", 2752 err); 2753 } 2754 2755 /* rtnl lock is held */ 2756 2757 static void __team_port_change_send(struct team_port *port, bool linkup) 2758 { 2759 int err; 2760 2761 port->changed = true; 2762 port->state.linkup = linkup; 2763 team_refresh_port_linkup(port); 2764 if (linkup) { 2765 struct ethtool_cmd ecmd; 2766 2767 err = __ethtool_get_settings(port->dev, &ecmd); 2768 if (!err) { 2769 port->state.speed = ethtool_cmd_speed(&ecmd); 2770 port->state.duplex = ecmd.duplex; 2771 goto send_event; 2772 } 2773 } 2774 port->state.speed = 0; 2775 port->state.duplex = 0; 2776 2777 send_event: 2778 err = team_nl_send_event_port_get(port->team, port); 2779 if (err && err != -ESRCH) 2780 netdev_warn(port->team->dev, "Failed to send port change of device %s via netlink (err %d)\n", 2781 port->dev->name, err); 2782 2783 } 2784 2785 static void __team_carrier_check(struct team *team) 2786 { 2787 struct team_port *port; 2788 bool team_linkup; 2789 2790 if (team->user_carrier_enabled) 2791 return; 2792 2793 team_linkup = false; 2794 list_for_each_entry(port, &team->port_list, list) { 2795 if (port->linkup) { 2796 team_linkup = true; 2797 break; 2798 } 2799 } 2800 2801 if (team_linkup) 2802 netif_carrier_on(team->dev); 2803 else 2804 netif_carrier_off(team->dev); 2805 } 2806 2807 static void __team_port_change_check(struct team_port *port, bool linkup) 2808 { 2809 if (port->state.linkup != linkup) 2810 __team_port_change_send(port, linkup); 2811 __team_carrier_check(port->team); 2812 } 2813 2814 static void __team_port_change_port_added(struct team_port *port, bool linkup) 2815 { 2816 __team_port_change_send(port, linkup); 2817 __team_carrier_check(port->team); 2818 } 2819 2820 static void __team_port_change_port_removed(struct team_port *port) 2821 { 2822 port->removed = true; 2823 __team_port_change_send(port, false); 2824 __team_carrier_check(port->team); 2825 } 2826 2827 static void team_port_change_check(struct team_port *port, bool linkup) 2828 { 2829 struct team *team = port->team; 2830 2831 mutex_lock(&team->lock); 2832 __team_port_change_check(port, linkup); 2833 mutex_unlock(&team->lock); 2834 } 2835 2836 2837 /************************************ 2838 * Net device notifier event handler 2839 ************************************/ 2840 2841 static int team_device_event(struct notifier_block *unused, 2842 unsigned long event, void *ptr) 2843 { 2844 struct net_device *dev = netdev_notifier_info_to_dev(ptr); 2845 struct team_port *port; 2846 2847 port = team_port_get_rtnl(dev); 2848 if (!port) 2849 return NOTIFY_DONE; 2850 2851 switch (event) { 2852 case NETDEV_UP: 2853 if (netif_carrier_ok(dev)) 2854 team_port_change_check(port, true); 2855 break; 2856 case NETDEV_DOWN: 2857 team_port_change_check(port, false); 2858 break; 2859 case NETDEV_CHANGE: 2860 if (netif_running(port->dev)) 2861 team_port_change_check(port, 2862 !!netif_carrier_ok(port->dev)); 2863 break; 2864 case NETDEV_UNREGISTER: 2865 team_del_slave(port->team->dev, dev); 2866 break; 2867 case NETDEV_FEAT_CHANGE: 2868 team_compute_features(port->team); 2869 break; 2870 case NETDEV_PRECHANGEMTU: 2871 /* Forbid to change mtu of underlaying device */ 2872 if (!port->team->port_mtu_change_allowed) 2873 return NOTIFY_BAD; 2874 break; 2875 case NETDEV_PRE_TYPE_CHANGE: 2876 /* Forbid to change type of underlaying device */ 2877 return NOTIFY_BAD; 2878 case NETDEV_RESEND_IGMP: 2879 /* Propagate to master device */ 2880 call_netdevice_notifiers(event, port->team->dev); 2881 break; 2882 } 2883 return NOTIFY_DONE; 2884 } 2885 2886 static struct notifier_block team_notifier_block __read_mostly = { 2887 .notifier_call = team_device_event, 2888 }; 2889 2890 2891 /*********************** 2892 * Module init and exit 2893 ***********************/ 2894 2895 static int __init team_module_init(void) 2896 { 2897 int err; 2898 2899 register_netdevice_notifier(&team_notifier_block); 2900 2901 err = rtnl_link_register(&team_link_ops); 2902 if (err) 2903 goto err_rtnl_reg; 2904 2905 err = team_nl_init(); 2906 if (err) 2907 goto err_nl_init; 2908 2909 return 0; 2910 2911 err_nl_init: 2912 rtnl_link_unregister(&team_link_ops); 2913 2914 err_rtnl_reg: 2915 unregister_netdevice_notifier(&team_notifier_block); 2916 2917 return err; 2918 } 2919 2920 static void __exit team_module_exit(void) 2921 { 2922 team_nl_fini(); 2923 rtnl_link_unregister(&team_link_ops); 2924 unregister_netdevice_notifier(&team_notifier_block); 2925 } 2926 2927 module_init(team_module_init); 2928 module_exit(team_module_exit); 2929 2930 MODULE_LICENSE("GPL v2"); 2931 MODULE_AUTHOR("Jiri Pirko <jpirko@redhat.com>"); 2932 MODULE_DESCRIPTION("Ethernet team device driver"); 2933 MODULE_ALIAS_RTNL_LINK(DRV_NAME); 2934