1 /* 2 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved. 3 * 4 * This program is free software; you can redistribute it and/or modify it 5 * under the terms of the GNU General Public License as published by the Free 6 * Software Foundation; either version 2 of the License, or (at your option) 7 * any later version. 8 * 9 * This program is distributed in the hope that it will be useful, but WITHOUT 10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 12 * more details. 13 * 14 * You should have received a copy of the GNU General Public License along with 15 * this program; if not, write to the Free Software Foundation, Inc., 59 16 * Temple Place - Suite 330, Boston, MA 02111-1307, USA. 17 * 18 * The full GNU General Public License is included in this distribution in the 19 * file called LICENSE. 20 * 21 */ 22 23 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt 24 25 #include <linux/skbuff.h> 26 #include <linux/if_ether.h> 27 #include <linux/netdevice.h> 28 #include <linux/spinlock.h> 29 #include <linux/ethtool.h> 30 #include <linux/etherdevice.h> 31 #include <linux/if_bonding.h> 32 #include <linux/pkt_sched.h> 33 #include <net/net_namespace.h> 34 #include "bonding.h" 35 #include "bond_3ad.h" 36 37 /* General definitions */ 38 #define AD_SHORT_TIMEOUT 1 39 #define AD_LONG_TIMEOUT 0 40 #define AD_STANDBY 0x2 41 #define AD_MAX_TX_IN_SECOND 3 42 #define AD_COLLECTOR_MAX_DELAY 0 43 44 /* Timer definitions (43.4.4 in the 802.3ad standard) */ 45 #define AD_FAST_PERIODIC_TIME 1 46 #define AD_SLOW_PERIODIC_TIME 30 47 #define AD_SHORT_TIMEOUT_TIME (3*AD_FAST_PERIODIC_TIME) 48 #define AD_LONG_TIMEOUT_TIME (3*AD_SLOW_PERIODIC_TIME) 49 #define AD_CHURN_DETECTION_TIME 60 50 #define AD_AGGREGATE_WAIT_TIME 2 51 52 /* Port state definitions (43.4.2.2 in the 802.3ad standard) */ 53 #define AD_STATE_LACP_ACTIVITY 0x1 54 #define AD_STATE_LACP_TIMEOUT 0x2 55 #define AD_STATE_AGGREGATION 0x4 56 #define AD_STATE_SYNCHRONIZATION 0x8 57 #define AD_STATE_COLLECTING 0x10 58 #define AD_STATE_DISTRIBUTING 0x20 59 #define AD_STATE_DEFAULTED 0x40 60 #define AD_STATE_EXPIRED 0x80 61 62 /* Port Variables definitions used by the State Machines (43.4.7 in the 63 * 802.3ad standard) 64 */ 65 #define AD_PORT_BEGIN 0x1 66 #define AD_PORT_LACP_ENABLED 0x2 67 #define AD_PORT_ACTOR_CHURN 0x4 68 #define AD_PORT_PARTNER_CHURN 0x8 69 #define AD_PORT_READY 0x10 70 #define AD_PORT_READY_N 0x20 71 #define AD_PORT_MATCHED 0x40 72 #define AD_PORT_STANDBY 0x80 73 #define AD_PORT_SELECTED 0x100 74 #define AD_PORT_MOVED 0x200 75 76 /* Port Key definitions 77 * key is determined according to the link speed, duplex and 78 * user key (which is yet not supported) 79 * -------------------------------------------------------------- 80 * Port key : | User key | Speed | Duplex | 81 * -------------------------------------------------------------- 82 * 16 6 1 0 83 */ 84 #define AD_DUPLEX_KEY_BITS 0x1 85 #define AD_SPEED_KEY_BITS 0x3E 86 #define AD_USER_KEY_BITS 0xFFC0 87 88 #define AD_LINK_SPEED_BITMASK_1MBPS 0x1 89 #define AD_LINK_SPEED_BITMASK_10MBPS 0x2 90 #define AD_LINK_SPEED_BITMASK_100MBPS 0x4 91 #define AD_LINK_SPEED_BITMASK_1000MBPS 0x8 92 #define AD_LINK_SPEED_BITMASK_10000MBPS 0x10 93 94 /* compare MAC addresses */ 95 #define MAC_ADDRESS_EQUAL(A, B) \ 96 ether_addr_equal_64bits((const u8 *)A, (const u8 *)B) 97 98 static struct mac_addr null_mac_addr = { { 0, 0, 0, 0, 0, 0 } }; 99 static u16 ad_ticks_per_sec; 100 static const int ad_delta_in_ticks = (AD_TIMER_INTERVAL * HZ) / 1000; 101 102 static const u8 lacpdu_mcast_addr[ETH_ALEN] = MULTICAST_LACPDU_ADDR; 103 104 /* ================= main 802.3ad protocol functions ================== */ 105 static int ad_lacpdu_send(struct port *port); 106 static int ad_marker_send(struct port *port, struct bond_marker *marker); 107 static void ad_mux_machine(struct port *port); 108 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port); 109 static void ad_tx_machine(struct port *port); 110 static void ad_periodic_machine(struct port *port); 111 static void ad_port_selection_logic(struct port *port); 112 static void ad_agg_selection_logic(struct aggregator *aggregator); 113 static void ad_clear_agg(struct aggregator *aggregator); 114 static void ad_initialize_agg(struct aggregator *aggregator); 115 static void ad_initialize_port(struct port *port, int lacp_fast); 116 static void ad_enable_collecting_distributing(struct port *port); 117 static void ad_disable_collecting_distributing(struct port *port); 118 static void ad_marker_info_received(struct bond_marker *marker_info, 119 struct port *port); 120 static void ad_marker_response_received(struct bond_marker *marker, 121 struct port *port); 122 123 124 /* ================= api to bonding and kernel code ================== */ 125 126 /** 127 * __get_bond_by_port - get the port's bonding struct 128 * @port: the port we're looking at 129 * 130 * Return @port's bonding struct, or %NULL if it can't be found. 131 */ 132 static inline struct bonding *__get_bond_by_port(struct port *port) 133 { 134 if (port->slave == NULL) 135 return NULL; 136 137 return bond_get_bond_by_slave(port->slave); 138 } 139 140 /** 141 * __get_first_agg - get the first aggregator in the bond 142 * @bond: the bond we're looking at 143 * 144 * Return the aggregator of the first slave in @bond, or %NULL if it can't be 145 * found. 146 * The caller must hold RCU or RTNL lock. 147 */ 148 static inline struct aggregator *__get_first_agg(struct port *port) 149 { 150 struct bonding *bond = __get_bond_by_port(port); 151 struct slave *first_slave; 152 struct aggregator *agg; 153 154 /* If there's no bond for this port, or bond has no slaves */ 155 if (bond == NULL) 156 return NULL; 157 158 rcu_read_lock(); 159 first_slave = bond_first_slave_rcu(bond); 160 agg = first_slave ? &(SLAVE_AD_INFO(first_slave).aggregator) : NULL; 161 rcu_read_unlock(); 162 163 return agg; 164 } 165 166 /** 167 * __agg_has_partner - see if we have a partner 168 * @agg: the agregator we're looking at 169 * 170 * Return nonzero if aggregator has a partner (denoted by a non-zero ether 171 * address for the partner). Return 0 if not. 172 */ 173 static inline int __agg_has_partner(struct aggregator *agg) 174 { 175 return !is_zero_ether_addr(agg->partner_system.mac_addr_value); 176 } 177 178 /** 179 * __disable_port - disable the port's slave 180 * @port: the port we're looking at 181 */ 182 static inline void __disable_port(struct port *port) 183 { 184 bond_set_slave_inactive_flags(port->slave); 185 } 186 187 /** 188 * __enable_port - enable the port's slave, if it's up 189 * @port: the port we're looking at 190 */ 191 static inline void __enable_port(struct port *port) 192 { 193 struct slave *slave = port->slave; 194 195 if ((slave->link == BOND_LINK_UP) && IS_UP(slave->dev)) 196 bond_set_slave_active_flags(slave); 197 } 198 199 /** 200 * __port_is_enabled - check if the port's slave is in active state 201 * @port: the port we're looking at 202 */ 203 static inline int __port_is_enabled(struct port *port) 204 { 205 return bond_is_active_slave(port->slave); 206 } 207 208 /** 209 * __get_agg_selection_mode - get the aggregator selection mode 210 * @port: the port we're looking at 211 * 212 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT. 213 */ 214 static inline u32 __get_agg_selection_mode(struct port *port) 215 { 216 struct bonding *bond = __get_bond_by_port(port); 217 218 if (bond == NULL) 219 return BOND_AD_STABLE; 220 221 return bond->params.ad_select; 222 } 223 224 /** 225 * __check_agg_selection_timer - check if the selection timer has expired 226 * @port: the port we're looking at 227 */ 228 static inline int __check_agg_selection_timer(struct port *port) 229 { 230 struct bonding *bond = __get_bond_by_port(port); 231 232 if (bond == NULL) 233 return 0; 234 235 return BOND_AD_INFO(bond).agg_select_timer ? 1 : 0; 236 } 237 238 /** 239 * __get_state_machine_lock - lock the port's state machines 240 * @port: the port we're looking at 241 */ 242 static inline void __get_state_machine_lock(struct port *port) 243 { 244 spin_lock_bh(&(SLAVE_AD_INFO(port->slave).state_machine_lock)); 245 } 246 247 /** 248 * __release_state_machine_lock - unlock the port's state machines 249 * @port: the port we're looking at 250 */ 251 static inline void __release_state_machine_lock(struct port *port) 252 { 253 spin_unlock_bh(&(SLAVE_AD_INFO(port->slave).state_machine_lock)); 254 } 255 256 /** 257 * __get_link_speed - get a port's speed 258 * @port: the port we're looking at 259 * 260 * Return @port's speed in 802.3ad bitmask format. i.e. one of: 261 * 0, 262 * %AD_LINK_SPEED_BITMASK_10MBPS, 263 * %AD_LINK_SPEED_BITMASK_100MBPS, 264 * %AD_LINK_SPEED_BITMASK_1000MBPS, 265 * %AD_LINK_SPEED_BITMASK_10000MBPS 266 */ 267 static u16 __get_link_speed(struct port *port) 268 { 269 struct slave *slave = port->slave; 270 u16 speed; 271 272 /* this if covers only a special case: when the configuration starts 273 * with link down, it sets the speed to 0. 274 * This is done in spite of the fact that the e100 driver reports 0 275 * to be compatible with MVT in the future. 276 */ 277 if (slave->link != BOND_LINK_UP) 278 speed = 0; 279 else { 280 switch (slave->speed) { 281 case SPEED_10: 282 speed = AD_LINK_SPEED_BITMASK_10MBPS; 283 break; 284 285 case SPEED_100: 286 speed = AD_LINK_SPEED_BITMASK_100MBPS; 287 break; 288 289 case SPEED_1000: 290 speed = AD_LINK_SPEED_BITMASK_1000MBPS; 291 break; 292 293 case SPEED_10000: 294 speed = AD_LINK_SPEED_BITMASK_10000MBPS; 295 break; 296 297 default: 298 /* unknown speed value from ethtool. shouldn't happen */ 299 speed = 0; 300 break; 301 } 302 } 303 304 pr_debug("Port %d Received link speed %d update from adapter\n", 305 port->actor_port_number, speed); 306 return speed; 307 } 308 309 /** 310 * __get_duplex - get a port's duplex 311 * @port: the port we're looking at 312 * 313 * Return @port's duplex in 802.3ad bitmask format. i.e.: 314 * 0x01 if in full duplex 315 * 0x00 otherwise 316 */ 317 static u8 __get_duplex(struct port *port) 318 { 319 struct slave *slave = port->slave; 320 321 u8 retval; 322 323 /* handling a special case: when the configuration starts with 324 * link down, it sets the duplex to 0. 325 */ 326 if (slave->link != BOND_LINK_UP) 327 retval = 0x0; 328 else { 329 switch (slave->duplex) { 330 case DUPLEX_FULL: 331 retval = 0x1; 332 pr_debug("Port %d Received status full duplex update from adapter\n", 333 port->actor_port_number); 334 break; 335 case DUPLEX_HALF: 336 default: 337 retval = 0x0; 338 pr_debug("Port %d Received status NOT full duplex update from adapter\n", 339 port->actor_port_number); 340 break; 341 } 342 } 343 return retval; 344 } 345 346 /** 347 * __initialize_port_locks - initialize a port's STATE machine spinlock 348 * @port: the slave of the port we're looking at 349 */ 350 static inline void __initialize_port_locks(struct slave *slave) 351 { 352 /* make sure it isn't called twice */ 353 spin_lock_init(&(SLAVE_AD_INFO(slave).state_machine_lock)); 354 } 355 356 /* Conversions */ 357 358 /** 359 * __ad_timer_to_ticks - convert a given timer type to AD module ticks 360 * @timer_type: which timer to operate 361 * @par: timer parameter. see below 362 * 363 * If @timer_type is %current_while_timer, @par indicates long/short timer. 364 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME, 365 * %SLOW_PERIODIC_TIME. 366 */ 367 static u16 __ad_timer_to_ticks(u16 timer_type, u16 par) 368 { 369 u16 retval = 0; /* to silence the compiler */ 370 371 switch (timer_type) { 372 case AD_CURRENT_WHILE_TIMER: /* for rx machine usage */ 373 if (par) 374 retval = (AD_SHORT_TIMEOUT_TIME*ad_ticks_per_sec); 375 else 376 retval = (AD_LONG_TIMEOUT_TIME*ad_ticks_per_sec); 377 break; 378 case AD_ACTOR_CHURN_TIMER: /* for local churn machine */ 379 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec); 380 break; 381 case AD_PERIODIC_TIMER: /* for periodic machine */ 382 retval = (par*ad_ticks_per_sec); /* long timeout */ 383 break; 384 case AD_PARTNER_CHURN_TIMER: /* for remote churn machine */ 385 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec); 386 break; 387 case AD_WAIT_WHILE_TIMER: /* for selection machine */ 388 retval = (AD_AGGREGATE_WAIT_TIME*ad_ticks_per_sec); 389 break; 390 } 391 392 return retval; 393 } 394 395 396 /* ================= ad_rx_machine helper functions ================== */ 397 398 /** 399 * __choose_matched - update a port's matched variable from a received lacpdu 400 * @lacpdu: the lacpdu we've received 401 * @port: the port we're looking at 402 * 403 * Update the value of the matched variable, using parameter values from a 404 * newly received lacpdu. Parameter values for the partner carried in the 405 * received PDU are compared with the corresponding operational parameter 406 * values for the actor. Matched is set to TRUE if all of these parameters 407 * match and the PDU parameter partner_state.aggregation has the same value as 408 * actor_oper_port_state.aggregation and lacp will actively maintain the link 409 * in the aggregation. Matched is also set to TRUE if the value of 410 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates 411 * an individual link and lacp will actively maintain the link. Otherwise, 412 * matched is set to FALSE. LACP is considered to be actively maintaining the 413 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both 414 * the actor's actor_oper_port_state.lacp_activity and the PDU's 415 * partner_state.lacp_activity variables are TRUE. 416 * 417 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is 418 * used here to implement the language from 802.3ad 43.4.9 that requires 419 * recordPDU to "match" the LACPDU parameters to the stored values. 420 */ 421 static void __choose_matched(struct lacpdu *lacpdu, struct port *port) 422 { 423 /* check if all parameters are alike 424 * or this is individual link(aggregation == FALSE) 425 * then update the state machine Matched variable. 426 */ 427 if (((ntohs(lacpdu->partner_port) == port->actor_port_number) && 428 (ntohs(lacpdu->partner_port_priority) == port->actor_port_priority) && 429 MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) && 430 (ntohs(lacpdu->partner_system_priority) == port->actor_system_priority) && 431 (ntohs(lacpdu->partner_key) == port->actor_oper_port_key) && 432 ((lacpdu->partner_state & AD_STATE_AGGREGATION) == (port->actor_oper_port_state & AD_STATE_AGGREGATION))) || 433 ((lacpdu->actor_state & AD_STATE_AGGREGATION) == 0) 434 ) { 435 port->sm_vars |= AD_PORT_MATCHED; 436 } else { 437 port->sm_vars &= ~AD_PORT_MATCHED; 438 } 439 } 440 441 /** 442 * __record_pdu - record parameters from a received lacpdu 443 * @lacpdu: the lacpdu we've received 444 * @port: the port we're looking at 445 * 446 * Record the parameter values for the Actor carried in a received lacpdu as 447 * the current partner operational parameter values and sets 448 * actor_oper_port_state.defaulted to FALSE. 449 */ 450 static void __record_pdu(struct lacpdu *lacpdu, struct port *port) 451 { 452 if (lacpdu && port) { 453 struct port_params *partner = &port->partner_oper; 454 455 __choose_matched(lacpdu, port); 456 /* record the new parameter values for the partner 457 * operational 458 */ 459 partner->port_number = ntohs(lacpdu->actor_port); 460 partner->port_priority = ntohs(lacpdu->actor_port_priority); 461 partner->system = lacpdu->actor_system; 462 partner->system_priority = ntohs(lacpdu->actor_system_priority); 463 partner->key = ntohs(lacpdu->actor_key); 464 partner->port_state = lacpdu->actor_state; 465 466 /* set actor_oper_port_state.defaulted to FALSE */ 467 port->actor_oper_port_state &= ~AD_STATE_DEFAULTED; 468 469 /* set the partner sync. to on if the partner is sync, 470 * and the port is matched 471 */ 472 if ((port->sm_vars & AD_PORT_MATCHED) 473 && (lacpdu->actor_state & AD_STATE_SYNCHRONIZATION)) 474 partner->port_state |= AD_STATE_SYNCHRONIZATION; 475 else 476 partner->port_state &= ~AD_STATE_SYNCHRONIZATION; 477 } 478 } 479 480 /** 481 * __record_default - record default parameters 482 * @port: the port we're looking at 483 * 484 * This function records the default parameter values for the partner carried 485 * in the Partner Admin parameters as the current partner operational parameter 486 * values and sets actor_oper_port_state.defaulted to TRUE. 487 */ 488 static void __record_default(struct port *port) 489 { 490 if (port) { 491 /* record the partner admin parameters */ 492 memcpy(&port->partner_oper, &port->partner_admin, 493 sizeof(struct port_params)); 494 495 /* set actor_oper_port_state.defaulted to true */ 496 port->actor_oper_port_state |= AD_STATE_DEFAULTED; 497 } 498 } 499 500 /** 501 * __update_selected - update a port's Selected variable from a received lacpdu 502 * @lacpdu: the lacpdu we've received 503 * @port: the port we're looking at 504 * 505 * Update the value of the selected variable, using parameter values from a 506 * newly received lacpdu. The parameter values for the Actor carried in the 507 * received PDU are compared with the corresponding operational parameter 508 * values for the ports partner. If one or more of the comparisons shows that 509 * the value(s) received in the PDU differ from the current operational values, 510 * then selected is set to FALSE and actor_oper_port_state.synchronization is 511 * set to out_of_sync. Otherwise, selected remains unchanged. 512 */ 513 static void __update_selected(struct lacpdu *lacpdu, struct port *port) 514 { 515 if (lacpdu && port) { 516 const struct port_params *partner = &port->partner_oper; 517 518 /* check if any parameter is different then 519 * update the state machine selected variable. 520 */ 521 if (ntohs(lacpdu->actor_port) != partner->port_number || 522 ntohs(lacpdu->actor_port_priority) != partner->port_priority || 523 !MAC_ADDRESS_EQUAL(&lacpdu->actor_system, &partner->system) || 524 ntohs(lacpdu->actor_system_priority) != partner->system_priority || 525 ntohs(lacpdu->actor_key) != partner->key || 526 (lacpdu->actor_state & AD_STATE_AGGREGATION) != (partner->port_state & AD_STATE_AGGREGATION)) { 527 port->sm_vars &= ~AD_PORT_SELECTED; 528 } 529 } 530 } 531 532 /** 533 * __update_default_selected - update a port's Selected variable from Partner 534 * @port: the port we're looking at 535 * 536 * This function updates the value of the selected variable, using the partner 537 * administrative parameter values. The administrative values are compared with 538 * the corresponding operational parameter values for the partner. If one or 539 * more of the comparisons shows that the administrative value(s) differ from 540 * the current operational values, then Selected is set to FALSE and 541 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise, 542 * Selected remains unchanged. 543 */ 544 static void __update_default_selected(struct port *port) 545 { 546 if (port) { 547 const struct port_params *admin = &port->partner_admin; 548 const struct port_params *oper = &port->partner_oper; 549 550 /* check if any parameter is different then 551 * update the state machine selected variable. 552 */ 553 if (admin->port_number != oper->port_number || 554 admin->port_priority != oper->port_priority || 555 !MAC_ADDRESS_EQUAL(&admin->system, &oper->system) || 556 admin->system_priority != oper->system_priority || 557 admin->key != oper->key || 558 (admin->port_state & AD_STATE_AGGREGATION) 559 != (oper->port_state & AD_STATE_AGGREGATION)) { 560 port->sm_vars &= ~AD_PORT_SELECTED; 561 } 562 } 563 } 564 565 /** 566 * __update_ntt - update a port's ntt variable from a received lacpdu 567 * @lacpdu: the lacpdu we've received 568 * @port: the port we're looking at 569 * 570 * Updates the value of the ntt variable, using parameter values from a newly 571 * received lacpdu. The parameter values for the partner carried in the 572 * received PDU are compared with the corresponding operational parameter 573 * values for the Actor. If one or more of the comparisons shows that the 574 * value(s) received in the PDU differ from the current operational values, 575 * then ntt is set to TRUE. Otherwise, ntt remains unchanged. 576 */ 577 static void __update_ntt(struct lacpdu *lacpdu, struct port *port) 578 { 579 /* validate lacpdu and port */ 580 if (lacpdu && port) { 581 /* check if any parameter is different then 582 * update the port->ntt. 583 */ 584 if ((ntohs(lacpdu->partner_port) != port->actor_port_number) || 585 (ntohs(lacpdu->partner_port_priority) != port->actor_port_priority) || 586 !MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) || 587 (ntohs(lacpdu->partner_system_priority) != port->actor_system_priority) || 588 (ntohs(lacpdu->partner_key) != port->actor_oper_port_key) || 589 ((lacpdu->partner_state & AD_STATE_LACP_ACTIVITY) != (port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY)) || 590 ((lacpdu->partner_state & AD_STATE_LACP_TIMEOUT) != (port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT)) || 591 ((lacpdu->partner_state & AD_STATE_SYNCHRONIZATION) != (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) || 592 ((lacpdu->partner_state & AD_STATE_AGGREGATION) != (port->actor_oper_port_state & AD_STATE_AGGREGATION)) 593 ) { 594 port->ntt = true; 595 } 596 } 597 } 598 599 /** 600 * __agg_ports_are_ready - check if all ports in an aggregator are ready 601 * @aggregator: the aggregator we're looking at 602 * 603 */ 604 static int __agg_ports_are_ready(struct aggregator *aggregator) 605 { 606 struct port *port; 607 int retval = 1; 608 609 if (aggregator) { 610 /* scan all ports in this aggregator to verfy if they are 611 * all ready. 612 */ 613 for (port = aggregator->lag_ports; 614 port; 615 port = port->next_port_in_aggregator) { 616 if (!(port->sm_vars & AD_PORT_READY_N)) { 617 retval = 0; 618 break; 619 } 620 } 621 } 622 623 return retval; 624 } 625 626 /** 627 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator 628 * @aggregator: the aggregator we're looking at 629 * @val: Should the ports' ready bit be set on or off 630 * 631 */ 632 static void __set_agg_ports_ready(struct aggregator *aggregator, int val) 633 { 634 struct port *port; 635 636 for (port = aggregator->lag_ports; port; 637 port = port->next_port_in_aggregator) { 638 if (val) 639 port->sm_vars |= AD_PORT_READY; 640 else 641 port->sm_vars &= ~AD_PORT_READY; 642 } 643 } 644 645 /** 646 * __get_agg_bandwidth - get the total bandwidth of an aggregator 647 * @aggregator: the aggregator we're looking at 648 * 649 */ 650 static u32 __get_agg_bandwidth(struct aggregator *aggregator) 651 { 652 u32 bandwidth = 0; 653 654 if (aggregator->num_of_ports) { 655 switch (__get_link_speed(aggregator->lag_ports)) { 656 case AD_LINK_SPEED_BITMASK_1MBPS: 657 bandwidth = aggregator->num_of_ports; 658 break; 659 case AD_LINK_SPEED_BITMASK_10MBPS: 660 bandwidth = aggregator->num_of_ports * 10; 661 break; 662 case AD_LINK_SPEED_BITMASK_100MBPS: 663 bandwidth = aggregator->num_of_ports * 100; 664 break; 665 case AD_LINK_SPEED_BITMASK_1000MBPS: 666 bandwidth = aggregator->num_of_ports * 1000; 667 break; 668 case AD_LINK_SPEED_BITMASK_10000MBPS: 669 bandwidth = aggregator->num_of_ports * 10000; 670 break; 671 default: 672 bandwidth = 0; /* to silence the compiler */ 673 } 674 } 675 return bandwidth; 676 } 677 678 /** 679 * __get_active_agg - get the current active aggregator 680 * @aggregator: the aggregator we're looking at 681 * 682 * Caller must hold RCU lock. 683 */ 684 static struct aggregator *__get_active_agg(struct aggregator *aggregator) 685 { 686 struct bonding *bond = aggregator->slave->bond; 687 struct list_head *iter; 688 struct slave *slave; 689 690 bond_for_each_slave_rcu(bond, slave, iter) 691 if (SLAVE_AD_INFO(slave).aggregator.is_active) 692 return &(SLAVE_AD_INFO(slave).aggregator); 693 694 return NULL; 695 } 696 697 /** 698 * __update_lacpdu_from_port - update a port's lacpdu fields 699 * @port: the port we're looking at 700 */ 701 static inline void __update_lacpdu_from_port(struct port *port) 702 { 703 struct lacpdu *lacpdu = &port->lacpdu; 704 const struct port_params *partner = &port->partner_oper; 705 706 /* update current actual Actor parameters 707 * lacpdu->subtype initialized 708 * lacpdu->version_number initialized 709 * lacpdu->tlv_type_actor_info initialized 710 * lacpdu->actor_information_length initialized 711 */ 712 713 lacpdu->actor_system_priority = htons(port->actor_system_priority); 714 lacpdu->actor_system = port->actor_system; 715 lacpdu->actor_key = htons(port->actor_oper_port_key); 716 lacpdu->actor_port_priority = htons(port->actor_port_priority); 717 lacpdu->actor_port = htons(port->actor_port_number); 718 lacpdu->actor_state = port->actor_oper_port_state; 719 720 /* lacpdu->reserved_3_1 initialized 721 * lacpdu->tlv_type_partner_info initialized 722 * lacpdu->partner_information_length initialized 723 */ 724 725 lacpdu->partner_system_priority = htons(partner->system_priority); 726 lacpdu->partner_system = partner->system; 727 lacpdu->partner_key = htons(partner->key); 728 lacpdu->partner_port_priority = htons(partner->port_priority); 729 lacpdu->partner_port = htons(partner->port_number); 730 lacpdu->partner_state = partner->port_state; 731 732 /* lacpdu->reserved_3_2 initialized 733 * lacpdu->tlv_type_collector_info initialized 734 * lacpdu->collector_information_length initialized 735 * collector_max_delay initialized 736 * reserved_12[12] initialized 737 * tlv_type_terminator initialized 738 * terminator_length initialized 739 * reserved_50[50] initialized 740 */ 741 } 742 743 /* ================= main 802.3ad protocol code ========================= */ 744 745 /** 746 * ad_lacpdu_send - send out a lacpdu packet on a given port 747 * @port: the port we're looking at 748 * 749 * Returns: 0 on success 750 * < 0 on error 751 */ 752 static int ad_lacpdu_send(struct port *port) 753 { 754 struct slave *slave = port->slave; 755 struct sk_buff *skb; 756 struct lacpdu_header *lacpdu_header; 757 int length = sizeof(struct lacpdu_header); 758 759 skb = dev_alloc_skb(length); 760 if (!skb) 761 return -ENOMEM; 762 763 skb->dev = slave->dev; 764 skb_reset_mac_header(skb); 765 skb->network_header = skb->mac_header + ETH_HLEN; 766 skb->protocol = PKT_TYPE_LACPDU; 767 skb->priority = TC_PRIO_CONTROL; 768 769 lacpdu_header = (struct lacpdu_header *)skb_put(skb, length); 770 771 memcpy(lacpdu_header->hdr.h_dest, lacpdu_mcast_addr, ETH_ALEN); 772 /* Note: source address is set to be the member's PERMANENT address, 773 * because we use it to identify loopback lacpdus in receive. 774 */ 775 memcpy(lacpdu_header->hdr.h_source, slave->perm_hwaddr, ETH_ALEN); 776 lacpdu_header->hdr.h_proto = PKT_TYPE_LACPDU; 777 778 lacpdu_header->lacpdu = port->lacpdu; 779 780 dev_queue_xmit(skb); 781 782 return 0; 783 } 784 785 /** 786 * ad_marker_send - send marker information/response on a given port 787 * @port: the port we're looking at 788 * @marker: marker data to send 789 * 790 * Returns: 0 on success 791 * < 0 on error 792 */ 793 static int ad_marker_send(struct port *port, struct bond_marker *marker) 794 { 795 struct slave *slave = port->slave; 796 struct sk_buff *skb; 797 struct bond_marker_header *marker_header; 798 int length = sizeof(struct bond_marker_header); 799 800 skb = dev_alloc_skb(length + 16); 801 if (!skb) 802 return -ENOMEM; 803 804 skb_reserve(skb, 16); 805 806 skb->dev = slave->dev; 807 skb_reset_mac_header(skb); 808 skb->network_header = skb->mac_header + ETH_HLEN; 809 skb->protocol = PKT_TYPE_LACPDU; 810 811 marker_header = (struct bond_marker_header *)skb_put(skb, length); 812 813 memcpy(marker_header->hdr.h_dest, lacpdu_mcast_addr, ETH_ALEN); 814 /* Note: source address is set to be the member's PERMANENT address, 815 * because we use it to identify loopback MARKERs in receive. 816 */ 817 memcpy(marker_header->hdr.h_source, slave->perm_hwaddr, ETH_ALEN); 818 marker_header->hdr.h_proto = PKT_TYPE_LACPDU; 819 820 marker_header->marker = *marker; 821 822 dev_queue_xmit(skb); 823 824 return 0; 825 } 826 827 /** 828 * ad_mux_machine - handle a port's mux state machine 829 * @port: the port we're looking at 830 */ 831 static void ad_mux_machine(struct port *port) 832 { 833 mux_states_t last_state; 834 835 /* keep current State Machine state to compare later if it was 836 * changed 837 */ 838 last_state = port->sm_mux_state; 839 840 if (port->sm_vars & AD_PORT_BEGIN) { 841 port->sm_mux_state = AD_MUX_DETACHED; 842 } else { 843 switch (port->sm_mux_state) { 844 case AD_MUX_DETACHED: 845 if ((port->sm_vars & AD_PORT_SELECTED) 846 || (port->sm_vars & AD_PORT_STANDBY)) 847 /* if SELECTED or STANDBY */ 848 port->sm_mux_state = AD_MUX_WAITING; 849 break; 850 case AD_MUX_WAITING: 851 /* if SELECTED == FALSE return to DETACH state */ 852 if (!(port->sm_vars & AD_PORT_SELECTED)) { 853 port->sm_vars &= ~AD_PORT_READY_N; 854 /* in order to withhold the Selection Logic to 855 * check all ports READY_N value every callback 856 * cycle to update ready variable, we check 857 * READY_N and update READY here 858 */ 859 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator)); 860 port->sm_mux_state = AD_MUX_DETACHED; 861 break; 862 } 863 864 /* check if the wait_while_timer expired */ 865 if (port->sm_mux_timer_counter 866 && !(--port->sm_mux_timer_counter)) 867 port->sm_vars |= AD_PORT_READY_N; 868 869 /* in order to withhold the selection logic to check 870 * all ports READY_N value every callback cycle to 871 * update ready variable, we check READY_N and update 872 * READY here 873 */ 874 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator)); 875 876 /* if the wait_while_timer expired, and the port is 877 * in READY state, move to ATTACHED state 878 */ 879 if ((port->sm_vars & AD_PORT_READY) 880 && !port->sm_mux_timer_counter) 881 port->sm_mux_state = AD_MUX_ATTACHED; 882 break; 883 case AD_MUX_ATTACHED: 884 /* check also if agg_select_timer expired (so the 885 * edable port will take place only after this timer) 886 */ 887 if ((port->sm_vars & AD_PORT_SELECTED) && 888 (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) && 889 !__check_agg_selection_timer(port)) { 890 port->sm_mux_state = AD_MUX_COLLECTING_DISTRIBUTING; 891 } else if (!(port->sm_vars & AD_PORT_SELECTED) || 892 (port->sm_vars & AD_PORT_STANDBY)) { 893 /* if UNSELECTED or STANDBY */ 894 port->sm_vars &= ~AD_PORT_READY_N; 895 /* in order to withhold the selection logic to 896 * check all ports READY_N value every callback 897 * cycle to update ready variable, we check 898 * READY_N and update READY here 899 */ 900 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator)); 901 port->sm_mux_state = AD_MUX_DETACHED; 902 } 903 break; 904 case AD_MUX_COLLECTING_DISTRIBUTING: 905 if (!(port->sm_vars & AD_PORT_SELECTED) || 906 (port->sm_vars & AD_PORT_STANDBY) || 907 !(port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION)) { 908 port->sm_mux_state = AD_MUX_ATTACHED; 909 } else { 910 /* if port state hasn't changed make 911 * sure that a collecting distributing 912 * port in an active aggregator is enabled 913 */ 914 if (port->aggregator && 915 port->aggregator->is_active && 916 !__port_is_enabled(port)) { 917 918 __enable_port(port); 919 } 920 } 921 break; 922 default: 923 break; 924 } 925 } 926 927 /* check if the state machine was changed */ 928 if (port->sm_mux_state != last_state) { 929 pr_debug("Mux Machine: Port=%d, Last State=%d, Curr State=%d\n", 930 port->actor_port_number, last_state, 931 port->sm_mux_state); 932 switch (port->sm_mux_state) { 933 case AD_MUX_DETACHED: 934 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION; 935 ad_disable_collecting_distributing(port); 936 port->actor_oper_port_state &= ~AD_STATE_COLLECTING; 937 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING; 938 port->ntt = true; 939 break; 940 case AD_MUX_WAITING: 941 port->sm_mux_timer_counter = __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER, 0); 942 break; 943 case AD_MUX_ATTACHED: 944 port->actor_oper_port_state |= AD_STATE_SYNCHRONIZATION; 945 port->actor_oper_port_state &= ~AD_STATE_COLLECTING; 946 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING; 947 ad_disable_collecting_distributing(port); 948 port->ntt = true; 949 break; 950 case AD_MUX_COLLECTING_DISTRIBUTING: 951 port->actor_oper_port_state |= AD_STATE_COLLECTING; 952 port->actor_oper_port_state |= AD_STATE_DISTRIBUTING; 953 ad_enable_collecting_distributing(port); 954 port->ntt = true; 955 break; 956 default: 957 break; 958 } 959 } 960 } 961 962 /** 963 * ad_rx_machine - handle a port's rx State Machine 964 * @lacpdu: the lacpdu we've received 965 * @port: the port we're looking at 966 * 967 * If lacpdu arrived, stop previous timer (if exists) and set the next state as 968 * CURRENT. If timer expired set the state machine in the proper state. 969 * In other cases, this function checks if we need to switch to other state. 970 */ 971 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port) 972 { 973 rx_states_t last_state; 974 975 /* keep current State Machine state to compare later if it was 976 * changed 977 */ 978 last_state = port->sm_rx_state; 979 980 /* check if state machine should change state */ 981 982 /* first, check if port was reinitialized */ 983 if (port->sm_vars & AD_PORT_BEGIN) 984 port->sm_rx_state = AD_RX_INITIALIZE; 985 /* check if port is not enabled */ 986 else if (!(port->sm_vars & AD_PORT_BEGIN) 987 && !port->is_enabled && !(port->sm_vars & AD_PORT_MOVED)) 988 port->sm_rx_state = AD_RX_PORT_DISABLED; 989 /* check if new lacpdu arrived */ 990 else if (lacpdu && ((port->sm_rx_state == AD_RX_EXPIRED) || 991 (port->sm_rx_state == AD_RX_DEFAULTED) || 992 (port->sm_rx_state == AD_RX_CURRENT))) { 993 port->sm_rx_timer_counter = 0; 994 port->sm_rx_state = AD_RX_CURRENT; 995 } else { 996 /* if timer is on, and if it is expired */ 997 if (port->sm_rx_timer_counter && 998 !(--port->sm_rx_timer_counter)) { 999 switch (port->sm_rx_state) { 1000 case AD_RX_EXPIRED: 1001 port->sm_rx_state = AD_RX_DEFAULTED; 1002 break; 1003 case AD_RX_CURRENT: 1004 port->sm_rx_state = AD_RX_EXPIRED; 1005 break; 1006 default: 1007 break; 1008 } 1009 } else { 1010 /* if no lacpdu arrived and no timer is on */ 1011 switch (port->sm_rx_state) { 1012 case AD_RX_PORT_DISABLED: 1013 if (port->sm_vars & AD_PORT_MOVED) 1014 port->sm_rx_state = AD_RX_INITIALIZE; 1015 else if (port->is_enabled 1016 && (port->sm_vars 1017 & AD_PORT_LACP_ENABLED)) 1018 port->sm_rx_state = AD_RX_EXPIRED; 1019 else if (port->is_enabled 1020 && ((port->sm_vars 1021 & AD_PORT_LACP_ENABLED) == 0)) 1022 port->sm_rx_state = AD_RX_LACP_DISABLED; 1023 break; 1024 default: 1025 break; 1026 1027 } 1028 } 1029 } 1030 1031 /* check if the State machine was changed or new lacpdu arrived */ 1032 if ((port->sm_rx_state != last_state) || (lacpdu)) { 1033 pr_debug("Rx Machine: Port=%d, Last State=%d, Curr State=%d\n", 1034 port->actor_port_number, last_state, 1035 port->sm_rx_state); 1036 switch (port->sm_rx_state) { 1037 case AD_RX_INITIALIZE: 1038 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_BITS)) 1039 port->sm_vars &= ~AD_PORT_LACP_ENABLED; 1040 else 1041 port->sm_vars |= AD_PORT_LACP_ENABLED; 1042 port->sm_vars &= ~AD_PORT_SELECTED; 1043 __record_default(port); 1044 port->actor_oper_port_state &= ~AD_STATE_EXPIRED; 1045 port->sm_vars &= ~AD_PORT_MOVED; 1046 port->sm_rx_state = AD_RX_PORT_DISABLED; 1047 1048 /* Fall Through */ 1049 case AD_RX_PORT_DISABLED: 1050 port->sm_vars &= ~AD_PORT_MATCHED; 1051 break; 1052 case AD_RX_LACP_DISABLED: 1053 port->sm_vars &= ~AD_PORT_SELECTED; 1054 __record_default(port); 1055 port->partner_oper.port_state &= ~AD_STATE_AGGREGATION; 1056 port->sm_vars |= AD_PORT_MATCHED; 1057 port->actor_oper_port_state &= ~AD_STATE_EXPIRED; 1058 break; 1059 case AD_RX_EXPIRED: 1060 /* Reset of the Synchronization flag (Standard 43.4.12) 1061 * This reset cause to disable this port in the 1062 * COLLECTING_DISTRIBUTING state of the mux machine in 1063 * case of EXPIRED even if LINK_DOWN didn't arrive for 1064 * the port. 1065 */ 1066 port->partner_oper.port_state &= ~AD_STATE_SYNCHRONIZATION; 1067 port->sm_vars &= ~AD_PORT_MATCHED; 1068 port->partner_oper.port_state |= AD_STATE_LACP_ACTIVITY; 1069 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT)); 1070 port->actor_oper_port_state |= AD_STATE_EXPIRED; 1071 break; 1072 case AD_RX_DEFAULTED: 1073 __update_default_selected(port); 1074 __record_default(port); 1075 port->sm_vars |= AD_PORT_MATCHED; 1076 port->actor_oper_port_state &= ~AD_STATE_EXPIRED; 1077 break; 1078 case AD_RX_CURRENT: 1079 /* detect loopback situation */ 1080 if (MAC_ADDRESS_EQUAL(&(lacpdu->actor_system), 1081 &(port->actor_system))) { 1082 pr_err("%s: An illegal loopback occurred on adapter (%s).\nCheck the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n", 1083 port->slave->bond->dev->name, 1084 port->slave->dev->name); 1085 return; 1086 } 1087 __update_selected(lacpdu, port); 1088 __update_ntt(lacpdu, port); 1089 __record_pdu(lacpdu, port); 1090 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT)); 1091 port->actor_oper_port_state &= ~AD_STATE_EXPIRED; 1092 break; 1093 default: 1094 break; 1095 } 1096 } 1097 } 1098 1099 /** 1100 * ad_tx_machine - handle a port's tx state machine 1101 * @port: the port we're looking at 1102 */ 1103 static void ad_tx_machine(struct port *port) 1104 { 1105 /* check if tx timer expired, to verify that we do not send more than 1106 * 3 packets per second 1107 */ 1108 if (port->sm_tx_timer_counter && !(--port->sm_tx_timer_counter)) { 1109 /* check if there is something to send */ 1110 if (port->ntt && (port->sm_vars & AD_PORT_LACP_ENABLED)) { 1111 __update_lacpdu_from_port(port); 1112 1113 if (ad_lacpdu_send(port) >= 0) { 1114 pr_debug("Sent LACPDU on port %d\n", 1115 port->actor_port_number); 1116 1117 /* mark ntt as false, so it will not be sent 1118 * again until demanded 1119 */ 1120 port->ntt = false; 1121 } 1122 } 1123 /* restart tx timer(to verify that we will not exceed 1124 * AD_MAX_TX_IN_SECOND 1125 */ 1126 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND; 1127 } 1128 } 1129 1130 /** 1131 * ad_periodic_machine - handle a port's periodic state machine 1132 * @port: the port we're looking at 1133 * 1134 * Turn ntt flag on priodically to perform periodic transmission of lacpdu's. 1135 */ 1136 static void ad_periodic_machine(struct port *port) 1137 { 1138 periodic_states_t last_state; 1139 1140 /* keep current state machine state to compare later if it was changed */ 1141 last_state = port->sm_periodic_state; 1142 1143 /* check if port was reinitialized */ 1144 if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) || 1145 (!(port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & AD_STATE_LACP_ACTIVITY)) 1146 ) { 1147 port->sm_periodic_state = AD_NO_PERIODIC; 1148 } 1149 /* check if state machine should change state */ 1150 else if (port->sm_periodic_timer_counter) { 1151 /* check if periodic state machine expired */ 1152 if (!(--port->sm_periodic_timer_counter)) { 1153 /* if expired then do tx */ 1154 port->sm_periodic_state = AD_PERIODIC_TX; 1155 } else { 1156 /* If not expired, check if there is some new timeout 1157 * parameter from the partner state 1158 */ 1159 switch (port->sm_periodic_state) { 1160 case AD_FAST_PERIODIC: 1161 if (!(port->partner_oper.port_state 1162 & AD_STATE_LACP_TIMEOUT)) 1163 port->sm_periodic_state = AD_SLOW_PERIODIC; 1164 break; 1165 case AD_SLOW_PERIODIC: 1166 if ((port->partner_oper.port_state & AD_STATE_LACP_TIMEOUT)) { 1167 port->sm_periodic_timer_counter = 0; 1168 port->sm_periodic_state = AD_PERIODIC_TX; 1169 } 1170 break; 1171 default: 1172 break; 1173 } 1174 } 1175 } else { 1176 switch (port->sm_periodic_state) { 1177 case AD_NO_PERIODIC: 1178 port->sm_periodic_state = AD_FAST_PERIODIC; 1179 break; 1180 case AD_PERIODIC_TX: 1181 if (!(port->partner_oper.port_state & 1182 AD_STATE_LACP_TIMEOUT)) 1183 port->sm_periodic_state = AD_SLOW_PERIODIC; 1184 else 1185 port->sm_periodic_state = AD_FAST_PERIODIC; 1186 break; 1187 default: 1188 break; 1189 } 1190 } 1191 1192 /* check if the state machine was changed */ 1193 if (port->sm_periodic_state != last_state) { 1194 pr_debug("Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n", 1195 port->actor_port_number, last_state, 1196 port->sm_periodic_state); 1197 switch (port->sm_periodic_state) { 1198 case AD_NO_PERIODIC: 1199 port->sm_periodic_timer_counter = 0; 1200 break; 1201 case AD_FAST_PERIODIC: 1202 /* decrement 1 tick we lost in the PERIODIC_TX cycle */ 1203 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_FAST_PERIODIC_TIME))-1; 1204 break; 1205 case AD_SLOW_PERIODIC: 1206 /* decrement 1 tick we lost in the PERIODIC_TX cycle */ 1207 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_SLOW_PERIODIC_TIME))-1; 1208 break; 1209 case AD_PERIODIC_TX: 1210 port->ntt = true; 1211 break; 1212 default: 1213 break; 1214 } 1215 } 1216 } 1217 1218 /** 1219 * ad_port_selection_logic - select aggregation groups 1220 * @port: the port we're looking at 1221 * 1222 * Select aggregation groups, and assign each port for it's aggregetor. The 1223 * selection logic is called in the inititalization (after all the handshkes), 1224 * and after every lacpdu receive (if selected is off). 1225 */ 1226 static void ad_port_selection_logic(struct port *port) 1227 { 1228 struct aggregator *aggregator, *free_aggregator = NULL, *temp_aggregator; 1229 struct port *last_port = NULL, *curr_port; 1230 struct list_head *iter; 1231 struct bonding *bond; 1232 struct slave *slave; 1233 int found = 0; 1234 1235 /* if the port is already Selected, do nothing */ 1236 if (port->sm_vars & AD_PORT_SELECTED) 1237 return; 1238 1239 bond = __get_bond_by_port(port); 1240 1241 /* if the port is connected to other aggregator, detach it */ 1242 if (port->aggregator) { 1243 /* detach the port from its former aggregator */ 1244 temp_aggregator = port->aggregator; 1245 for (curr_port = temp_aggregator->lag_ports; curr_port; 1246 last_port = curr_port, 1247 curr_port = curr_port->next_port_in_aggregator) { 1248 if (curr_port == port) { 1249 temp_aggregator->num_of_ports--; 1250 /* if it is the first port attached to the 1251 * aggregator 1252 */ 1253 if (!last_port) { 1254 temp_aggregator->lag_ports = 1255 port->next_port_in_aggregator; 1256 } else { 1257 /* not the first port attached to the 1258 * aggregator 1259 */ 1260 last_port->next_port_in_aggregator = 1261 port->next_port_in_aggregator; 1262 } 1263 1264 /* clear the port's relations to this 1265 * aggregator 1266 */ 1267 port->aggregator = NULL; 1268 port->next_port_in_aggregator = NULL; 1269 port->actor_port_aggregator_identifier = 0; 1270 1271 pr_debug("Port %d left LAG %d\n", 1272 port->actor_port_number, 1273 temp_aggregator->aggregator_identifier); 1274 /* if the aggregator is empty, clear its 1275 * parameters, and set it ready to be attached 1276 */ 1277 if (!temp_aggregator->lag_ports) 1278 ad_clear_agg(temp_aggregator); 1279 break; 1280 } 1281 } 1282 if (!curr_port) { 1283 /* meaning: the port was related to an aggregator 1284 * but was not on the aggregator port list 1285 */ 1286 pr_warn("%s: Warning: Port %d (on %s) was related to aggregator %d but was not on its port list\n", 1287 port->slave->bond->dev->name, 1288 port->actor_port_number, 1289 port->slave->dev->name, 1290 port->aggregator->aggregator_identifier); 1291 } 1292 } 1293 /* search on all aggregators for a suitable aggregator for this port */ 1294 bond_for_each_slave(bond, slave, iter) { 1295 aggregator = &(SLAVE_AD_INFO(slave).aggregator); 1296 1297 /* keep a free aggregator for later use(if needed) */ 1298 if (!aggregator->lag_ports) { 1299 if (!free_aggregator) 1300 free_aggregator = aggregator; 1301 continue; 1302 } 1303 /* check if current aggregator suits us */ 1304 if (((aggregator->actor_oper_aggregator_key == port->actor_oper_port_key) && /* if all parameters match AND */ 1305 MAC_ADDRESS_EQUAL(&(aggregator->partner_system), &(port->partner_oper.system)) && 1306 (aggregator->partner_system_priority == port->partner_oper.system_priority) && 1307 (aggregator->partner_oper_aggregator_key == port->partner_oper.key) 1308 ) && 1309 ((!MAC_ADDRESS_EQUAL(&(port->partner_oper.system), &(null_mac_addr)) && /* partner answers */ 1310 !aggregator->is_individual) /* but is not individual OR */ 1311 ) 1312 ) { 1313 /* attach to the founded aggregator */ 1314 port->aggregator = aggregator; 1315 port->actor_port_aggregator_identifier = 1316 port->aggregator->aggregator_identifier; 1317 port->next_port_in_aggregator = aggregator->lag_ports; 1318 port->aggregator->num_of_ports++; 1319 aggregator->lag_ports = port; 1320 pr_debug("Port %d joined LAG %d(existing LAG)\n", 1321 port->actor_port_number, 1322 port->aggregator->aggregator_identifier); 1323 1324 /* mark this port as selected */ 1325 port->sm_vars |= AD_PORT_SELECTED; 1326 found = 1; 1327 break; 1328 } 1329 } 1330 1331 /* the port couldn't find an aggregator - attach it to a new 1332 * aggregator 1333 */ 1334 if (!found) { 1335 if (free_aggregator) { 1336 /* assign port a new aggregator */ 1337 port->aggregator = free_aggregator; 1338 port->actor_port_aggregator_identifier = 1339 port->aggregator->aggregator_identifier; 1340 1341 /* update the new aggregator's parameters 1342 * if port was responsed from the end-user 1343 */ 1344 if (port->actor_oper_port_key & AD_DUPLEX_KEY_BITS) 1345 /* if port is full duplex */ 1346 port->aggregator->is_individual = false; 1347 else 1348 port->aggregator->is_individual = true; 1349 1350 port->aggregator->actor_admin_aggregator_key = port->actor_admin_port_key; 1351 port->aggregator->actor_oper_aggregator_key = port->actor_oper_port_key; 1352 port->aggregator->partner_system = 1353 port->partner_oper.system; 1354 port->aggregator->partner_system_priority = 1355 port->partner_oper.system_priority; 1356 port->aggregator->partner_oper_aggregator_key = port->partner_oper.key; 1357 port->aggregator->receive_state = 1; 1358 port->aggregator->transmit_state = 1; 1359 port->aggregator->lag_ports = port; 1360 port->aggregator->num_of_ports++; 1361 1362 /* mark this port as selected */ 1363 port->sm_vars |= AD_PORT_SELECTED; 1364 1365 pr_debug("Port %d joined LAG %d(new LAG)\n", 1366 port->actor_port_number, 1367 port->aggregator->aggregator_identifier); 1368 } else { 1369 pr_err("%s: Port %d (on %s) did not find a suitable aggregator\n", 1370 port->slave->bond->dev->name, 1371 port->actor_port_number, port->slave->dev->name); 1372 } 1373 } 1374 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE 1375 * in all aggregator's ports, else set ready=FALSE in all 1376 * aggregator's ports 1377 */ 1378 __set_agg_ports_ready(port->aggregator, 1379 __agg_ports_are_ready(port->aggregator)); 1380 1381 aggregator = __get_first_agg(port); 1382 ad_agg_selection_logic(aggregator); 1383 } 1384 1385 /* Decide if "agg" is a better choice for the new active aggregator that 1386 * the current best, according to the ad_select policy. 1387 */ 1388 static struct aggregator *ad_agg_selection_test(struct aggregator *best, 1389 struct aggregator *curr) 1390 { 1391 /* 0. If no best, select current. 1392 * 1393 * 1. If the current agg is not individual, and the best is 1394 * individual, select current. 1395 * 1396 * 2. If current agg is individual and the best is not, keep best. 1397 * 1398 * 3. Therefore, current and best are both individual or both not 1399 * individual, so: 1400 * 1401 * 3a. If current agg partner replied, and best agg partner did not, 1402 * select current. 1403 * 1404 * 3b. If current agg partner did not reply and best agg partner 1405 * did reply, keep best. 1406 * 1407 * 4. Therefore, current and best both have partner replies or 1408 * both do not, so perform selection policy: 1409 * 1410 * BOND_AD_COUNT: Select by count of ports. If count is equal, 1411 * select by bandwidth. 1412 * 1413 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth. 1414 */ 1415 if (!best) 1416 return curr; 1417 1418 if (!curr->is_individual && best->is_individual) 1419 return curr; 1420 1421 if (curr->is_individual && !best->is_individual) 1422 return best; 1423 1424 if (__agg_has_partner(curr) && !__agg_has_partner(best)) 1425 return curr; 1426 1427 if (!__agg_has_partner(curr) && __agg_has_partner(best)) 1428 return best; 1429 1430 switch (__get_agg_selection_mode(curr->lag_ports)) { 1431 case BOND_AD_COUNT: 1432 if (curr->num_of_ports > best->num_of_ports) 1433 return curr; 1434 1435 if (curr->num_of_ports < best->num_of_ports) 1436 return best; 1437 1438 /*FALLTHROUGH*/ 1439 case BOND_AD_STABLE: 1440 case BOND_AD_BANDWIDTH: 1441 if (__get_agg_bandwidth(curr) > __get_agg_bandwidth(best)) 1442 return curr; 1443 1444 break; 1445 1446 default: 1447 pr_warn("%s: Impossible agg select mode %d\n", 1448 curr->slave->bond->dev->name, 1449 __get_agg_selection_mode(curr->lag_ports)); 1450 break; 1451 } 1452 1453 return best; 1454 } 1455 1456 static int agg_device_up(const struct aggregator *agg) 1457 { 1458 struct port *port = agg->lag_ports; 1459 1460 if (!port) 1461 return 0; 1462 1463 return netif_running(port->slave->dev) && 1464 netif_carrier_ok(port->slave->dev); 1465 } 1466 1467 /** 1468 * ad_agg_selection_logic - select an aggregation group for a team 1469 * @aggregator: the aggregator we're looking at 1470 * 1471 * It is assumed that only one aggregator may be selected for a team. 1472 * 1473 * The logic of this function is to select the aggregator according to 1474 * the ad_select policy: 1475 * 1476 * BOND_AD_STABLE: select the aggregator with the most ports attached to 1477 * it, and to reselect the active aggregator only if the previous 1478 * aggregator has no more ports related to it. 1479 * 1480 * BOND_AD_BANDWIDTH: select the aggregator with the highest total 1481 * bandwidth, and reselect whenever a link state change takes place or the 1482 * set of slaves in the bond changes. 1483 * 1484 * BOND_AD_COUNT: select the aggregator with largest number of ports 1485 * (slaves), and reselect whenever a link state change takes place or the 1486 * set of slaves in the bond changes. 1487 * 1488 * FIXME: this function MUST be called with the first agg in the bond, or 1489 * __get_active_agg() won't work correctly. This function should be better 1490 * called with the bond itself, and retrieve the first agg from it. 1491 */ 1492 static void ad_agg_selection_logic(struct aggregator *agg) 1493 { 1494 struct aggregator *best, *active, *origin; 1495 struct bonding *bond = agg->slave->bond; 1496 struct list_head *iter; 1497 struct slave *slave; 1498 struct port *port; 1499 1500 rcu_read_lock(); 1501 origin = agg; 1502 active = __get_active_agg(agg); 1503 best = (active && agg_device_up(active)) ? active : NULL; 1504 1505 bond_for_each_slave_rcu(bond, slave, iter) { 1506 agg = &(SLAVE_AD_INFO(slave).aggregator); 1507 1508 agg->is_active = 0; 1509 1510 if (agg->num_of_ports && agg_device_up(agg)) 1511 best = ad_agg_selection_test(best, agg); 1512 } 1513 1514 if (best && 1515 __get_agg_selection_mode(best->lag_ports) == BOND_AD_STABLE) { 1516 /* For the STABLE policy, don't replace the old active 1517 * aggregator if it's still active (it has an answering 1518 * partner) or if both the best and active don't have an 1519 * answering partner. 1520 */ 1521 if (active && active->lag_ports && 1522 active->lag_ports->is_enabled && 1523 (__agg_has_partner(active) || 1524 (!__agg_has_partner(active) && 1525 !__agg_has_partner(best)))) { 1526 if (!(!active->actor_oper_aggregator_key && 1527 best->actor_oper_aggregator_key)) { 1528 best = NULL; 1529 active->is_active = 1; 1530 } 1531 } 1532 } 1533 1534 if (best && (best == active)) { 1535 best = NULL; 1536 active->is_active = 1; 1537 } 1538 1539 /* if there is new best aggregator, activate it */ 1540 if (best) { 1541 pr_debug("best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n", 1542 best->aggregator_identifier, best->num_of_ports, 1543 best->actor_oper_aggregator_key, 1544 best->partner_oper_aggregator_key, 1545 best->is_individual, best->is_active); 1546 pr_debug("best ports %p slave %p %s\n", 1547 best->lag_ports, best->slave, 1548 best->slave ? best->slave->dev->name : "NULL"); 1549 1550 bond_for_each_slave_rcu(bond, slave, iter) { 1551 agg = &(SLAVE_AD_INFO(slave).aggregator); 1552 1553 pr_debug("Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n", 1554 agg->aggregator_identifier, agg->num_of_ports, 1555 agg->actor_oper_aggregator_key, 1556 agg->partner_oper_aggregator_key, 1557 agg->is_individual, agg->is_active); 1558 } 1559 1560 /* check if any partner replys */ 1561 if (best->is_individual) { 1562 pr_warn("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n", 1563 best->slave ? 1564 best->slave->bond->dev->name : "NULL"); 1565 } 1566 1567 best->is_active = 1; 1568 pr_debug("LAG %d chosen as the active LAG\n", 1569 best->aggregator_identifier); 1570 pr_debug("Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n", 1571 best->aggregator_identifier, best->num_of_ports, 1572 best->actor_oper_aggregator_key, 1573 best->partner_oper_aggregator_key, 1574 best->is_individual, best->is_active); 1575 1576 /* disable the ports that were related to the former 1577 * active_aggregator 1578 */ 1579 if (active) { 1580 for (port = active->lag_ports; port; 1581 port = port->next_port_in_aggregator) { 1582 __disable_port(port); 1583 } 1584 } 1585 } 1586 1587 /* if the selected aggregator is of join individuals 1588 * (partner_system is NULL), enable their ports 1589 */ 1590 active = __get_active_agg(origin); 1591 1592 if (active) { 1593 if (!__agg_has_partner(active)) { 1594 for (port = active->lag_ports; port; 1595 port = port->next_port_in_aggregator) { 1596 __enable_port(port); 1597 } 1598 } 1599 } 1600 1601 rcu_read_unlock(); 1602 1603 bond_3ad_set_carrier(bond); 1604 } 1605 1606 /** 1607 * ad_clear_agg - clear a given aggregator's parameters 1608 * @aggregator: the aggregator we're looking at 1609 */ 1610 static void ad_clear_agg(struct aggregator *aggregator) 1611 { 1612 if (aggregator) { 1613 aggregator->is_individual = false; 1614 aggregator->actor_admin_aggregator_key = 0; 1615 aggregator->actor_oper_aggregator_key = 0; 1616 aggregator->partner_system = null_mac_addr; 1617 aggregator->partner_system_priority = 0; 1618 aggregator->partner_oper_aggregator_key = 0; 1619 aggregator->receive_state = 0; 1620 aggregator->transmit_state = 0; 1621 aggregator->lag_ports = NULL; 1622 aggregator->is_active = 0; 1623 aggregator->num_of_ports = 0; 1624 pr_debug("LAG %d was cleared\n", 1625 aggregator->aggregator_identifier); 1626 } 1627 } 1628 1629 /** 1630 * ad_initialize_agg - initialize a given aggregator's parameters 1631 * @aggregator: the aggregator we're looking at 1632 */ 1633 static void ad_initialize_agg(struct aggregator *aggregator) 1634 { 1635 if (aggregator) { 1636 ad_clear_agg(aggregator); 1637 1638 aggregator->aggregator_mac_address = null_mac_addr; 1639 aggregator->aggregator_identifier = 0; 1640 aggregator->slave = NULL; 1641 } 1642 } 1643 1644 /** 1645 * ad_initialize_port - initialize a given port's parameters 1646 * @aggregator: the aggregator we're looking at 1647 * @lacp_fast: boolean. whether fast periodic should be used 1648 */ 1649 static void ad_initialize_port(struct port *port, int lacp_fast) 1650 { 1651 static const struct port_params tmpl = { 1652 .system_priority = 0xffff, 1653 .key = 1, 1654 .port_number = 1, 1655 .port_priority = 0xff, 1656 .port_state = 1, 1657 }; 1658 static const struct lacpdu lacpdu = { 1659 .subtype = 0x01, 1660 .version_number = 0x01, 1661 .tlv_type_actor_info = 0x01, 1662 .actor_information_length = 0x14, 1663 .tlv_type_partner_info = 0x02, 1664 .partner_information_length = 0x14, 1665 .tlv_type_collector_info = 0x03, 1666 .collector_information_length = 0x10, 1667 .collector_max_delay = htons(AD_COLLECTOR_MAX_DELAY), 1668 }; 1669 1670 if (port) { 1671 port->actor_port_number = 1; 1672 port->actor_port_priority = 0xff; 1673 port->actor_system = null_mac_addr; 1674 port->actor_system_priority = 0xffff; 1675 port->actor_port_aggregator_identifier = 0; 1676 port->ntt = false; 1677 port->actor_admin_port_key = 1; 1678 port->actor_oper_port_key = 1; 1679 port->actor_admin_port_state = AD_STATE_AGGREGATION | 1680 AD_STATE_LACP_ACTIVITY; 1681 port->actor_oper_port_state = AD_STATE_AGGREGATION | 1682 AD_STATE_LACP_ACTIVITY; 1683 1684 if (lacp_fast) 1685 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT; 1686 1687 memcpy(&port->partner_admin, &tmpl, sizeof(tmpl)); 1688 memcpy(&port->partner_oper, &tmpl, sizeof(tmpl)); 1689 1690 port->is_enabled = true; 1691 /* private parameters */ 1692 port->sm_vars = 0x3; 1693 port->sm_rx_state = 0; 1694 port->sm_rx_timer_counter = 0; 1695 port->sm_periodic_state = 0; 1696 port->sm_periodic_timer_counter = 0; 1697 port->sm_mux_state = 0; 1698 port->sm_mux_timer_counter = 0; 1699 port->sm_tx_state = 0; 1700 port->sm_tx_timer_counter = 0; 1701 port->slave = NULL; 1702 port->aggregator = NULL; 1703 port->next_port_in_aggregator = NULL; 1704 port->transaction_id = 0; 1705 1706 memcpy(&port->lacpdu, &lacpdu, sizeof(lacpdu)); 1707 } 1708 } 1709 1710 /** 1711 * ad_enable_collecting_distributing - enable a port's transmit/receive 1712 * @port: the port we're looking at 1713 * 1714 * Enable @port if it's in an active aggregator 1715 */ 1716 static void ad_enable_collecting_distributing(struct port *port) 1717 { 1718 if (port->aggregator->is_active) { 1719 pr_debug("Enabling port %d(LAG %d)\n", 1720 port->actor_port_number, 1721 port->aggregator->aggregator_identifier); 1722 __enable_port(port); 1723 } 1724 } 1725 1726 /** 1727 * ad_disable_collecting_distributing - disable a port's transmit/receive 1728 * @port: the port we're looking at 1729 */ 1730 static void ad_disable_collecting_distributing(struct port *port) 1731 { 1732 if (port->aggregator && 1733 !MAC_ADDRESS_EQUAL(&(port->aggregator->partner_system), 1734 &(null_mac_addr))) { 1735 pr_debug("Disabling port %d(LAG %d)\n", 1736 port->actor_port_number, 1737 port->aggregator->aggregator_identifier); 1738 __disable_port(port); 1739 } 1740 } 1741 1742 /** 1743 * ad_marker_info_received - handle receive of a Marker information frame 1744 * @marker_info: Marker info received 1745 * @port: the port we're looking at 1746 */ 1747 static void ad_marker_info_received(struct bond_marker *marker_info, 1748 struct port *port) 1749 { 1750 struct bond_marker marker; 1751 1752 /* copy the received marker data to the response marker */ 1753 memcpy(&marker, marker_info, sizeof(struct bond_marker)); 1754 /* change the marker subtype to marker response */ 1755 marker.tlv_type = AD_MARKER_RESPONSE_SUBTYPE; 1756 1757 /* send the marker response */ 1758 if (ad_marker_send(port, &marker) >= 0) { 1759 pr_debug("Sent Marker Response on port %d\n", 1760 port->actor_port_number); 1761 } 1762 } 1763 1764 /** 1765 * ad_marker_response_received - handle receive of a marker response frame 1766 * @marker: marker PDU received 1767 * @port: the port we're looking at 1768 * 1769 * This function does nothing since we decided not to implement send and handle 1770 * response for marker PDU's, in this stage, but only to respond to marker 1771 * information. 1772 */ 1773 static void ad_marker_response_received(struct bond_marker *marker, 1774 struct port *port) 1775 { 1776 marker = NULL; 1777 port = NULL; 1778 /* DO NOTHING, SINCE WE DECIDED NOT TO IMPLEMENT THIS FEATURE FOR NOW */ 1779 } 1780 1781 /* ========= AD exported functions to the main bonding code ========= */ 1782 1783 /* Check aggregators status in team every T seconds */ 1784 #define AD_AGGREGATOR_SELECTION_TIMER 8 1785 1786 /** 1787 * bond_3ad_initiate_agg_selection - initate aggregator selection 1788 * @bond: bonding struct 1789 * 1790 * Set the aggregation selection timer, to initiate an agg selection in 1791 * the very near future. Called during first initialization, and during 1792 * any down to up transitions of the bond. 1793 */ 1794 void bond_3ad_initiate_agg_selection(struct bonding *bond, int timeout) 1795 { 1796 BOND_AD_INFO(bond).agg_select_timer = timeout; 1797 } 1798 1799 static u16 aggregator_identifier; 1800 1801 /** 1802 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures 1803 * @bond: bonding struct to work on 1804 * @tick_resolution: tick duration (millisecond resolution) 1805 * 1806 * Can be called only after the mac address of the bond is set. 1807 */ 1808 void bond_3ad_initialize(struct bonding *bond, u16 tick_resolution) 1809 { 1810 /* check that the bond is not initialized yet */ 1811 if (!MAC_ADDRESS_EQUAL(&(BOND_AD_INFO(bond).system.sys_mac_addr), 1812 bond->dev->dev_addr)) { 1813 1814 aggregator_identifier = 0; 1815 1816 BOND_AD_INFO(bond).system.sys_priority = 0xFFFF; 1817 BOND_AD_INFO(bond).system.sys_mac_addr = *((struct mac_addr *)bond->dev->dev_addr); 1818 1819 /* initialize how many times this module is called in one 1820 * second (should be about every 100ms) 1821 */ 1822 ad_ticks_per_sec = tick_resolution; 1823 1824 bond_3ad_initiate_agg_selection(bond, 1825 AD_AGGREGATOR_SELECTION_TIMER * 1826 ad_ticks_per_sec); 1827 } 1828 } 1829 1830 /** 1831 * bond_3ad_bind_slave - initialize a slave's port 1832 * @slave: slave struct to work on 1833 * 1834 * Returns: 0 on success 1835 * < 0 on error 1836 */ 1837 void bond_3ad_bind_slave(struct slave *slave) 1838 { 1839 struct bonding *bond = bond_get_bond_by_slave(slave); 1840 struct port *port; 1841 struct aggregator *aggregator; 1842 1843 /* check that the slave has not been initialized yet. */ 1844 if (SLAVE_AD_INFO(slave).port.slave != slave) { 1845 1846 /* port initialization */ 1847 port = &(SLAVE_AD_INFO(slave).port); 1848 1849 ad_initialize_port(port, bond->params.lacp_fast); 1850 1851 __initialize_port_locks(slave); 1852 port->slave = slave; 1853 port->actor_port_number = SLAVE_AD_INFO(slave).id; 1854 /* key is determined according to the link speed, duplex and user key(which 1855 * is yet not supported) 1856 */ 1857 port->actor_admin_port_key = 0; 1858 port->actor_admin_port_key |= __get_duplex(port); 1859 port->actor_admin_port_key |= (__get_link_speed(port) << 1); 1860 port->actor_oper_port_key = port->actor_admin_port_key; 1861 /* if the port is not full duplex, then the port should be not 1862 * lacp Enabled 1863 */ 1864 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_BITS)) 1865 port->sm_vars &= ~AD_PORT_LACP_ENABLED; 1866 /* actor system is the bond's system */ 1867 port->actor_system = BOND_AD_INFO(bond).system.sys_mac_addr; 1868 /* tx timer(to verify that no more than MAX_TX_IN_SECOND 1869 * lacpdu's are sent in one second) 1870 */ 1871 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND; 1872 port->aggregator = NULL; 1873 port->next_port_in_aggregator = NULL; 1874 1875 __disable_port(port); 1876 1877 /* aggregator initialization */ 1878 aggregator = &(SLAVE_AD_INFO(slave).aggregator); 1879 1880 ad_initialize_agg(aggregator); 1881 1882 aggregator->aggregator_mac_address = *((struct mac_addr *)bond->dev->dev_addr); 1883 aggregator->aggregator_identifier = (++aggregator_identifier); 1884 aggregator->slave = slave; 1885 aggregator->is_active = 0; 1886 aggregator->num_of_ports = 0; 1887 } 1888 } 1889 1890 /** 1891 * bond_3ad_unbind_slave - deinitialize a slave's port 1892 * @slave: slave struct to work on 1893 * 1894 * Search for the aggregator that is related to this port, remove the 1895 * aggregator and assign another aggregator for other port related to it 1896 * (if any), and remove the port. 1897 */ 1898 void bond_3ad_unbind_slave(struct slave *slave) 1899 { 1900 struct port *port, *prev_port, *temp_port; 1901 struct aggregator *aggregator, *new_aggregator, *temp_aggregator; 1902 int select_new_active_agg = 0; 1903 struct bonding *bond = slave->bond; 1904 struct slave *slave_iter; 1905 struct list_head *iter; 1906 1907 aggregator = &(SLAVE_AD_INFO(slave).aggregator); 1908 port = &(SLAVE_AD_INFO(slave).port); 1909 1910 /* if slave is null, the whole port is not initialized */ 1911 if (!port->slave) { 1912 pr_warn("Warning: %s: Trying to unbind an uninitialized port on %s\n", 1913 slave->bond->dev->name, slave->dev->name); 1914 return; 1915 } 1916 1917 pr_debug("Unbinding Link Aggregation Group %d\n", 1918 aggregator->aggregator_identifier); 1919 1920 /* Tell the partner that this port is not suitable for aggregation */ 1921 port->actor_oper_port_state &= ~AD_STATE_AGGREGATION; 1922 __update_lacpdu_from_port(port); 1923 ad_lacpdu_send(port); 1924 1925 /* check if this aggregator is occupied */ 1926 if (aggregator->lag_ports) { 1927 /* check if there are other ports related to this aggregator 1928 * except the port related to this slave(thats ensure us that 1929 * there is a reason to search for new aggregator, and that we 1930 * will find one 1931 */ 1932 if ((aggregator->lag_ports != port) || 1933 (aggregator->lag_ports->next_port_in_aggregator)) { 1934 /* find new aggregator for the related port(s) */ 1935 bond_for_each_slave(bond, slave_iter, iter) { 1936 new_aggregator = &(SLAVE_AD_INFO(slave_iter).aggregator); 1937 /* if the new aggregator is empty, or it is 1938 * connected to our port only 1939 */ 1940 if (!new_aggregator->lag_ports || 1941 ((new_aggregator->lag_ports == port) && 1942 !new_aggregator->lag_ports->next_port_in_aggregator)) 1943 break; 1944 } 1945 if (!slave_iter) 1946 new_aggregator = NULL; 1947 1948 /* if new aggregator found, copy the aggregator's 1949 * parameters and connect the related lag_ports to the 1950 * new aggregator 1951 */ 1952 if ((new_aggregator) && ((!new_aggregator->lag_ports) || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator))) { 1953 pr_debug("Some port(s) related to LAG %d - replaceing with LAG %d\n", 1954 aggregator->aggregator_identifier, 1955 new_aggregator->aggregator_identifier); 1956 1957 if ((new_aggregator->lag_ports == port) && 1958 new_aggregator->is_active) { 1959 pr_info("%s: Removing an active aggregator\n", 1960 aggregator->slave->bond->dev->name); 1961 select_new_active_agg = 1; 1962 } 1963 1964 new_aggregator->is_individual = aggregator->is_individual; 1965 new_aggregator->actor_admin_aggregator_key = aggregator->actor_admin_aggregator_key; 1966 new_aggregator->actor_oper_aggregator_key = aggregator->actor_oper_aggregator_key; 1967 new_aggregator->partner_system = aggregator->partner_system; 1968 new_aggregator->partner_system_priority = aggregator->partner_system_priority; 1969 new_aggregator->partner_oper_aggregator_key = aggregator->partner_oper_aggregator_key; 1970 new_aggregator->receive_state = aggregator->receive_state; 1971 new_aggregator->transmit_state = aggregator->transmit_state; 1972 new_aggregator->lag_ports = aggregator->lag_ports; 1973 new_aggregator->is_active = aggregator->is_active; 1974 new_aggregator->num_of_ports = aggregator->num_of_ports; 1975 1976 /* update the information that is written on 1977 * the ports about the aggregator 1978 */ 1979 for (temp_port = aggregator->lag_ports; temp_port; 1980 temp_port = temp_port->next_port_in_aggregator) { 1981 temp_port->aggregator = new_aggregator; 1982 temp_port->actor_port_aggregator_identifier = new_aggregator->aggregator_identifier; 1983 } 1984 1985 ad_clear_agg(aggregator); 1986 1987 if (select_new_active_agg) 1988 ad_agg_selection_logic(__get_first_agg(port)); 1989 } else { 1990 pr_warn("%s: Warning: unbinding aggregator, and could not find a new aggregator for its ports\n", 1991 slave->bond->dev->name); 1992 } 1993 } else { 1994 /* in case that the only port related to this 1995 * aggregator is the one we want to remove 1996 */ 1997 select_new_active_agg = aggregator->is_active; 1998 ad_clear_agg(aggregator); 1999 if (select_new_active_agg) { 2000 pr_info("%s: Removing an active aggregator\n", 2001 slave->bond->dev->name); 2002 /* select new active aggregator */ 2003 temp_aggregator = __get_first_agg(port); 2004 if (temp_aggregator) 2005 ad_agg_selection_logic(temp_aggregator); 2006 } 2007 } 2008 } 2009 2010 pr_debug("Unbinding port %d\n", port->actor_port_number); 2011 2012 /* find the aggregator that this port is connected to */ 2013 bond_for_each_slave(bond, slave_iter, iter) { 2014 temp_aggregator = &(SLAVE_AD_INFO(slave_iter).aggregator); 2015 prev_port = NULL; 2016 /* search the port in the aggregator's related ports */ 2017 for (temp_port = temp_aggregator->lag_ports; temp_port; 2018 prev_port = temp_port, 2019 temp_port = temp_port->next_port_in_aggregator) { 2020 if (temp_port == port) { 2021 /* the aggregator found - detach the port from 2022 * this aggregator 2023 */ 2024 if (prev_port) 2025 prev_port->next_port_in_aggregator = temp_port->next_port_in_aggregator; 2026 else 2027 temp_aggregator->lag_ports = temp_port->next_port_in_aggregator; 2028 temp_aggregator->num_of_ports--; 2029 if (temp_aggregator->num_of_ports == 0) { 2030 select_new_active_agg = temp_aggregator->is_active; 2031 ad_clear_agg(temp_aggregator); 2032 if (select_new_active_agg) { 2033 pr_info("%s: Removing an active aggregator\n", 2034 slave->bond->dev->name); 2035 /* select new active aggregator */ 2036 ad_agg_selection_logic(__get_first_agg(port)); 2037 } 2038 } 2039 break; 2040 } 2041 } 2042 } 2043 port->slave = NULL; 2044 } 2045 2046 /** 2047 * bond_3ad_state_machine_handler - handle state machines timeout 2048 * @bond: bonding struct to work on 2049 * 2050 * The state machine handling concept in this module is to check every tick 2051 * which state machine should operate any function. The execution order is 2052 * round robin, so when we have an interaction between state machines, the 2053 * reply of one to each other might be delayed until next tick. 2054 * 2055 * This function also complete the initialization when the agg_select_timer 2056 * times out, and it selects an aggregator for the ports that are yet not 2057 * related to any aggregator, and selects the active aggregator for a bond. 2058 */ 2059 void bond_3ad_state_machine_handler(struct work_struct *work) 2060 { 2061 struct bonding *bond = container_of(work, struct bonding, 2062 ad_work.work); 2063 struct aggregator *aggregator; 2064 struct list_head *iter; 2065 struct slave *slave; 2066 struct port *port; 2067 2068 read_lock(&bond->lock); 2069 rcu_read_lock(); 2070 2071 /* check if there are any slaves */ 2072 if (!bond_has_slaves(bond)) 2073 goto re_arm; 2074 2075 /* check if agg_select_timer timer after initialize is timed out */ 2076 if (BOND_AD_INFO(bond).agg_select_timer && 2077 !(--BOND_AD_INFO(bond).agg_select_timer)) { 2078 slave = bond_first_slave_rcu(bond); 2079 port = slave ? &(SLAVE_AD_INFO(slave).port) : NULL; 2080 2081 /* select the active aggregator for the bond */ 2082 if (port) { 2083 if (!port->slave) { 2084 pr_warn("%s: Warning: bond's first port is uninitialized\n", 2085 bond->dev->name); 2086 goto re_arm; 2087 } 2088 2089 aggregator = __get_first_agg(port); 2090 ad_agg_selection_logic(aggregator); 2091 } 2092 bond_3ad_set_carrier(bond); 2093 } 2094 2095 /* for each port run the state machines */ 2096 bond_for_each_slave_rcu(bond, slave, iter) { 2097 port = &(SLAVE_AD_INFO(slave).port); 2098 if (!port->slave) { 2099 pr_warn("%s: Warning: Found an uninitialized port\n", 2100 bond->dev->name); 2101 goto re_arm; 2102 } 2103 2104 /* Lock around state machines to protect data accessed 2105 * by all (e.g., port->sm_vars). ad_rx_machine may run 2106 * concurrently due to incoming LACPDU. 2107 */ 2108 __get_state_machine_lock(port); 2109 2110 ad_rx_machine(NULL, port); 2111 ad_periodic_machine(port); 2112 ad_port_selection_logic(port); 2113 ad_mux_machine(port); 2114 ad_tx_machine(port); 2115 2116 /* turn off the BEGIN bit, since we already handled it */ 2117 if (port->sm_vars & AD_PORT_BEGIN) 2118 port->sm_vars &= ~AD_PORT_BEGIN; 2119 2120 __release_state_machine_lock(port); 2121 } 2122 2123 re_arm: 2124 rcu_read_unlock(); 2125 read_unlock(&bond->lock); 2126 queue_delayed_work(bond->wq, &bond->ad_work, ad_delta_in_ticks); 2127 } 2128 2129 /** 2130 * bond_3ad_rx_indication - handle a received frame 2131 * @lacpdu: received lacpdu 2132 * @slave: slave struct to work on 2133 * @length: length of the data received 2134 * 2135 * It is assumed that frames that were sent on this NIC don't returned as new 2136 * received frames (loopback). Since only the payload is given to this 2137 * function, it check for loopback. 2138 */ 2139 static int bond_3ad_rx_indication(struct lacpdu *lacpdu, struct slave *slave, 2140 u16 length) 2141 { 2142 struct port *port; 2143 int ret = RX_HANDLER_ANOTHER; 2144 2145 if (length >= sizeof(struct lacpdu)) { 2146 2147 port = &(SLAVE_AD_INFO(slave).port); 2148 2149 if (!port->slave) { 2150 pr_warn("%s: Warning: port of slave %s is uninitialized\n", 2151 slave->dev->name, slave->bond->dev->name); 2152 return ret; 2153 } 2154 2155 switch (lacpdu->subtype) { 2156 case AD_TYPE_LACPDU: 2157 ret = RX_HANDLER_CONSUMED; 2158 pr_debug("Received LACPDU on port %d\n", 2159 port->actor_port_number); 2160 /* Protect against concurrent state machines */ 2161 __get_state_machine_lock(port); 2162 ad_rx_machine(lacpdu, port); 2163 __release_state_machine_lock(port); 2164 break; 2165 2166 case AD_TYPE_MARKER: 2167 ret = RX_HANDLER_CONSUMED; 2168 /* No need to convert fields to Little Endian since we 2169 * don't use the marker's fields. 2170 */ 2171 2172 switch (((struct bond_marker *)lacpdu)->tlv_type) { 2173 case AD_MARKER_INFORMATION_SUBTYPE: 2174 pr_debug("Received Marker Information on port %d\n", 2175 port->actor_port_number); 2176 ad_marker_info_received((struct bond_marker *)lacpdu, port); 2177 break; 2178 2179 case AD_MARKER_RESPONSE_SUBTYPE: 2180 pr_debug("Received Marker Response on port %d\n", 2181 port->actor_port_number); 2182 ad_marker_response_received((struct bond_marker *)lacpdu, port); 2183 break; 2184 2185 default: 2186 pr_debug("Received an unknown Marker subtype on slot %d\n", 2187 port->actor_port_number); 2188 } 2189 } 2190 } 2191 return ret; 2192 } 2193 2194 /** 2195 * bond_3ad_adapter_speed_changed - handle a slave's speed change indication 2196 * @slave: slave struct to work on 2197 * 2198 * Handle reselection of aggregator (if needed) for this port. 2199 */ 2200 void bond_3ad_adapter_speed_changed(struct slave *slave) 2201 { 2202 struct port *port; 2203 2204 port = &(SLAVE_AD_INFO(slave).port); 2205 2206 /* if slave is null, the whole port is not initialized */ 2207 if (!port->slave) { 2208 pr_warn("Warning: %s: speed changed for uninitialized port on %s\n", 2209 slave->bond->dev->name, slave->dev->name); 2210 return; 2211 } 2212 2213 __get_state_machine_lock(port); 2214 2215 port->actor_admin_port_key &= ~AD_SPEED_KEY_BITS; 2216 port->actor_oper_port_key = port->actor_admin_port_key |= 2217 (__get_link_speed(port) << 1); 2218 pr_debug("Port %d changed speed\n", port->actor_port_number); 2219 /* there is no need to reselect a new aggregator, just signal the 2220 * state machines to reinitialize 2221 */ 2222 port->sm_vars |= AD_PORT_BEGIN; 2223 2224 __release_state_machine_lock(port); 2225 } 2226 2227 /** 2228 * bond_3ad_adapter_duplex_changed - handle a slave's duplex change indication 2229 * @slave: slave struct to work on 2230 * 2231 * Handle reselection of aggregator (if needed) for this port. 2232 */ 2233 void bond_3ad_adapter_duplex_changed(struct slave *slave) 2234 { 2235 struct port *port; 2236 2237 port = &(SLAVE_AD_INFO(slave).port); 2238 2239 /* if slave is null, the whole port is not initialized */ 2240 if (!port->slave) { 2241 pr_warn("%s: Warning: duplex changed for uninitialized port on %s\n", 2242 slave->bond->dev->name, slave->dev->name); 2243 return; 2244 } 2245 2246 __get_state_machine_lock(port); 2247 2248 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS; 2249 port->actor_oper_port_key = port->actor_admin_port_key |= 2250 __get_duplex(port); 2251 pr_debug("Port %d changed duplex\n", port->actor_port_number); 2252 /* there is no need to reselect a new aggregator, just signal the 2253 * state machines to reinitialize 2254 */ 2255 port->sm_vars |= AD_PORT_BEGIN; 2256 2257 __release_state_machine_lock(port); 2258 } 2259 2260 /** 2261 * bond_3ad_handle_link_change - handle a slave's link status change indication 2262 * @slave: slave struct to work on 2263 * @status: whether the link is now up or down 2264 * 2265 * Handle reselection of aggregator (if needed) for this port. 2266 */ 2267 void bond_3ad_handle_link_change(struct slave *slave, char link) 2268 { 2269 struct port *port; 2270 2271 port = &(SLAVE_AD_INFO(slave).port); 2272 2273 /* if slave is null, the whole port is not initialized */ 2274 if (!port->slave) { 2275 pr_warn("Warning: %s: link status changed for uninitialized port on %s\n", 2276 slave->bond->dev->name, slave->dev->name); 2277 return; 2278 } 2279 2280 __get_state_machine_lock(port); 2281 /* on link down we are zeroing duplex and speed since 2282 * some of the adaptors(ce1000.lan) report full duplex/speed 2283 * instead of N/A(duplex) / 0(speed). 2284 * 2285 * on link up we are forcing recheck on the duplex and speed since 2286 * some of he adaptors(ce1000.lan) report. 2287 */ 2288 if (link == BOND_LINK_UP) { 2289 port->is_enabled = true; 2290 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS; 2291 port->actor_oper_port_key = port->actor_admin_port_key |= 2292 __get_duplex(port); 2293 port->actor_admin_port_key &= ~AD_SPEED_KEY_BITS; 2294 port->actor_oper_port_key = port->actor_admin_port_key |= 2295 (__get_link_speed(port) << 1); 2296 } else { 2297 /* link has failed */ 2298 port->is_enabled = false; 2299 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS; 2300 port->actor_oper_port_key = (port->actor_admin_port_key &= 2301 ~AD_SPEED_KEY_BITS); 2302 } 2303 pr_debug("Port %d changed link status to %s", 2304 port->actor_port_number, 2305 (link == BOND_LINK_UP) ? "UP" : "DOWN"); 2306 /* there is no need to reselect a new aggregator, just signal the 2307 * state machines to reinitialize 2308 */ 2309 port->sm_vars |= AD_PORT_BEGIN; 2310 2311 __release_state_machine_lock(port); 2312 } 2313 2314 /** 2315 * bond_3ad_set_carrier - set link state for bonding master 2316 * @bond - bonding structure 2317 * 2318 * if we have an active aggregator, we're up, if not, we're down. 2319 * Presumes that we cannot have an active aggregator if there are 2320 * no slaves with link up. 2321 * 2322 * This behavior complies with IEEE 802.3 section 43.3.9. 2323 * 2324 * Called by bond_set_carrier(). Return zero if carrier state does not 2325 * change, nonzero if it does. 2326 */ 2327 int bond_3ad_set_carrier(struct bonding *bond) 2328 { 2329 struct aggregator *active; 2330 struct slave *first_slave; 2331 int ret = 1; 2332 2333 rcu_read_lock(); 2334 first_slave = bond_first_slave_rcu(bond); 2335 if (!first_slave) { 2336 ret = 0; 2337 goto out; 2338 } 2339 active = __get_active_agg(&(SLAVE_AD_INFO(first_slave).aggregator)); 2340 if (active) { 2341 /* are enough slaves available to consider link up? */ 2342 if (active->num_of_ports < bond->params.min_links) { 2343 if (netif_carrier_ok(bond->dev)) { 2344 netif_carrier_off(bond->dev); 2345 goto out; 2346 } 2347 } else if (!netif_carrier_ok(bond->dev)) { 2348 netif_carrier_on(bond->dev); 2349 goto out; 2350 } 2351 } else if (netif_carrier_ok(bond->dev)) { 2352 netif_carrier_off(bond->dev); 2353 } 2354 out: 2355 rcu_read_unlock(); 2356 return ret; 2357 } 2358 2359 /** 2360 * __bond_3ad_get_active_agg_info - get information of the active aggregator 2361 * @bond: bonding struct to work on 2362 * @ad_info: ad_info struct to fill with the bond's info 2363 * 2364 * Returns: 0 on success 2365 * < 0 on error 2366 */ 2367 int __bond_3ad_get_active_agg_info(struct bonding *bond, 2368 struct ad_info *ad_info) 2369 { 2370 struct aggregator *aggregator = NULL; 2371 struct list_head *iter; 2372 struct slave *slave; 2373 struct port *port; 2374 2375 bond_for_each_slave_rcu(bond, slave, iter) { 2376 port = &(SLAVE_AD_INFO(slave).port); 2377 if (port->aggregator && port->aggregator->is_active) { 2378 aggregator = port->aggregator; 2379 break; 2380 } 2381 } 2382 2383 if (aggregator) { 2384 ad_info->aggregator_id = aggregator->aggregator_identifier; 2385 ad_info->ports = aggregator->num_of_ports; 2386 ad_info->actor_key = aggregator->actor_oper_aggregator_key; 2387 ad_info->partner_key = aggregator->partner_oper_aggregator_key; 2388 memcpy(ad_info->partner_system, 2389 aggregator->partner_system.mac_addr_value, ETH_ALEN); 2390 return 0; 2391 } 2392 2393 return -1; 2394 } 2395 2396 /* Wrapper used to hold bond->lock so no slave manipulation can occur */ 2397 int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info) 2398 { 2399 int ret; 2400 2401 rcu_read_lock(); 2402 ret = __bond_3ad_get_active_agg_info(bond, ad_info); 2403 rcu_read_unlock(); 2404 2405 return ret; 2406 } 2407 2408 int bond_3ad_xmit_xor(struct sk_buff *skb, struct net_device *dev) 2409 { 2410 struct bonding *bond = netdev_priv(dev); 2411 struct slave *slave, *first_ok_slave; 2412 struct aggregator *agg; 2413 struct ad_info ad_info; 2414 struct list_head *iter; 2415 int slaves_in_agg; 2416 int slave_agg_no; 2417 int agg_id; 2418 2419 if (__bond_3ad_get_active_agg_info(bond, &ad_info)) { 2420 pr_debug("%s: Error: __bond_3ad_get_active_agg_info failed\n", 2421 dev->name); 2422 goto err_free; 2423 } 2424 2425 slaves_in_agg = ad_info.ports; 2426 agg_id = ad_info.aggregator_id; 2427 2428 if (slaves_in_agg == 0) { 2429 pr_debug("%s: Error: active aggregator is empty\n", dev->name); 2430 goto err_free; 2431 } 2432 2433 slave_agg_no = bond_xmit_hash(bond, skb, slaves_in_agg); 2434 first_ok_slave = NULL; 2435 2436 bond_for_each_slave_rcu(bond, slave, iter) { 2437 agg = SLAVE_AD_INFO(slave).port.aggregator; 2438 if (!agg || agg->aggregator_identifier != agg_id) 2439 continue; 2440 2441 if (slave_agg_no >= 0) { 2442 if (!first_ok_slave && SLAVE_IS_OK(slave)) 2443 first_ok_slave = slave; 2444 slave_agg_no--; 2445 continue; 2446 } 2447 2448 if (SLAVE_IS_OK(slave)) { 2449 bond_dev_queue_xmit(bond, skb, slave->dev); 2450 goto out; 2451 } 2452 } 2453 2454 if (slave_agg_no >= 0) { 2455 pr_err("%s: Error: Couldn't find a slave to tx on for aggregator ID %d\n", 2456 dev->name, agg_id); 2457 goto err_free; 2458 } 2459 2460 /* we couldn't find any suitable slave after the agg_no, so use the 2461 * first suitable found, if found. 2462 */ 2463 if (first_ok_slave) 2464 bond_dev_queue_xmit(bond, skb, first_ok_slave->dev); 2465 else 2466 goto err_free; 2467 2468 out: 2469 return NETDEV_TX_OK; 2470 err_free: 2471 /* no suitable interface, frame not sent */ 2472 kfree_skb(skb); 2473 goto out; 2474 } 2475 2476 int bond_3ad_lacpdu_recv(const struct sk_buff *skb, struct bonding *bond, 2477 struct slave *slave) 2478 { 2479 int ret = RX_HANDLER_ANOTHER; 2480 struct lacpdu *lacpdu, _lacpdu; 2481 2482 if (skb->protocol != PKT_TYPE_LACPDU) 2483 return ret; 2484 2485 lacpdu = skb_header_pointer(skb, 0, sizeof(_lacpdu), &_lacpdu); 2486 if (!lacpdu) 2487 return ret; 2488 2489 read_lock(&bond->lock); 2490 ret = bond_3ad_rx_indication(lacpdu, slave, skb->len); 2491 read_unlock(&bond->lock); 2492 return ret; 2493 } 2494 2495 /** 2496 * bond_3ad_update_lacp_rate - change the lacp rate 2497 * @bond - bonding struct 2498 * 2499 * When modify lacp_rate parameter via sysfs, 2500 * update actor_oper_port_state of each port. 2501 * 2502 * Hold slave->state_machine_lock, 2503 * so we can modify port->actor_oper_port_state, 2504 * no matter bond is up or down. 2505 */ 2506 void bond_3ad_update_lacp_rate(struct bonding *bond) 2507 { 2508 struct port *port = NULL; 2509 struct list_head *iter; 2510 struct slave *slave; 2511 int lacp_fast; 2512 2513 lacp_fast = bond->params.lacp_fast; 2514 bond_for_each_slave(bond, slave, iter) { 2515 port = &(SLAVE_AD_INFO(slave).port); 2516 __get_state_machine_lock(port); 2517 if (lacp_fast) 2518 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT; 2519 else 2520 port->actor_oper_port_state &= ~AD_STATE_LACP_TIMEOUT; 2521 __release_state_machine_lock(port); 2522 } 2523 } 2524