1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* 3 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved. 4 */ 5 6 #include <linux/skbuff.h> 7 #include <linux/if_ether.h> 8 #include <linux/netdevice.h> 9 #include <linux/spinlock.h> 10 #include <linux/ethtool.h> 11 #include <linux/etherdevice.h> 12 #include <linux/if_bonding.h> 13 #include <linux/pkt_sched.h> 14 #include <net/net_namespace.h> 15 #include <net/bonding.h> 16 #include <net/bond_3ad.h> 17 #include <net/netlink.h> 18 19 /* General definitions */ 20 #define AD_SHORT_TIMEOUT 1 21 #define AD_LONG_TIMEOUT 0 22 #define AD_STANDBY 0x2 23 #define AD_MAX_TX_IN_SECOND 3 24 #define AD_COLLECTOR_MAX_DELAY 0 25 26 /* Timer definitions (43.4.4 in the 802.3ad standard) */ 27 #define AD_FAST_PERIODIC_TIME 1 28 #define AD_SLOW_PERIODIC_TIME 30 29 #define AD_SHORT_TIMEOUT_TIME (3*AD_FAST_PERIODIC_TIME) 30 #define AD_LONG_TIMEOUT_TIME (3*AD_SLOW_PERIODIC_TIME) 31 #define AD_CHURN_DETECTION_TIME 60 32 #define AD_AGGREGATE_WAIT_TIME 2 33 34 /* Port Variables definitions used by the State Machines (43.4.7 in the 35 * 802.3ad standard) 36 */ 37 #define AD_PORT_BEGIN 0x1 38 #define AD_PORT_LACP_ENABLED 0x2 39 #define AD_PORT_ACTOR_CHURN 0x4 40 #define AD_PORT_PARTNER_CHURN 0x8 41 #define AD_PORT_READY 0x10 42 #define AD_PORT_READY_N 0x20 43 #define AD_PORT_MATCHED 0x40 44 #define AD_PORT_STANDBY 0x80 45 #define AD_PORT_SELECTED 0x100 46 #define AD_PORT_MOVED 0x200 47 #define AD_PORT_CHURNED (AD_PORT_ACTOR_CHURN | AD_PORT_PARTNER_CHURN) 48 49 /* Port Key definitions 50 * key is determined according to the link speed, duplex and 51 * user key (which is yet not supported) 52 * -------------------------------------------------------------- 53 * Port key | User key (10 bits) | Speed (5 bits) | Duplex| 54 * -------------------------------------------------------------- 55 * |15 6|5 1|0 56 */ 57 #define AD_DUPLEX_KEY_MASKS 0x1 58 #define AD_SPEED_KEY_MASKS 0x3E 59 #define AD_USER_KEY_MASKS 0xFFC0 60 61 enum 
ad_link_speed_type { 62 AD_LINK_SPEED_1MBPS = 1, 63 AD_LINK_SPEED_10MBPS, 64 AD_LINK_SPEED_100MBPS, 65 AD_LINK_SPEED_1000MBPS, 66 AD_LINK_SPEED_2500MBPS, 67 AD_LINK_SPEED_5000MBPS, 68 AD_LINK_SPEED_10000MBPS, 69 AD_LINK_SPEED_14000MBPS, 70 AD_LINK_SPEED_20000MBPS, 71 AD_LINK_SPEED_25000MBPS, 72 AD_LINK_SPEED_40000MBPS, 73 AD_LINK_SPEED_50000MBPS, 74 AD_LINK_SPEED_56000MBPS, 75 AD_LINK_SPEED_100000MBPS, 76 AD_LINK_SPEED_200000MBPS, 77 AD_LINK_SPEED_400000MBPS, 78 AD_LINK_SPEED_800000MBPS, 79 }; 80 81 /* compare MAC addresses */ 82 #define MAC_ADDRESS_EQUAL(A, B) \ 83 ether_addr_equal_64bits((const u8 *)A, (const u8 *)B) 84 85 static const u16 ad_ticks_per_sec = 1000 / AD_TIMER_INTERVAL; 86 static const int ad_delta_in_ticks = (AD_TIMER_INTERVAL * HZ) / 1000; 87 88 const u8 lacpdu_mcast_addr[ETH_ALEN + 2] __long_aligned = { 89 0x01, 0x80, 0xC2, 0x00, 0x00, 0x02 90 }; 91 92 /* ================= main 802.3ad protocol functions ================== */ 93 static int ad_lacpdu_send(struct port *port); 94 static int ad_marker_send(struct port *port, struct bond_marker *marker); 95 static void ad_mux_machine(struct port *port, bool *update_slave_arr); 96 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port); 97 static void ad_tx_machine(struct port *port); 98 static void ad_periodic_machine(struct port *port); 99 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr); 100 static void ad_agg_selection_logic(struct aggregator *aggregator, 101 bool *update_slave_arr); 102 static void ad_clear_agg(struct aggregator *aggregator); 103 static void ad_initialize_agg(struct aggregator *aggregator); 104 static void ad_initialize_port(struct port *port, const struct bond_params *bond_params); 105 static void ad_enable_collecting(struct port *port); 106 static void ad_disable_distributing(struct port *port, 107 bool *update_slave_arr); 108 static void ad_enable_collecting_distributing(struct port *port, 109 bool *update_slave_arr); 110 static void 
ad_disable_collecting_distributing(struct port *port, 111 bool *update_slave_arr); 112 static void ad_marker_info_received(struct bond_marker *marker_info, 113 struct port *port); 114 static void ad_marker_response_received(struct bond_marker *marker, 115 struct port *port); 116 static void ad_update_actor_keys(struct port *port, bool reset); 117 118 119 /* ================= api to bonding and kernel code ================== */ 120 121 /** 122 * __get_bond_by_port - get the port's bonding struct 123 * @port: the port we're looking at 124 * 125 * Return @port's bonding struct, or %NULL if it can't be found. 126 */ 127 static inline struct bonding *__get_bond_by_port(struct port *port) 128 { 129 if (port->slave == NULL) 130 return NULL; 131 132 return bond_get_bond_by_slave(port->slave); 133 } 134 135 /** 136 * __get_first_agg - get the first aggregator in the bond 137 * @port: the port we're looking at 138 * 139 * Return the aggregator of the first slave in @bond, or %NULL if it can't be 140 * found. 141 * The caller must hold RCU or RTNL lock. 142 */ 143 static inline struct aggregator *__get_first_agg(struct port *port) 144 { 145 struct bonding *bond = __get_bond_by_port(port); 146 struct slave *first_slave; 147 struct aggregator *agg; 148 149 /* If there's no bond for this port, or bond has no slaves */ 150 if (bond == NULL) 151 return NULL; 152 153 rcu_read_lock(); 154 first_slave = bond_first_slave_rcu(bond); 155 agg = first_slave ? &(SLAVE_AD_INFO(first_slave)->aggregator) : NULL; 156 rcu_read_unlock(); 157 158 return agg; 159 } 160 161 /** 162 * __agg_has_partner - see if we have a partner 163 * @agg: the agregator we're looking at 164 * 165 * Return nonzero if aggregator has a partner (denoted by a non-zero ether 166 * address for the partner). Return 0 if not. 
167 */ 168 static inline int __agg_has_partner(struct aggregator *agg) 169 { 170 return !is_zero_ether_addr(agg->partner_system.mac_addr_value); 171 } 172 173 /** 174 * __disable_distributing_port - disable the port's slave for distributing. 175 * Port will still be able to collect. 176 * @port: the port we're looking at 177 * 178 * This will disable only distributing on the port's slave. 179 */ 180 static void __disable_distributing_port(struct port *port) 181 { 182 bond_set_slave_tx_disabled_flags(port->slave, BOND_SLAVE_NOTIFY_LATER); 183 } 184 185 /** 186 * __enable_collecting_port - enable the port's slave for collecting, 187 * if it's up 188 * @port: the port we're looking at 189 * 190 * This will enable only collecting on the port's slave. 191 */ 192 static void __enable_collecting_port(struct port *port) 193 { 194 struct slave *slave = port->slave; 195 196 if (slave->link == BOND_LINK_UP && bond_slave_is_up(slave)) 197 bond_set_slave_rx_enabled_flags(slave, BOND_SLAVE_NOTIFY_LATER); 198 } 199 200 /** 201 * __disable_port - disable the port's slave 202 * @port: the port we're looking at 203 * 204 * This will disable both collecting and distributing on the port's slave. 205 */ 206 static inline void __disable_port(struct port *port) 207 { 208 bond_set_slave_inactive_flags(port->slave, BOND_SLAVE_NOTIFY_LATER); 209 } 210 211 /** 212 * __enable_port - enable the port's slave, if it's up 213 * @port: the port we're looking at 214 * 215 * This will enable both collecting and distributing on the port's slave. 216 */ 217 static inline void __enable_port(struct port *port) 218 { 219 struct slave *slave = port->slave; 220 221 if ((slave->link == BOND_LINK_UP) && bond_slave_is_up(slave)) 222 bond_set_slave_active_flags(slave, BOND_SLAVE_NOTIFY_LATER); 223 } 224 225 /** 226 * __port_move_to_attached_state - check if port should transition back to attached 227 * state. 
228 * @port: the port we're looking at 229 */ 230 static bool __port_move_to_attached_state(struct port *port) 231 { 232 if (!(port->sm_vars & AD_PORT_SELECTED) || 233 (port->sm_vars & AD_PORT_STANDBY) || 234 !(port->partner_oper.port_state & LACP_STATE_SYNCHRONIZATION) || 235 !(port->actor_oper_port_state & LACP_STATE_SYNCHRONIZATION)) 236 port->sm_mux_state = AD_MUX_ATTACHED; 237 238 return port->sm_mux_state == AD_MUX_ATTACHED; 239 } 240 241 /** 242 * __port_is_collecting_distributing - check if the port's slave is in the 243 * combined collecting/distributing state 244 * @port: the port we're looking at 245 */ 246 static int __port_is_collecting_distributing(struct port *port) 247 { 248 return bond_is_active_slave(port->slave); 249 } 250 251 /** 252 * __get_agg_selection_mode - get the aggregator selection mode 253 * @port: the port we're looking at 254 * 255 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT. 256 */ 257 static inline u32 __get_agg_selection_mode(struct port *port) 258 { 259 struct bonding *bond = __get_bond_by_port(port); 260 261 if (bond == NULL) 262 return BOND_AD_STABLE; 263 264 return bond->params.ad_select; 265 } 266 267 /** 268 * __check_agg_selection_timer - check if the selection timer has expired 269 * @port: the port we're looking at 270 */ 271 static inline int __check_agg_selection_timer(struct port *port) 272 { 273 struct bonding *bond = __get_bond_by_port(port); 274 275 if (bond == NULL) 276 return 0; 277 278 return atomic_read(&BOND_AD_INFO(bond).agg_select_timer) ? 1 : 0; 279 } 280 281 /** 282 * __get_link_speed - get a port's speed 283 * @port: the port we're looking at 284 * 285 * Return @port's speed in 802.3ad enum format. i.e. 
one of: 286 * 0, 287 * %AD_LINK_SPEED_10MBPS, 288 * %AD_LINK_SPEED_100MBPS, 289 * %AD_LINK_SPEED_1000MBPS, 290 * %AD_LINK_SPEED_2500MBPS, 291 * %AD_LINK_SPEED_5000MBPS, 292 * %AD_LINK_SPEED_10000MBPS 293 * %AD_LINK_SPEED_14000MBPS, 294 * %AD_LINK_SPEED_20000MBPS 295 * %AD_LINK_SPEED_25000MBPS 296 * %AD_LINK_SPEED_40000MBPS 297 * %AD_LINK_SPEED_50000MBPS 298 * %AD_LINK_SPEED_56000MBPS 299 * %AD_LINK_SPEED_100000MBPS 300 * %AD_LINK_SPEED_200000MBPS 301 * %AD_LINK_SPEED_400000MBPS 302 * %AD_LINK_SPEED_800000MBPS 303 */ 304 static u16 __get_link_speed(struct port *port) 305 { 306 struct slave *slave = port->slave; 307 u16 speed; 308 309 /* this if covers only a special case: when the configuration starts 310 * with link down, it sets the speed to 0. 311 * This is done in spite of the fact that the e100 driver reports 0 312 * to be compatible with MVT in the future. 313 */ 314 if (slave->link != BOND_LINK_UP) 315 speed = 0; 316 else { 317 switch (slave->speed) { 318 case SPEED_10: 319 speed = AD_LINK_SPEED_10MBPS; 320 break; 321 322 case SPEED_100: 323 speed = AD_LINK_SPEED_100MBPS; 324 break; 325 326 case SPEED_1000: 327 speed = AD_LINK_SPEED_1000MBPS; 328 break; 329 330 case SPEED_2500: 331 speed = AD_LINK_SPEED_2500MBPS; 332 break; 333 334 case SPEED_5000: 335 speed = AD_LINK_SPEED_5000MBPS; 336 break; 337 338 case SPEED_10000: 339 speed = AD_LINK_SPEED_10000MBPS; 340 break; 341 342 case SPEED_14000: 343 speed = AD_LINK_SPEED_14000MBPS; 344 break; 345 346 case SPEED_20000: 347 speed = AD_LINK_SPEED_20000MBPS; 348 break; 349 350 case SPEED_25000: 351 speed = AD_LINK_SPEED_25000MBPS; 352 break; 353 354 case SPEED_40000: 355 speed = AD_LINK_SPEED_40000MBPS; 356 break; 357 358 case SPEED_50000: 359 speed = AD_LINK_SPEED_50000MBPS; 360 break; 361 362 case SPEED_56000: 363 speed = AD_LINK_SPEED_56000MBPS; 364 break; 365 366 case SPEED_100000: 367 speed = AD_LINK_SPEED_100000MBPS; 368 break; 369 370 case SPEED_200000: 371 speed = AD_LINK_SPEED_200000MBPS; 372 break; 373 374 
case SPEED_400000: 375 speed = AD_LINK_SPEED_400000MBPS; 376 break; 377 378 case SPEED_800000: 379 speed = AD_LINK_SPEED_800000MBPS; 380 break; 381 382 default: 383 /* unknown speed value from ethtool. shouldn't happen */ 384 if (slave->speed != SPEED_UNKNOWN) 385 pr_err_once("%s: (slave %s): unknown ethtool speed (%d) for port %d (set it to 0)\n", 386 slave->bond->dev->name, 387 slave->dev->name, slave->speed, 388 port->actor_port_number); 389 speed = 0; 390 break; 391 } 392 } 393 394 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received link speed %d update from adapter\n", 395 port->actor_port_number, speed); 396 return speed; 397 } 398 399 /** 400 * __get_duplex - get a port's duplex 401 * @port: the port we're looking at 402 * 403 * Return @port's duplex in 802.3ad bitmask format. i.e.: 404 * 0x01 if in full duplex 405 * 0x00 otherwise 406 */ 407 static u8 __get_duplex(struct port *port) 408 { 409 struct slave *slave = port->slave; 410 u8 retval = 0x0; 411 412 /* handling a special case: when the configuration starts with 413 * link down, it sets the duplex to 0. 
414 */ 415 if (slave->link == BOND_LINK_UP) { 416 switch (slave->duplex) { 417 case DUPLEX_FULL: 418 retval = 0x1; 419 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received status full duplex update from adapter\n", 420 port->actor_port_number); 421 break; 422 case DUPLEX_HALF: 423 default: 424 retval = 0x0; 425 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received status NOT full duplex update from adapter\n", 426 port->actor_port_number); 427 break; 428 } 429 } 430 return retval; 431 } 432 433 static void __ad_actor_update_port(struct port *port) 434 { 435 const struct bonding *bond = bond_get_bond_by_slave(port->slave); 436 437 port->actor_system = BOND_AD_INFO(bond).system.sys_mac_addr; 438 port->actor_system_priority = BOND_AD_INFO(bond).system.sys_priority; 439 } 440 441 /* Conversions */ 442 443 /** 444 * __ad_timer_to_ticks - convert a given timer type to AD module ticks 445 * @timer_type: which timer to operate 446 * @par: timer parameter. see below 447 * 448 * If @timer_type is %current_while_timer, @par indicates long/short timer. 449 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME, 450 * %SLOW_PERIODIC_TIME. 
451 */ 452 static u16 __ad_timer_to_ticks(u16 timer_type, u16 par) 453 { 454 u16 retval = 0; /* to silence the compiler */ 455 456 switch (timer_type) { 457 case AD_CURRENT_WHILE_TIMER: /* for rx machine usage */ 458 if (par) 459 retval = (AD_SHORT_TIMEOUT_TIME*ad_ticks_per_sec); 460 else 461 retval = (AD_LONG_TIMEOUT_TIME*ad_ticks_per_sec); 462 break; 463 case AD_ACTOR_CHURN_TIMER: /* for local churn machine */ 464 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec); 465 break; 466 case AD_PERIODIC_TIMER: /* for periodic machine */ 467 retval = (par*ad_ticks_per_sec); /* long timeout */ 468 break; 469 case AD_PARTNER_CHURN_TIMER: /* for remote churn machine */ 470 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec); 471 break; 472 case AD_WAIT_WHILE_TIMER: /* for selection machine */ 473 retval = (AD_AGGREGATE_WAIT_TIME*ad_ticks_per_sec); 474 break; 475 } 476 477 return retval; 478 } 479 480 481 /* ================= ad_rx_machine helper functions ================== */ 482 483 /** 484 * __choose_matched - update a port's matched variable from a received lacpdu 485 * @lacpdu: the lacpdu we've received 486 * @port: the port we're looking at 487 * 488 * Update the value of the matched variable, using parameter values from a 489 * newly received lacpdu. Parameter values for the partner carried in the 490 * received PDU are compared with the corresponding operational parameter 491 * values for the actor. Matched is set to TRUE if all of these parameters 492 * match and the PDU parameter partner_state.aggregation has the same value as 493 * actor_oper_port_state.aggregation and lacp will actively maintain the link 494 * in the aggregation. Matched is also set to TRUE if the value of 495 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates 496 * an individual link and lacp will actively maintain the link. Otherwise, 497 * matched is set to FALSE. 
LACP is considered to be actively maintaining the 498 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both 499 * the actor's actor_oper_port_state.lacp_activity and the PDU's 500 * partner_state.lacp_activity variables are TRUE. 501 * 502 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is 503 * used here to implement the language from 802.3ad 43.4.9 that requires 504 * recordPDU to "match" the LACPDU parameters to the stored values. 505 */ 506 static void __choose_matched(struct lacpdu *lacpdu, struct port *port) 507 { 508 /* check if all parameters are alike 509 * or this is individual link(aggregation == FALSE) 510 * then update the state machine Matched variable. 511 */ 512 if (((ntohs(lacpdu->partner_port) == port->actor_port_number) && 513 (ntohs(lacpdu->partner_port_priority) == port->actor_port_priority) && 514 MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) && 515 (ntohs(lacpdu->partner_system_priority) == port->actor_system_priority) && 516 (ntohs(lacpdu->partner_key) == port->actor_oper_port_key) && 517 ((lacpdu->partner_state & LACP_STATE_AGGREGATION) == (port->actor_oper_port_state & LACP_STATE_AGGREGATION))) || 518 ((lacpdu->actor_state & LACP_STATE_AGGREGATION) == 0) 519 ) { 520 port->sm_vars |= AD_PORT_MATCHED; 521 } else { 522 port->sm_vars &= ~AD_PORT_MATCHED; 523 } 524 } 525 526 /** 527 * __record_pdu - record parameters from a received lacpdu 528 * @lacpdu: the lacpdu we've received 529 * @port: the port we're looking at 530 * 531 * Record the parameter values for the Actor carried in a received lacpdu as 532 * the current partner operational parameter values and sets 533 * actor_oper_port_state.defaulted to FALSE. 
534 */ 535 static void __record_pdu(struct lacpdu *lacpdu, struct port *port) 536 { 537 if (lacpdu && port) { 538 struct port_params *partner = &port->partner_oper; 539 540 __choose_matched(lacpdu, port); 541 /* record the new parameter values for the partner 542 * operational 543 */ 544 partner->port_number = ntohs(lacpdu->actor_port); 545 partner->port_priority = ntohs(lacpdu->actor_port_priority); 546 partner->system = lacpdu->actor_system; 547 partner->system_priority = ntohs(lacpdu->actor_system_priority); 548 partner->key = ntohs(lacpdu->actor_key); 549 partner->port_state = lacpdu->actor_state; 550 551 /* set actor_oper_port_state.defaulted to FALSE */ 552 port->actor_oper_port_state &= ~LACP_STATE_DEFAULTED; 553 554 /* set the partner sync. to on if the partner is sync, 555 * and the port is matched 556 */ 557 if ((port->sm_vars & AD_PORT_MATCHED) && 558 (lacpdu->actor_state & LACP_STATE_SYNCHRONIZATION)) { 559 partner->port_state |= LACP_STATE_SYNCHRONIZATION; 560 slave_dbg(port->slave->bond->dev, port->slave->dev, 561 "partner sync=1\n"); 562 } else { 563 partner->port_state &= ~LACP_STATE_SYNCHRONIZATION; 564 slave_dbg(port->slave->bond->dev, port->slave->dev, 565 "partner sync=0\n"); 566 } 567 } 568 } 569 570 /** 571 * __record_default - record default parameters 572 * @port: the port we're looking at 573 * 574 * This function records the default parameter values for the partner carried 575 * in the Partner Admin parameters as the current partner operational parameter 576 * values and sets actor_oper_port_state.defaulted to TRUE. 
577 */ 578 static void __record_default(struct port *port) 579 { 580 if (port) { 581 /* record the partner admin parameters */ 582 memcpy(&port->partner_oper, &port->partner_admin, 583 sizeof(struct port_params)); 584 585 /* set actor_oper_port_state.defaulted to true */ 586 port->actor_oper_port_state |= LACP_STATE_DEFAULTED; 587 } 588 } 589 590 /** 591 * __update_selected - update a port's Selected variable from a received lacpdu 592 * @lacpdu: the lacpdu we've received 593 * @port: the port we're looking at 594 * 595 * Update the value of the selected variable, using parameter values from a 596 * newly received lacpdu. The parameter values for the Actor carried in the 597 * received PDU are compared with the corresponding operational parameter 598 * values for the ports partner. If one or more of the comparisons shows that 599 * the value(s) received in the PDU differ from the current operational values, 600 * then selected is set to FALSE and actor_oper_port_state.synchronization is 601 * set to out_of_sync. Otherwise, selected remains unchanged. 602 */ 603 static void __update_selected(struct lacpdu *lacpdu, struct port *port) 604 { 605 if (lacpdu && port) { 606 const struct port_params *partner = &port->partner_oper; 607 608 /* check if any parameter is different then 609 * update the state machine selected variable. 
610 */ 611 if (ntohs(lacpdu->actor_port) != partner->port_number || 612 ntohs(lacpdu->actor_port_priority) != partner->port_priority || 613 !MAC_ADDRESS_EQUAL(&lacpdu->actor_system, &partner->system) || 614 ntohs(lacpdu->actor_system_priority) != partner->system_priority || 615 ntohs(lacpdu->actor_key) != partner->key || 616 (lacpdu->actor_state & LACP_STATE_AGGREGATION) != (partner->port_state & LACP_STATE_AGGREGATION)) { 617 port->sm_vars &= ~AD_PORT_SELECTED; 618 } 619 } 620 } 621 622 /** 623 * __update_default_selected - update a port's Selected variable from Partner 624 * @port: the port we're looking at 625 * 626 * This function updates the value of the selected variable, using the partner 627 * administrative parameter values. The administrative values are compared with 628 * the corresponding operational parameter values for the partner. If one or 629 * more of the comparisons shows that the administrative value(s) differ from 630 * the current operational values, then Selected is set to FALSE and 631 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise, 632 * Selected remains unchanged. 633 */ 634 static void __update_default_selected(struct port *port) 635 { 636 if (port) { 637 const struct port_params *admin = &port->partner_admin; 638 const struct port_params *oper = &port->partner_oper; 639 640 /* check if any parameter is different then 641 * update the state machine selected variable. 
642 */ 643 if (admin->port_number != oper->port_number || 644 admin->port_priority != oper->port_priority || 645 !MAC_ADDRESS_EQUAL(&admin->system, &oper->system) || 646 admin->system_priority != oper->system_priority || 647 admin->key != oper->key || 648 (admin->port_state & LACP_STATE_AGGREGATION) 649 != (oper->port_state & LACP_STATE_AGGREGATION)) { 650 port->sm_vars &= ~AD_PORT_SELECTED; 651 } 652 } 653 } 654 655 /** 656 * __update_ntt - update a port's ntt variable from a received lacpdu 657 * @lacpdu: the lacpdu we've received 658 * @port: the port we're looking at 659 * 660 * Updates the value of the ntt variable, using parameter values from a newly 661 * received lacpdu. The parameter values for the partner carried in the 662 * received PDU are compared with the corresponding operational parameter 663 * values for the Actor. If one or more of the comparisons shows that the 664 * value(s) received in the PDU differ from the current operational values, 665 * then ntt is set to TRUE. Otherwise, ntt remains unchanged. 666 */ 667 static void __update_ntt(struct lacpdu *lacpdu, struct port *port) 668 { 669 /* validate lacpdu and port */ 670 if (lacpdu && port) { 671 /* check if any parameter is different then 672 * update the port->ntt. 
673 */ 674 if ((ntohs(lacpdu->partner_port) != port->actor_port_number) || 675 (ntohs(lacpdu->partner_port_priority) != port->actor_port_priority) || 676 !MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) || 677 (ntohs(lacpdu->partner_system_priority) != port->actor_system_priority) || 678 (ntohs(lacpdu->partner_key) != port->actor_oper_port_key) || 679 ((lacpdu->partner_state & LACP_STATE_LACP_ACTIVITY) != (port->actor_oper_port_state & LACP_STATE_LACP_ACTIVITY)) || 680 ((lacpdu->partner_state & LACP_STATE_LACP_TIMEOUT) != (port->actor_oper_port_state & LACP_STATE_LACP_TIMEOUT)) || 681 ((lacpdu->partner_state & LACP_STATE_SYNCHRONIZATION) != (port->actor_oper_port_state & LACP_STATE_SYNCHRONIZATION)) || 682 ((lacpdu->partner_state & LACP_STATE_AGGREGATION) != (port->actor_oper_port_state & LACP_STATE_AGGREGATION)) 683 ) { 684 port->ntt = true; 685 } 686 } 687 } 688 689 /** 690 * __agg_ports_are_ready - check if all ports in an aggregator are ready 691 * @aggregator: the aggregator we're looking at 692 * 693 */ 694 static int __agg_ports_are_ready(struct aggregator *aggregator) 695 { 696 struct port *port; 697 int retval = 1; 698 699 if (aggregator) { 700 /* scan all ports in this aggregator to verfy if they are 701 * all ready. 
702 */ 703 for (port = aggregator->lag_ports; 704 port; 705 port = port->next_port_in_aggregator) { 706 if (!(port->sm_vars & AD_PORT_READY_N)) { 707 retval = 0; 708 break; 709 } 710 } 711 } 712 713 return retval; 714 } 715 716 /** 717 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator 718 * @aggregator: the aggregator we're looking at 719 * @val: Should the ports' ready bit be set on or off 720 * 721 */ 722 static void __set_agg_ports_ready(struct aggregator *aggregator, int val) 723 { 724 struct port *port; 725 726 for (port = aggregator->lag_ports; port; 727 port = port->next_port_in_aggregator) { 728 if (val) 729 port->sm_vars |= AD_PORT_READY; 730 else 731 port->sm_vars &= ~AD_PORT_READY; 732 } 733 } 734 735 static int __agg_active_ports(struct aggregator *agg) 736 { 737 struct port *port; 738 int active = 0; 739 740 for (port = agg->lag_ports; port; 741 port = port->next_port_in_aggregator) { 742 if (port->is_enabled) 743 active++; 744 } 745 746 return active; 747 } 748 749 /** 750 * __get_agg_bandwidth - get the total bandwidth of an aggregator 751 * @aggregator: the aggregator we're looking at 752 * 753 */ 754 static u32 __get_agg_bandwidth(struct aggregator *aggregator) 755 { 756 int nports = __agg_active_ports(aggregator); 757 u32 bandwidth = 0; 758 759 if (nports) { 760 switch (__get_link_speed(aggregator->lag_ports)) { 761 case AD_LINK_SPEED_1MBPS: 762 bandwidth = nports; 763 break; 764 case AD_LINK_SPEED_10MBPS: 765 bandwidth = nports * 10; 766 break; 767 case AD_LINK_SPEED_100MBPS: 768 bandwidth = nports * 100; 769 break; 770 case AD_LINK_SPEED_1000MBPS: 771 bandwidth = nports * 1000; 772 break; 773 case AD_LINK_SPEED_2500MBPS: 774 bandwidth = nports * 2500; 775 break; 776 case AD_LINK_SPEED_5000MBPS: 777 bandwidth = nports * 5000; 778 break; 779 case AD_LINK_SPEED_10000MBPS: 780 bandwidth = nports * 10000; 781 break; 782 case AD_LINK_SPEED_14000MBPS: 783 bandwidth = nports * 14000; 784 break; 785 case 
AD_LINK_SPEED_20000MBPS: 786 bandwidth = nports * 20000; 787 break; 788 case AD_LINK_SPEED_25000MBPS: 789 bandwidth = nports * 25000; 790 break; 791 case AD_LINK_SPEED_40000MBPS: 792 bandwidth = nports * 40000; 793 break; 794 case AD_LINK_SPEED_50000MBPS: 795 bandwidth = nports * 50000; 796 break; 797 case AD_LINK_SPEED_56000MBPS: 798 bandwidth = nports * 56000; 799 break; 800 case AD_LINK_SPEED_100000MBPS: 801 bandwidth = nports * 100000; 802 break; 803 case AD_LINK_SPEED_200000MBPS: 804 bandwidth = nports * 200000; 805 break; 806 case AD_LINK_SPEED_400000MBPS: 807 bandwidth = nports * 400000; 808 break; 809 case AD_LINK_SPEED_800000MBPS: 810 bandwidth = nports * 800000; 811 break; 812 default: 813 bandwidth = 0; /* to silence the compiler */ 814 } 815 } 816 return bandwidth; 817 } 818 819 /** 820 * __get_active_agg - get the current active aggregator 821 * @aggregator: the aggregator we're looking at 822 * 823 * Caller must hold RCU lock. 824 */ 825 static struct aggregator *__get_active_agg(struct aggregator *aggregator) 826 { 827 struct bonding *bond = aggregator->slave->bond; 828 struct list_head *iter; 829 struct slave *slave; 830 831 bond_for_each_slave_rcu(bond, slave, iter) 832 if (SLAVE_AD_INFO(slave)->aggregator.is_active) 833 return &(SLAVE_AD_INFO(slave)->aggregator); 834 835 return NULL; 836 } 837 838 /** 839 * __update_lacpdu_from_port - update a port's lacpdu fields 840 * @port: the port we're looking at 841 */ 842 static inline void __update_lacpdu_from_port(struct port *port) 843 { 844 struct lacpdu *lacpdu = &port->lacpdu; 845 const struct port_params *partner = &port->partner_oper; 846 847 /* update current actual Actor parameters 848 * lacpdu->subtype initialized 849 * lacpdu->version_number initialized 850 * lacpdu->tlv_type_actor_info initialized 851 * lacpdu->actor_information_length initialized 852 */ 853 854 lacpdu->actor_system_priority = htons(port->actor_system_priority); 855 lacpdu->actor_system = port->actor_system; 856 
lacpdu->actor_key = htons(port->actor_oper_port_key); 857 lacpdu->actor_port_priority = htons(port->actor_port_priority); 858 lacpdu->actor_port = htons(port->actor_port_number); 859 lacpdu->actor_state = port->actor_oper_port_state; 860 slave_dbg(port->slave->bond->dev, port->slave->dev, 861 "update lacpdu: actor port state %x\n", 862 port->actor_oper_port_state); 863 864 /* lacpdu->reserved_3_1 initialized 865 * lacpdu->tlv_type_partner_info initialized 866 * lacpdu->partner_information_length initialized 867 */ 868 869 lacpdu->partner_system_priority = htons(partner->system_priority); 870 lacpdu->partner_system = partner->system; 871 lacpdu->partner_key = htons(partner->key); 872 lacpdu->partner_port_priority = htons(partner->port_priority); 873 lacpdu->partner_port = htons(partner->port_number); 874 lacpdu->partner_state = partner->port_state; 875 876 /* lacpdu->reserved_3_2 initialized 877 * lacpdu->tlv_type_collector_info initialized 878 * lacpdu->collector_information_length initialized 879 * collector_max_delay initialized 880 * reserved_12[12] initialized 881 * tlv_type_terminator initialized 882 * terminator_length initialized 883 * reserved_50[50] initialized 884 */ 885 } 886 887 /* ================= main 802.3ad protocol code ========================= */ 888 889 /** 890 * ad_lacpdu_send - send out a lacpdu packet on a given port 891 * @port: the port we're looking at 892 * 893 * Returns: 0 on success 894 * < 0 on error 895 */ 896 static int ad_lacpdu_send(struct port *port) 897 { 898 struct slave *slave = port->slave; 899 struct sk_buff *skb; 900 struct lacpdu_header *lacpdu_header; 901 int length = sizeof(struct lacpdu_header); 902 903 skb = dev_alloc_skb(length); 904 if (!skb) 905 return -ENOMEM; 906 907 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_tx); 908 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.lacpdu_tx); 909 910 skb->dev = slave->dev; 911 skb_reset_mac_header(skb); 912 skb->network_header = skb->mac_header + ETH_HLEN; 913 skb->protocol = 
PKT_TYPE_LACPDU; 914 skb->priority = TC_PRIO_CONTROL; 915 916 lacpdu_header = skb_put(skb, length); 917 918 ether_addr_copy(lacpdu_header->hdr.h_dest, lacpdu_mcast_addr); 919 /* Note: source address is set to be the member's PERMANENT address, 920 * because we use it to identify loopback lacpdus in receive. 921 */ 922 ether_addr_copy(lacpdu_header->hdr.h_source, slave->perm_hwaddr); 923 lacpdu_header->hdr.h_proto = PKT_TYPE_LACPDU; 924 925 lacpdu_header->lacpdu = port->lacpdu; 926 927 dev_queue_xmit(skb); 928 929 return 0; 930 } 931 932 /** 933 * ad_marker_send - send marker information/response on a given port 934 * @port: the port we're looking at 935 * @marker: marker data to send 936 * 937 * Returns: 0 on success 938 * < 0 on error 939 */ 940 static int ad_marker_send(struct port *port, struct bond_marker *marker) 941 { 942 struct slave *slave = port->slave; 943 struct sk_buff *skb; 944 struct bond_marker_header *marker_header; 945 int length = sizeof(struct bond_marker_header); 946 947 skb = dev_alloc_skb(length + 16); 948 if (!skb) 949 return -ENOMEM; 950 951 switch (marker->tlv_type) { 952 case AD_MARKER_INFORMATION_SUBTYPE: 953 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.marker_tx); 954 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.marker_tx); 955 break; 956 case AD_MARKER_RESPONSE_SUBTYPE: 957 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.marker_resp_tx); 958 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.marker_resp_tx); 959 break; 960 } 961 962 skb_reserve(skb, 16); 963 964 skb->dev = slave->dev; 965 skb_reset_mac_header(skb); 966 skb->network_header = skb->mac_header + ETH_HLEN; 967 skb->protocol = PKT_TYPE_LACPDU; 968 969 marker_header = skb_put(skb, length); 970 971 ether_addr_copy(marker_header->hdr.h_dest, lacpdu_mcast_addr); 972 /* Note: source address is set to be the member's PERMANENT address, 973 * because we use it to identify loopback MARKERs in receive. 
974 */ 975 ether_addr_copy(marker_header->hdr.h_source, slave->perm_hwaddr); 976 marker_header->hdr.h_proto = PKT_TYPE_LACPDU; 977 978 marker_header->marker = *marker; 979 980 dev_queue_xmit(skb); 981 982 return 0; 983 } 984 985 static void ad_cond_set_peer_notif(struct port *port) 986 { 987 struct bonding *bond = port->slave->bond; 988 989 if (bond->params.broadcast_neighbor && rtnl_trylock()) { 990 bond->send_peer_notif = bond->params.num_peer_notif * 991 max(1, bond->params.peer_notif_delay); 992 rtnl_unlock(); 993 } 994 } 995 996 /** 997 * ad_mux_machine - handle a port's mux state machine 998 * @port: the port we're looking at 999 * @update_slave_arr: Does slave array need update? 1000 */ 1001 static void ad_mux_machine(struct port *port, bool *update_slave_arr) 1002 { 1003 struct bonding *bond = __get_bond_by_port(port); 1004 mux_states_t last_state; 1005 1006 /* keep current State Machine state to compare later if it was 1007 * changed 1008 */ 1009 last_state = port->sm_mux_state; 1010 1011 if (port->sm_vars & AD_PORT_BEGIN) { 1012 port->sm_mux_state = AD_MUX_DETACHED; 1013 } else { 1014 switch (port->sm_mux_state) { 1015 case AD_MUX_DETACHED: 1016 if ((port->sm_vars & AD_PORT_SELECTED) 1017 || (port->sm_vars & AD_PORT_STANDBY)) 1018 /* if SELECTED or STANDBY */ 1019 port->sm_mux_state = AD_MUX_WAITING; 1020 break; 1021 case AD_MUX_WAITING: 1022 /* if SELECTED == FALSE return to DETACH state */ 1023 if (!(port->sm_vars & AD_PORT_SELECTED)) { 1024 port->sm_vars &= ~AD_PORT_READY_N; 1025 /* in order to withhold the Selection Logic to 1026 * check all ports READY_N value every callback 1027 * cycle to update ready variable, we check 1028 * READY_N and update READY here 1029 */ 1030 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator)); 1031 port->sm_mux_state = AD_MUX_DETACHED; 1032 break; 1033 } 1034 1035 /* check if the wait_while_timer expired */ 1036 if (port->sm_mux_timer_counter 1037 && !(--port->sm_mux_timer_counter)) 1038 
port->sm_vars |= AD_PORT_READY_N; 1039 1040 /* in order to withhold the selection logic to check 1041 * all ports READY_N value every callback cycle to 1042 * update ready variable, we check READY_N and update 1043 * READY here 1044 */ 1045 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator)); 1046 1047 /* if the wait_while_timer expired, and the port is 1048 * in READY state, move to ATTACHED state 1049 */ 1050 if ((port->sm_vars & AD_PORT_READY) 1051 && !port->sm_mux_timer_counter) 1052 port->sm_mux_state = AD_MUX_ATTACHED; 1053 break; 1054 case AD_MUX_ATTACHED: 1055 /* check also if agg_select_timer expired (so the 1056 * edable port will take place only after this timer) 1057 */ 1058 if ((port->sm_vars & AD_PORT_SELECTED) && 1059 (port->partner_oper.port_state & LACP_STATE_SYNCHRONIZATION) && 1060 !__check_agg_selection_timer(port)) { 1061 if (port->aggregator->is_active) { 1062 int state = AD_MUX_COLLECTING_DISTRIBUTING; 1063 1064 if (!bond->params.coupled_control) 1065 state = AD_MUX_COLLECTING; 1066 port->sm_mux_state = state; 1067 } 1068 } else if (!(port->sm_vars & AD_PORT_SELECTED) || 1069 (port->sm_vars & AD_PORT_STANDBY)) { 1070 /* if UNSELECTED or STANDBY */ 1071 port->sm_vars &= ~AD_PORT_READY_N; 1072 /* in order to withhold the selection logic to 1073 * check all ports READY_N value every callback 1074 * cycle to update ready variable, we check 1075 * READY_N and update READY here 1076 */ 1077 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator)); 1078 port->sm_mux_state = AD_MUX_DETACHED; 1079 } else if (port->aggregator->is_active) { 1080 port->actor_oper_port_state |= 1081 LACP_STATE_SYNCHRONIZATION; 1082 } 1083 break; 1084 case AD_MUX_COLLECTING_DISTRIBUTING: 1085 if (!__port_move_to_attached_state(port)) { 1086 /* if port state hasn't changed make 1087 * sure that a collecting distributing 1088 * port in an active aggregator is enabled 1089 */ 1090 if (port->aggregator->is_active && 1091 
!__port_is_collecting_distributing(port)) { 1092 __enable_port(port); 1093 *update_slave_arr = true; 1094 } 1095 } 1096 break; 1097 case AD_MUX_COLLECTING: 1098 if (!__port_move_to_attached_state(port)) { 1099 if ((port->sm_vars & AD_PORT_SELECTED) && 1100 (port->partner_oper.port_state & LACP_STATE_SYNCHRONIZATION) && 1101 (port->partner_oper.port_state & LACP_STATE_COLLECTING)) { 1102 port->sm_mux_state = AD_MUX_DISTRIBUTING; 1103 } else { 1104 /* If port state hasn't changed, make sure that a collecting 1105 * port is enabled for an active aggregator. 1106 */ 1107 struct slave *slave = port->slave; 1108 1109 if (port->aggregator->is_active && 1110 bond_is_slave_rx_disabled(slave)) { 1111 ad_enable_collecting(port); 1112 *update_slave_arr = true; 1113 } 1114 } 1115 } 1116 break; 1117 case AD_MUX_DISTRIBUTING: 1118 if (!(port->sm_vars & AD_PORT_SELECTED) || 1119 (port->sm_vars & AD_PORT_STANDBY) || 1120 !(port->partner_oper.port_state & LACP_STATE_COLLECTING) || 1121 !(port->partner_oper.port_state & LACP_STATE_SYNCHRONIZATION) || 1122 !(port->actor_oper_port_state & LACP_STATE_SYNCHRONIZATION)) { 1123 port->sm_mux_state = AD_MUX_COLLECTING; 1124 } else { 1125 /* if port state hasn't changed make 1126 * sure that a collecting distributing 1127 * port in an active aggregator is enabled 1128 */ 1129 if (port->aggregator && 1130 port->aggregator->is_active && 1131 !__port_is_collecting_distributing(port)) { 1132 __enable_port(port); 1133 *update_slave_arr = true; 1134 } 1135 } 1136 break; 1137 default: 1138 break; 1139 } 1140 } 1141 1142 /* check if the state machine was changed */ 1143 if (port->sm_mux_state != last_state) { 1144 slave_dbg(port->slave->bond->dev, port->slave->dev, 1145 "Mux Machine: Port=%d, Last State=%d, Curr State=%d\n", 1146 port->actor_port_number, 1147 last_state, 1148 port->sm_mux_state); 1149 switch (port->sm_mux_state) { 1150 case AD_MUX_DETACHED: 1151 port->actor_oper_port_state &= ~LACP_STATE_SYNCHRONIZATION; 1152 
ad_disable_collecting_distributing(port, 1153 update_slave_arr); 1154 port->actor_oper_port_state &= ~LACP_STATE_COLLECTING; 1155 port->actor_oper_port_state &= ~LACP_STATE_DISTRIBUTING; 1156 port->ntt = true; 1157 break; 1158 case AD_MUX_WAITING: 1159 port->sm_mux_timer_counter = __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER, 0); 1160 break; 1161 case AD_MUX_ATTACHED: 1162 if (port->aggregator->is_active) 1163 port->actor_oper_port_state |= 1164 LACP_STATE_SYNCHRONIZATION; 1165 else 1166 port->actor_oper_port_state &= 1167 ~LACP_STATE_SYNCHRONIZATION; 1168 port->actor_oper_port_state &= ~LACP_STATE_COLLECTING; 1169 port->actor_oper_port_state &= ~LACP_STATE_DISTRIBUTING; 1170 ad_disable_collecting_distributing(port, 1171 update_slave_arr); 1172 port->ntt = true; 1173 break; 1174 case AD_MUX_COLLECTING_DISTRIBUTING: 1175 port->actor_oper_port_state |= LACP_STATE_COLLECTING; 1176 port->actor_oper_port_state |= LACP_STATE_DISTRIBUTING; 1177 port->actor_oper_port_state |= LACP_STATE_SYNCHRONIZATION; 1178 ad_enable_collecting_distributing(port, 1179 update_slave_arr); 1180 port->ntt = true; 1181 break; 1182 case AD_MUX_COLLECTING: 1183 port->actor_oper_port_state |= LACP_STATE_COLLECTING; 1184 port->actor_oper_port_state &= ~LACP_STATE_DISTRIBUTING; 1185 port->actor_oper_port_state |= LACP_STATE_SYNCHRONIZATION; 1186 ad_enable_collecting(port); 1187 ad_disable_distributing(port, update_slave_arr); 1188 port->ntt = true; 1189 break; 1190 case AD_MUX_DISTRIBUTING: 1191 port->actor_oper_port_state |= LACP_STATE_DISTRIBUTING; 1192 port->actor_oper_port_state |= LACP_STATE_SYNCHRONIZATION; 1193 ad_enable_collecting_distributing(port, 1194 update_slave_arr); 1195 break; 1196 default: 1197 break; 1198 } 1199 } 1200 } 1201 1202 /** 1203 * ad_rx_machine - handle a port's rx State Machine 1204 * @lacpdu: the lacpdu we've received 1205 * @port: the port we're looking at 1206 * 1207 * If lacpdu arrived, stop previous timer (if exists) and set the next state as 1208 * CURRENT. 
If timer expired set the state machine in the proper state. 1209 * In other cases, this function checks if we need to switch to other state. 1210 */ 1211 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port) 1212 { 1213 rx_states_t last_state; 1214 1215 /* keep current State Machine state to compare later if it was 1216 * changed 1217 */ 1218 last_state = port->sm_rx_state; 1219 1220 if (lacpdu) { 1221 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.lacpdu_rx); 1222 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.lacpdu_rx); 1223 } 1224 /* check if state machine should change state */ 1225 1226 /* first, check if port was reinitialized */ 1227 if (port->sm_vars & AD_PORT_BEGIN) { 1228 port->sm_rx_state = AD_RX_INITIALIZE; 1229 port->sm_vars |= AD_PORT_CHURNED; 1230 /* check if port is not enabled */ 1231 } else if (!(port->sm_vars & AD_PORT_BEGIN) && !port->is_enabled) 1232 port->sm_rx_state = AD_RX_PORT_DISABLED; 1233 /* check if new lacpdu arrived */ 1234 else if (lacpdu && ((port->sm_rx_state == AD_RX_EXPIRED) || 1235 (port->sm_rx_state == AD_RX_DEFAULTED) || 1236 (port->sm_rx_state == AD_RX_CURRENT))) { 1237 if (port->sm_rx_state != AD_RX_CURRENT) 1238 port->sm_vars |= AD_PORT_CHURNED; 1239 port->sm_rx_timer_counter = 0; 1240 port->sm_rx_state = AD_RX_CURRENT; 1241 } else { 1242 /* if timer is on, and if it is expired */ 1243 if (port->sm_rx_timer_counter && 1244 !(--port->sm_rx_timer_counter)) { 1245 switch (port->sm_rx_state) { 1246 case AD_RX_EXPIRED: 1247 port->sm_rx_state = AD_RX_DEFAULTED; 1248 break; 1249 case AD_RX_CURRENT: 1250 port->sm_rx_state = AD_RX_EXPIRED; 1251 break; 1252 default: 1253 break; 1254 } 1255 } else { 1256 /* if no lacpdu arrived and no timer is on */ 1257 switch (port->sm_rx_state) { 1258 case AD_RX_PORT_DISABLED: 1259 if (port->is_enabled && 1260 (port->sm_vars & AD_PORT_LACP_ENABLED)) 1261 port->sm_rx_state = AD_RX_EXPIRED; 1262 else if (port->is_enabled 1263 && ((port->sm_vars 1264 & AD_PORT_LACP_ENABLED) == 0)) 
1265 port->sm_rx_state = AD_RX_LACP_DISABLED; 1266 break; 1267 default: 1268 break; 1269 1270 } 1271 } 1272 } 1273 1274 /* check if the State machine was changed or new lacpdu arrived */ 1275 if ((port->sm_rx_state != last_state) || (lacpdu)) { 1276 slave_dbg(port->slave->bond->dev, port->slave->dev, 1277 "Rx Machine: Port=%d, Last State=%d, Curr State=%d\n", 1278 port->actor_port_number, 1279 last_state, 1280 port->sm_rx_state); 1281 switch (port->sm_rx_state) { 1282 case AD_RX_INITIALIZE: 1283 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS)) 1284 port->sm_vars &= ~AD_PORT_LACP_ENABLED; 1285 else 1286 port->sm_vars |= AD_PORT_LACP_ENABLED; 1287 port->sm_vars &= ~AD_PORT_SELECTED; 1288 __record_default(port); 1289 port->actor_oper_port_state &= ~LACP_STATE_EXPIRED; 1290 port->sm_rx_state = AD_RX_PORT_DISABLED; 1291 1292 fallthrough; 1293 case AD_RX_PORT_DISABLED: 1294 port->sm_vars &= ~AD_PORT_MATCHED; 1295 break; 1296 case AD_RX_LACP_DISABLED: 1297 port->sm_vars &= ~AD_PORT_SELECTED; 1298 __record_default(port); 1299 port->partner_oper.port_state &= ~LACP_STATE_AGGREGATION; 1300 port->sm_vars |= AD_PORT_MATCHED; 1301 port->actor_oper_port_state &= ~LACP_STATE_EXPIRED; 1302 break; 1303 case AD_RX_EXPIRED: 1304 /* Reset of the Synchronization flag (Standard 43.4.12) 1305 * This reset cause to disable this port in the 1306 * COLLECTING_DISTRIBUTING state of the mux machine in 1307 * case of EXPIRED even if LINK_DOWN didn't arrive for 1308 * the port. 
1309 */ 1310 port->sm_vars &= ~AD_PORT_MATCHED; 1311 /* Based on IEEE 8021AX-2014, Figure 6-18 - Receive 1312 * machine state diagram, the statue should be 1313 * Partner_Oper_Port_State.Synchronization = FALSE; 1314 * Partner_Oper_Port_State.LACP_Timeout = Short Timeout; 1315 * start current_while_timer(Short Timeout); 1316 * Actor_Oper_Port_State.Expired = TRUE; 1317 */ 1318 port->partner_oper.port_state &= ~LACP_STATE_SYNCHRONIZATION; 1319 port->partner_oper.port_state |= LACP_STATE_LACP_TIMEOUT; 1320 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT)); 1321 port->actor_oper_port_state |= LACP_STATE_EXPIRED; 1322 port->sm_vars |= AD_PORT_CHURNED; 1323 break; 1324 case AD_RX_DEFAULTED: 1325 __update_default_selected(port); 1326 __record_default(port); 1327 port->sm_vars |= AD_PORT_MATCHED; 1328 port->actor_oper_port_state &= ~LACP_STATE_EXPIRED; 1329 break; 1330 case AD_RX_CURRENT: 1331 /* detect loopback situation */ 1332 if (MAC_ADDRESS_EQUAL(&(lacpdu->actor_system), 1333 &(port->actor_system))) { 1334 slave_err(port->slave->bond->dev, port->slave->dev, "An illegal loopback occurred on slave\n" 1335 "Check the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n"); 1336 return; 1337 } 1338 __update_selected(lacpdu, port); 1339 __update_ntt(lacpdu, port); 1340 __record_pdu(lacpdu, port); 1341 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(port->actor_oper_port_state & LACP_STATE_LACP_TIMEOUT)); 1342 port->actor_oper_port_state &= ~LACP_STATE_EXPIRED; 1343 break; 1344 default: 1345 break; 1346 } 1347 } 1348 } 1349 1350 /** 1351 * ad_churn_machine - handle port churn's state machine 1352 * @port: the port we're looking at 1353 * 1354 */ 1355 static void ad_churn_machine(struct port *port) 1356 { 1357 if (port->sm_vars & AD_PORT_CHURNED) { 1358 port->sm_vars &= ~AD_PORT_CHURNED; 1359 port->sm_churn_actor_state = AD_CHURN_MONITOR; 1360 
port->sm_churn_partner_state = AD_CHURN_MONITOR; 1361 port->sm_churn_actor_timer_counter = 1362 __ad_timer_to_ticks(AD_ACTOR_CHURN_TIMER, 0); 1363 port->sm_churn_partner_timer_counter = 1364 __ad_timer_to_ticks(AD_PARTNER_CHURN_TIMER, 0); 1365 return; 1366 } 1367 if (port->sm_churn_actor_timer_counter && 1368 !(--port->sm_churn_actor_timer_counter) && 1369 port->sm_churn_actor_state == AD_CHURN_MONITOR) { 1370 if (port->actor_oper_port_state & LACP_STATE_SYNCHRONIZATION) { 1371 port->sm_churn_actor_state = AD_NO_CHURN; 1372 } else { 1373 port->churn_actor_count++; 1374 port->sm_churn_actor_state = AD_CHURN; 1375 } 1376 } 1377 if (port->sm_churn_partner_timer_counter && 1378 !(--port->sm_churn_partner_timer_counter) && 1379 port->sm_churn_partner_state == AD_CHURN_MONITOR) { 1380 if (port->partner_oper.port_state & LACP_STATE_SYNCHRONIZATION) { 1381 port->sm_churn_partner_state = AD_NO_CHURN; 1382 } else { 1383 port->churn_partner_count++; 1384 port->sm_churn_partner_state = AD_CHURN; 1385 } 1386 } 1387 } 1388 1389 /** 1390 * ad_tx_machine - handle a port's tx state machine 1391 * @port: the port we're looking at 1392 */ 1393 static void ad_tx_machine(struct port *port) 1394 { 1395 /* check if tx timer expired, to verify that we do not send more than 1396 * 3 packets per second 1397 */ 1398 if (!port->sm_tx_timer_counter || !(--port->sm_tx_timer_counter)) { 1399 /* check if there is something to send */ 1400 if (port->ntt && (port->sm_vars & AD_PORT_LACP_ENABLED)) { 1401 __update_lacpdu_from_port(port); 1402 1403 if (ad_lacpdu_send(port) >= 0) { 1404 slave_dbg(port->slave->bond->dev, 1405 port->slave->dev, 1406 "Sent LACPDU on port %d\n", 1407 port->actor_port_number); 1408 1409 /* mark ntt as false, so it will not be sent 1410 * again until demanded 1411 */ 1412 port->ntt = false; 1413 1414 /* restart tx timer(to verify that we will not 1415 * exceed AD_MAX_TX_IN_SECOND 1416 */ 1417 port->sm_tx_timer_counter = ad_ticks_per_sec / AD_MAX_TX_IN_SECOND; 1418 } 1419 } 
1420 } 1421 } 1422 1423 /** 1424 * ad_periodic_machine - handle a port's periodic state machine 1425 * @port: the port we're looking at 1426 * 1427 * Turn ntt flag on priodically to perform periodic transmission of lacpdu's. 1428 */ 1429 static void ad_periodic_machine(struct port *port) 1430 { 1431 periodic_states_t last_state; 1432 1433 /* keep current state machine state to compare later if it was changed */ 1434 last_state = port->sm_periodic_state; 1435 1436 /* check if port was reinitialized */ 1437 if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) || 1438 (!(port->actor_oper_port_state & LACP_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & LACP_STATE_LACP_ACTIVITY))) { 1439 port->sm_periodic_state = AD_NO_PERIODIC; 1440 } 1441 /* check if state machine should change state */ 1442 else if (port->sm_periodic_timer_counter) { 1443 /* check if periodic state machine expired */ 1444 if (!(--port->sm_periodic_timer_counter)) { 1445 /* if expired then do tx */ 1446 port->sm_periodic_state = AD_PERIODIC_TX; 1447 } else { 1448 /* If not expired, check if there is some new timeout 1449 * parameter from the partner state 1450 */ 1451 switch (port->sm_periodic_state) { 1452 case AD_FAST_PERIODIC: 1453 if (!(port->partner_oper.port_state 1454 & LACP_STATE_LACP_TIMEOUT)) 1455 port->sm_periodic_state = AD_SLOW_PERIODIC; 1456 break; 1457 case AD_SLOW_PERIODIC: 1458 if ((port->partner_oper.port_state & LACP_STATE_LACP_TIMEOUT)) { 1459 port->sm_periodic_timer_counter = 0; 1460 port->sm_periodic_state = AD_PERIODIC_TX; 1461 } 1462 break; 1463 default: 1464 break; 1465 } 1466 } 1467 } else { 1468 switch (port->sm_periodic_state) { 1469 case AD_NO_PERIODIC: 1470 port->sm_periodic_state = AD_FAST_PERIODIC; 1471 break; 1472 case AD_PERIODIC_TX: 1473 if (!(port->partner_oper.port_state & 1474 LACP_STATE_LACP_TIMEOUT)) 1475 port->sm_periodic_state = AD_SLOW_PERIODIC; 1476 else 1477 port->sm_periodic_state = 
AD_FAST_PERIODIC; 1478 break; 1479 default: 1480 break; 1481 } 1482 } 1483 1484 /* check if the state machine was changed */ 1485 if (port->sm_periodic_state != last_state) { 1486 slave_dbg(port->slave->bond->dev, port->slave->dev, 1487 "Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n", 1488 port->actor_port_number, last_state, 1489 port->sm_periodic_state); 1490 switch (port->sm_periodic_state) { 1491 case AD_NO_PERIODIC: 1492 port->sm_periodic_timer_counter = 0; 1493 break; 1494 case AD_FAST_PERIODIC: 1495 /* decrement 1 tick we lost in the PERIODIC_TX cycle */ 1496 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_FAST_PERIODIC_TIME))-1; 1497 break; 1498 case AD_SLOW_PERIODIC: 1499 /* decrement 1 tick we lost in the PERIODIC_TX cycle */ 1500 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_SLOW_PERIODIC_TIME))-1; 1501 break; 1502 case AD_PERIODIC_TX: 1503 port->ntt = true; 1504 break; 1505 default: 1506 break; 1507 } 1508 } 1509 } 1510 1511 /** 1512 * ad_port_selection_logic - select aggregation groups 1513 * @port: the port we're looking at 1514 * @update_slave_arr: Does slave array need update? 1515 * 1516 * Select aggregation groups, and assign each port for it's aggregetor. The 1517 * selection logic is called in the inititalization (after all the handshkes), 1518 * and after every lacpdu receive (if selected is off). 
1519 */ 1520 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr) 1521 { 1522 struct aggregator *aggregator, *free_aggregator = NULL, *temp_aggregator; 1523 struct port *last_port = NULL, *curr_port; 1524 struct list_head *iter; 1525 struct bonding *bond; 1526 struct slave *slave; 1527 int found = 0; 1528 1529 /* if the port is already Selected, do nothing */ 1530 if (port->sm_vars & AD_PORT_SELECTED) 1531 return; 1532 1533 bond = __get_bond_by_port(port); 1534 1535 /* if the port is connected to other aggregator, detach it */ 1536 if (port->aggregator) { 1537 /* detach the port from its former aggregator */ 1538 temp_aggregator = port->aggregator; 1539 for (curr_port = temp_aggregator->lag_ports; curr_port; 1540 last_port = curr_port, 1541 curr_port = curr_port->next_port_in_aggregator) { 1542 if (curr_port == port) { 1543 temp_aggregator->num_of_ports--; 1544 /* if it is the first port attached to the 1545 * aggregator 1546 */ 1547 if (!last_port) { 1548 temp_aggregator->lag_ports = 1549 port->next_port_in_aggregator; 1550 } else { 1551 /* not the first port attached to the 1552 * aggregator 1553 */ 1554 last_port->next_port_in_aggregator = 1555 port->next_port_in_aggregator; 1556 } 1557 1558 /* clear the port's relations to this 1559 * aggregator 1560 */ 1561 port->aggregator = NULL; 1562 port->next_port_in_aggregator = NULL; 1563 port->actor_port_aggregator_identifier = 0; 1564 1565 slave_dbg(bond->dev, port->slave->dev, "Port %d left LAG %d\n", 1566 port->actor_port_number, 1567 temp_aggregator->aggregator_identifier); 1568 /* if the aggregator is empty, clear its 1569 * parameters, and set it ready to be attached 1570 */ 1571 if (!temp_aggregator->lag_ports) 1572 ad_clear_agg(temp_aggregator); 1573 break; 1574 } 1575 } 1576 if (!curr_port) { 1577 /* meaning: the port was related to an aggregator 1578 * but was not on the aggregator port list 1579 */ 1580 net_warn_ratelimited("%s: (slave %s): Warning: Port %d was related to aggregator 
%d but was not on its port list\n", 1581 port->slave->bond->dev->name, 1582 port->slave->dev->name, 1583 port->actor_port_number, 1584 port->aggregator->aggregator_identifier); 1585 } 1586 } 1587 /* search on all aggregators for a suitable aggregator for this port */ 1588 bond_for_each_slave(bond, slave, iter) { 1589 aggregator = &(SLAVE_AD_INFO(slave)->aggregator); 1590 1591 /* keep a free aggregator for later use(if needed) */ 1592 if (!aggregator->lag_ports) { 1593 if (!free_aggregator) 1594 free_aggregator = aggregator; 1595 continue; 1596 } 1597 /* check if current aggregator suits us */ 1598 if (((aggregator->actor_oper_aggregator_key == port->actor_oper_port_key) && /* if all parameters match AND */ 1599 MAC_ADDRESS_EQUAL(&(aggregator->partner_system), &(port->partner_oper.system)) && 1600 (aggregator->partner_system_priority == port->partner_oper.system_priority) && 1601 (aggregator->partner_oper_aggregator_key == port->partner_oper.key) 1602 ) && 1603 ((__agg_has_partner(aggregator) && /* partner answers */ 1604 !aggregator->is_individual) /* but is not individual OR */ 1605 ) 1606 ) { 1607 /* attach to the founded aggregator */ 1608 port->aggregator = aggregator; 1609 port->actor_port_aggregator_identifier = 1610 port->aggregator->aggregator_identifier; 1611 port->next_port_in_aggregator = aggregator->lag_ports; 1612 port->aggregator->num_of_ports++; 1613 aggregator->lag_ports = port; 1614 slave_dbg(bond->dev, slave->dev, "Port %d joined LAG %d (existing LAG)\n", 1615 port->actor_port_number, 1616 port->aggregator->aggregator_identifier); 1617 1618 /* mark this port as selected */ 1619 port->sm_vars |= AD_PORT_SELECTED; 1620 found = 1; 1621 break; 1622 } 1623 } 1624 1625 /* the port couldn't find an aggregator - attach it to a new 1626 * aggregator 1627 */ 1628 if (!found) { 1629 if (free_aggregator) { 1630 /* assign port a new aggregator */ 1631 port->aggregator = free_aggregator; 1632 port->actor_port_aggregator_identifier = 1633 
port->aggregator->aggregator_identifier; 1634 1635 /* update the new aggregator's parameters 1636 * if port was responsed from the end-user 1637 */ 1638 if (port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS) 1639 /* if port is full duplex */ 1640 port->aggregator->is_individual = false; 1641 else 1642 port->aggregator->is_individual = true; 1643 1644 port->aggregator->actor_admin_aggregator_key = 1645 port->actor_admin_port_key; 1646 port->aggregator->actor_oper_aggregator_key = 1647 port->actor_oper_port_key; 1648 port->aggregator->partner_system = 1649 port->partner_oper.system; 1650 port->aggregator->partner_system_priority = 1651 port->partner_oper.system_priority; 1652 port->aggregator->partner_oper_aggregator_key = port->partner_oper.key; 1653 port->aggregator->receive_state = 1; 1654 port->aggregator->transmit_state = 1; 1655 port->aggregator->lag_ports = port; 1656 port->aggregator->num_of_ports++; 1657 1658 /* mark this port as selected */ 1659 port->sm_vars |= AD_PORT_SELECTED; 1660 1661 slave_dbg(bond->dev, port->slave->dev, "Port %d joined LAG %d (new LAG)\n", 1662 port->actor_port_number, 1663 port->aggregator->aggregator_identifier); 1664 } else { 1665 slave_err(bond->dev, port->slave->dev, 1666 "Port %d did not find a suitable aggregator\n", 1667 port->actor_port_number); 1668 return; 1669 } 1670 } 1671 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE 1672 * in all aggregator's ports, else set ready=FALSE in all 1673 * aggregator's ports 1674 */ 1675 __set_agg_ports_ready(port->aggregator, 1676 __agg_ports_are_ready(port->aggregator)); 1677 1678 aggregator = __get_first_agg(port); 1679 ad_agg_selection_logic(aggregator, update_slave_arr); 1680 1681 if (!port->aggregator->is_active) 1682 port->actor_oper_port_state &= ~LACP_STATE_SYNCHRONIZATION; 1683 } 1684 1685 /* Decide if "agg" is a better choice for the new active aggregator that 1686 * the current best, according to the ad_select policy. 
1687 */ 1688 static struct aggregator *ad_agg_selection_test(struct aggregator *best, 1689 struct aggregator *curr) 1690 { 1691 /* 0. If no best, select current. 1692 * 1693 * 1. If the current agg is not individual, and the best is 1694 * individual, select current. 1695 * 1696 * 2. If current agg is individual and the best is not, keep best. 1697 * 1698 * 3. Therefore, current and best are both individual or both not 1699 * individual, so: 1700 * 1701 * 3a. If current agg partner replied, and best agg partner did not, 1702 * select current. 1703 * 1704 * 3b. If current agg partner did not reply and best agg partner 1705 * did reply, keep best. 1706 * 1707 * 4. Therefore, current and best both have partner replies or 1708 * both do not, so perform selection policy: 1709 * 1710 * BOND_AD_COUNT: Select by count of ports. If count is equal, 1711 * select by bandwidth. 1712 * 1713 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth. 1714 */ 1715 if (!best) 1716 return curr; 1717 1718 if (!curr->is_individual && best->is_individual) 1719 return curr; 1720 1721 if (curr->is_individual && !best->is_individual) 1722 return best; 1723 1724 if (__agg_has_partner(curr) && !__agg_has_partner(best)) 1725 return curr; 1726 1727 if (!__agg_has_partner(curr) && __agg_has_partner(best)) 1728 return best; 1729 1730 switch (__get_agg_selection_mode(curr->lag_ports)) { 1731 case BOND_AD_COUNT: 1732 if (__agg_active_ports(curr) > __agg_active_ports(best)) 1733 return curr; 1734 1735 if (__agg_active_ports(curr) < __agg_active_ports(best)) 1736 return best; 1737 1738 fallthrough; 1739 case BOND_AD_STABLE: 1740 case BOND_AD_BANDWIDTH: 1741 if (__get_agg_bandwidth(curr) > __get_agg_bandwidth(best)) 1742 return curr; 1743 1744 break; 1745 1746 default: 1747 net_warn_ratelimited("%s: (slave %s): Impossible agg select mode %d\n", 1748 curr->slave->bond->dev->name, 1749 curr->slave->dev->name, 1750 __get_agg_selection_mode(curr->lag_ports)); 1751 break; 1752 } 1753 1754 return best; 
1755 } 1756 1757 static int agg_device_up(const struct aggregator *agg) 1758 { 1759 struct port *port = agg->lag_ports; 1760 1761 if (!port) 1762 return 0; 1763 1764 for (port = agg->lag_ports; port; 1765 port = port->next_port_in_aggregator) { 1766 if (netif_running(port->slave->dev) && 1767 netif_carrier_ok(port->slave->dev)) 1768 return 1; 1769 } 1770 1771 return 0; 1772 } 1773 1774 /** 1775 * ad_agg_selection_logic - select an aggregation group for a team 1776 * @agg: the aggregator we're looking at 1777 * @update_slave_arr: Does slave array need update? 1778 * 1779 * It is assumed that only one aggregator may be selected for a team. 1780 * 1781 * The logic of this function is to select the aggregator according to 1782 * the ad_select policy: 1783 * 1784 * BOND_AD_STABLE: select the aggregator with the most ports attached to 1785 * it, and to reselect the active aggregator only if the previous 1786 * aggregator has no more ports related to it. 1787 * 1788 * BOND_AD_BANDWIDTH: select the aggregator with the highest total 1789 * bandwidth, and reselect whenever a link state change takes place or the 1790 * set of slaves in the bond changes. 1791 * 1792 * BOND_AD_COUNT: select the aggregator with largest number of ports 1793 * (slaves), and reselect whenever a link state change takes place or the 1794 * set of slaves in the bond changes. 1795 * 1796 * FIXME: this function MUST be called with the first agg in the bond, or 1797 * __get_active_agg() won't work correctly. This function should be better 1798 * called with the bond itself, and retrieve the first agg from it. 
1799 */ 1800 static void ad_agg_selection_logic(struct aggregator *agg, 1801 bool *update_slave_arr) 1802 { 1803 struct aggregator *best, *active, *origin; 1804 struct bonding *bond = agg->slave->bond; 1805 struct list_head *iter; 1806 struct slave *slave; 1807 struct port *port; 1808 1809 rcu_read_lock(); 1810 origin = agg; 1811 active = __get_active_agg(agg); 1812 best = (active && agg_device_up(active)) ? active : NULL; 1813 1814 bond_for_each_slave_rcu(bond, slave, iter) { 1815 agg = &(SLAVE_AD_INFO(slave)->aggregator); 1816 1817 agg->is_active = 0; 1818 1819 if (__agg_active_ports(agg) && agg_device_up(agg)) 1820 best = ad_agg_selection_test(best, agg); 1821 } 1822 1823 if (best && 1824 __get_agg_selection_mode(best->lag_ports) == BOND_AD_STABLE) { 1825 /* For the STABLE policy, don't replace the old active 1826 * aggregator if it's still active (it has an answering 1827 * partner) or if both the best and active don't have an 1828 * answering partner. 1829 */ 1830 if (active && active->lag_ports && 1831 __agg_active_ports(active) && 1832 (__agg_has_partner(active) || 1833 (!__agg_has_partner(active) && 1834 !__agg_has_partner(best)))) { 1835 if (!(!active->actor_oper_aggregator_key && 1836 best->actor_oper_aggregator_key)) { 1837 best = NULL; 1838 active->is_active = 1; 1839 } 1840 } 1841 } 1842 1843 if (best && (best == active)) { 1844 best = NULL; 1845 active->is_active = 1; 1846 } 1847 1848 /* if there is new best aggregator, activate it */ 1849 if (best) { 1850 netdev_dbg(bond->dev, "(slave %s): best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n", 1851 best->slave ? best->slave->dev->name : "NULL", 1852 best->aggregator_identifier, best->num_of_ports, 1853 best->actor_oper_aggregator_key, 1854 best->partner_oper_aggregator_key, 1855 best->is_individual, best->is_active); 1856 netdev_dbg(bond->dev, "(slave %s): best ports %p slave %p\n", 1857 best->slave ? 
best->slave->dev->name : "NULL", 1858 best->lag_ports, best->slave); 1859 1860 bond_for_each_slave_rcu(bond, slave, iter) { 1861 agg = &(SLAVE_AD_INFO(slave)->aggregator); 1862 1863 slave_dbg(bond->dev, slave->dev, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n", 1864 agg->aggregator_identifier, agg->num_of_ports, 1865 agg->actor_oper_aggregator_key, 1866 agg->partner_oper_aggregator_key, 1867 agg->is_individual, agg->is_active); 1868 } 1869 1870 /* check if any partner replies */ 1871 if (best->is_individual) 1872 net_warn_ratelimited("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n", 1873 bond->dev->name); 1874 1875 best->is_active = 1; 1876 netdev_dbg(bond->dev, "(slave %s): LAG %d chosen as the active LAG\n", 1877 best->slave ? best->slave->dev->name : "NULL", 1878 best->aggregator_identifier); 1879 netdev_dbg(bond->dev, "(slave %s): Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n", 1880 best->slave ? best->slave->dev->name : "NULL", 1881 best->aggregator_identifier, best->num_of_ports, 1882 best->actor_oper_aggregator_key, 1883 best->partner_oper_aggregator_key, 1884 best->is_individual, best->is_active); 1885 1886 /* disable the ports that were related to the former 1887 * active_aggregator 1888 */ 1889 if (active) { 1890 for (port = active->lag_ports; port; 1891 port = port->next_port_in_aggregator) { 1892 __disable_port(port); 1893 } 1894 } 1895 /* Slave array needs update. 
*/ 1896 *update_slave_arr = true; 1897 } 1898 1899 /* if the selected aggregator is of join individuals 1900 * (partner_system is NULL), enable their ports 1901 */ 1902 active = __get_active_agg(origin); 1903 1904 if (active) { 1905 if (!__agg_has_partner(active)) { 1906 for (port = active->lag_ports; port; 1907 port = port->next_port_in_aggregator) { 1908 __enable_port(port); 1909 } 1910 *update_slave_arr = true; 1911 } 1912 } 1913 1914 rcu_read_unlock(); 1915 1916 bond_3ad_set_carrier(bond); 1917 } 1918 1919 /** 1920 * ad_clear_agg - clear a given aggregator's parameters 1921 * @aggregator: the aggregator we're looking at 1922 */ 1923 static void ad_clear_agg(struct aggregator *aggregator) 1924 { 1925 if (aggregator) { 1926 aggregator->is_individual = false; 1927 aggregator->actor_admin_aggregator_key = 0; 1928 aggregator->actor_oper_aggregator_key = 0; 1929 eth_zero_addr(aggregator->partner_system.mac_addr_value); 1930 aggregator->partner_system_priority = 0; 1931 aggregator->partner_oper_aggregator_key = 0; 1932 aggregator->receive_state = 0; 1933 aggregator->transmit_state = 0; 1934 aggregator->lag_ports = NULL; 1935 aggregator->is_active = 0; 1936 aggregator->num_of_ports = 0; 1937 pr_debug("%s: LAG %d was cleared\n", 1938 aggregator->slave ? 
1939 aggregator->slave->dev->name : "NULL", 1940 aggregator->aggregator_identifier); 1941 } 1942 } 1943 1944 /** 1945 * ad_initialize_agg - initialize a given aggregator's parameters 1946 * @aggregator: the aggregator we're looking at 1947 */ 1948 static void ad_initialize_agg(struct aggregator *aggregator) 1949 { 1950 if (aggregator) { 1951 ad_clear_agg(aggregator); 1952 1953 eth_zero_addr(aggregator->aggregator_mac_address.mac_addr_value); 1954 aggregator->aggregator_identifier = 0; 1955 aggregator->slave = NULL; 1956 } 1957 } 1958 1959 /** 1960 * ad_initialize_port - initialize a given port's parameters 1961 * @port: the port we're looking at 1962 * @bond_params: bond parameters we will use 1963 */ 1964 static void ad_initialize_port(struct port *port, const struct bond_params *bond_params) 1965 { 1966 static const struct port_params tmpl = { 1967 .system_priority = 0xffff, 1968 .key = 1, 1969 .port_number = 1, 1970 .port_priority = 0xff, 1971 .port_state = 0, 1972 }; 1973 static const struct lacpdu lacpdu = { 1974 .subtype = 0x01, 1975 .version_number = 0x01, 1976 .tlv_type_actor_info = 0x01, 1977 .actor_information_length = 0x14, 1978 .tlv_type_partner_info = 0x02, 1979 .partner_information_length = 0x14, 1980 .tlv_type_collector_info = 0x03, 1981 .collector_information_length = 0x10, 1982 .collector_max_delay = htons(AD_COLLECTOR_MAX_DELAY), 1983 }; 1984 1985 if (port) { 1986 port->actor_port_priority = 0xff; 1987 port->actor_port_aggregator_identifier = 0; 1988 port->ntt = false; 1989 port->actor_admin_port_state = LACP_STATE_AGGREGATION; 1990 port->actor_oper_port_state = LACP_STATE_AGGREGATION; 1991 if (bond_params->lacp_active) { 1992 port->actor_admin_port_state |= LACP_STATE_LACP_ACTIVITY; 1993 port->actor_oper_port_state |= LACP_STATE_LACP_ACTIVITY; 1994 } 1995 1996 if (bond_params->lacp_fast) 1997 port->actor_oper_port_state |= LACP_STATE_LACP_TIMEOUT; 1998 1999 memcpy(&port->partner_admin, &tmpl, sizeof(tmpl)); 2000 memcpy(&port->partner_oper, &tmpl, 
sizeof(tmpl)); 2001 2002 port->is_enabled = true; 2003 /* private parameters */ 2004 port->sm_vars = AD_PORT_BEGIN | AD_PORT_LACP_ENABLED; 2005 port->sm_rx_state = 0; 2006 port->sm_rx_timer_counter = 0; 2007 port->sm_periodic_state = 0; 2008 port->sm_periodic_timer_counter = 0; 2009 port->sm_mux_state = 0; 2010 port->sm_mux_timer_counter = 0; 2011 port->sm_tx_state = 0; 2012 port->aggregator = NULL; 2013 port->next_port_in_aggregator = NULL; 2014 port->transaction_id = 0; 2015 2016 port->sm_churn_actor_timer_counter = 0; 2017 port->sm_churn_actor_state = 0; 2018 port->churn_actor_count = 0; 2019 port->sm_churn_partner_timer_counter = 0; 2020 port->sm_churn_partner_state = 0; 2021 port->churn_partner_count = 0; 2022 2023 memcpy(&port->lacpdu, &lacpdu, sizeof(lacpdu)); 2024 } 2025 } 2026 2027 /** 2028 * ad_enable_collecting - enable a port's receive 2029 * @port: the port we're looking at 2030 * 2031 * Enable @port if it's in an active aggregator 2032 */ 2033 static void ad_enable_collecting(struct port *port) 2034 { 2035 if (port->aggregator->is_active) { 2036 struct slave *slave = port->slave; 2037 2038 slave_dbg(slave->bond->dev, slave->dev, 2039 "Enabling collecting on port %d (LAG %d)\n", 2040 port->actor_port_number, 2041 port->aggregator->aggregator_identifier); 2042 __enable_collecting_port(port); 2043 } 2044 } 2045 2046 /** 2047 * ad_disable_distributing - disable a port's transmit 2048 * @port: the port we're looking at 2049 * @update_slave_arr: Does slave array need update? 
2050 */ 2051 static void ad_disable_distributing(struct port *port, bool *update_slave_arr) 2052 { 2053 if (port->aggregator && __agg_has_partner(port->aggregator)) { 2054 slave_dbg(port->slave->bond->dev, port->slave->dev, 2055 "Disabling distributing on port %d (LAG %d)\n", 2056 port->actor_port_number, 2057 port->aggregator->aggregator_identifier); 2058 __disable_distributing_port(port); 2059 /* Slave array needs an update */ 2060 *update_slave_arr = true; 2061 } 2062 } 2063 2064 /** 2065 * ad_enable_collecting_distributing - enable a port's transmit/receive 2066 * @port: the port we're looking at 2067 * @update_slave_arr: Does slave array need update? 2068 * 2069 * Enable @port if it's in an active aggregator 2070 */ 2071 static void ad_enable_collecting_distributing(struct port *port, 2072 bool *update_slave_arr) 2073 { 2074 if (port->aggregator->is_active) { 2075 slave_dbg(port->slave->bond->dev, port->slave->dev, 2076 "Enabling port %d (LAG %d)\n", 2077 port->actor_port_number, 2078 port->aggregator->aggregator_identifier); 2079 __enable_port(port); 2080 /* Slave array needs update */ 2081 *update_slave_arr = true; 2082 /* Should notify peers if possible */ 2083 ad_cond_set_peer_notif(port); 2084 } 2085 } 2086 2087 /** 2088 * ad_disable_collecting_distributing - disable a port's transmit/receive 2089 * @port: the port we're looking at 2090 * @update_slave_arr: Does slave array need update? 
2091 */ 2092 static void ad_disable_collecting_distributing(struct port *port, 2093 bool *update_slave_arr) 2094 { 2095 if (port->aggregator && __agg_has_partner(port->aggregator)) { 2096 slave_dbg(port->slave->bond->dev, port->slave->dev, 2097 "Disabling port %d (LAG %d)\n", 2098 port->actor_port_number, 2099 port->aggregator->aggregator_identifier); 2100 __disable_port(port); 2101 /* Slave array needs an update */ 2102 *update_slave_arr = true; 2103 } 2104 } 2105 2106 /** 2107 * ad_marker_info_received - handle receive of a Marker information frame 2108 * @marker_info: Marker info received 2109 * @port: the port we're looking at 2110 */ 2111 static void ad_marker_info_received(struct bond_marker *marker_info, 2112 struct port *port) 2113 { 2114 struct bond_marker marker; 2115 2116 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.marker_rx); 2117 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.marker_rx); 2118 2119 /* copy the received marker data to the response marker */ 2120 memcpy(&marker, marker_info, sizeof(struct bond_marker)); 2121 /* change the marker subtype to marker response */ 2122 marker.tlv_type = AD_MARKER_RESPONSE_SUBTYPE; 2123 2124 /* send the marker response */ 2125 if (ad_marker_send(port, &marker) >= 0) 2126 slave_dbg(port->slave->bond->dev, port->slave->dev, 2127 "Sent Marker Response on port %d\n", 2128 port->actor_port_number); 2129 } 2130 2131 /** 2132 * ad_marker_response_received - handle receive of a marker response frame 2133 * @marker: marker PDU received 2134 * @port: the port we're looking at 2135 * 2136 * This function does nothing since we decided not to implement send and handle 2137 * response for marker PDU's, in this stage, but only to respond to marker 2138 * information. 
2139 */ 2140 static void ad_marker_response_received(struct bond_marker *marker, 2141 struct port *port) 2142 { 2143 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.marker_resp_rx); 2144 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.marker_resp_rx); 2145 2146 /* DO NOTHING, SINCE WE DECIDED NOT TO IMPLEMENT THIS FEATURE FOR NOW */ 2147 } 2148 2149 /* ========= AD exported functions to the main bonding code ========= */ 2150 2151 /* Check aggregators status in team every T seconds */ 2152 #define AD_AGGREGATOR_SELECTION_TIMER 8 2153 2154 /** 2155 * bond_3ad_initiate_agg_selection - initate aggregator selection 2156 * @bond: bonding struct 2157 * @timeout: timeout value to set 2158 * 2159 * Set the aggregation selection timer, to initiate an agg selection in 2160 * the very near future. Called during first initialization, and during 2161 * any down to up transitions of the bond. 2162 */ 2163 void bond_3ad_initiate_agg_selection(struct bonding *bond, int timeout) 2164 { 2165 atomic_set(&BOND_AD_INFO(bond).agg_select_timer, timeout); 2166 } 2167 2168 /** 2169 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures 2170 * @bond: bonding struct to work on 2171 * 2172 * Can be called only after the mac address of the bond is set. 
*/
void bond_3ad_initialize(struct bonding *bond)
{
	/* aggregator ids are handed out by pre-increment in bond_3ad_bind_slave() */
	BOND_AD_INFO(bond).aggregator_identifier = 0;
	BOND_AD_INFO(bond).system.sys_priority =
		bond->params.ad_actor_sys_prio;
	/* an all-zero ad_actor_system means "use the bond device's MAC" */
	if (is_zero_ether_addr(bond->params.ad_actor_system))
		BOND_AD_INFO(bond).system.sys_mac_addr =
		    *((struct mac_addr *)bond->dev->dev_addr);
	else
		BOND_AD_INFO(bond).system.sys_mac_addr =
		    *((struct mac_addr *)bond->params.ad_actor_system);

	/* timer is counted in state-machine ticks, hence the scaling */
	bond_3ad_initiate_agg_selection(bond,
					AD_AGGREGATOR_SELECTION_TIMER *
					ad_ticks_per_sec);
}

/**
 * bond_3ad_bind_slave - initialize a slave's port
 * @slave: slave struct to work on
 *
 * Initializes the port and the aggregator embedded in the slave's 802.3ad
 * info.  Nothing is done when the port already points back at @slave,
 * i.e. the slave has been bound before.  This function returns no value.
 */
void bond_3ad_bind_slave(struct slave *slave)
{
	struct bonding *bond = bond_get_bond_by_slave(slave);
	struct port *port;
	struct aggregator *aggregator;

	/* check that the slave has not been initialized yet. */
	if (SLAVE_AD_INFO(slave)->port.slave != slave) {

		/* port initialization */
		port = &(SLAVE_AD_INFO(slave)->port);

		ad_initialize_port(port, &bond->params);

		port->slave = slave;
		port->actor_port_number = SLAVE_AD_INFO(slave)->id;
		/* key is determined according to the link speed, duplex and
		 * user key; the user key occupies the bits above the speed
		 * and duplex fields, hence the shift by 6
		 */
		port->actor_admin_port_key = bond->params.ad_user_port_key << 6;
		ad_update_actor_keys(port, false);
		/* actor system is the bond's system */
		__ad_actor_update_port(port);
		/* tx timer(to verify that no more than MAX_TX_IN_SECOND
		 * lacpdu's are sent in one second)
		 */
		port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;

		__disable_port(port);

		/* aggregator initialization */
		aggregator = &(SLAVE_AD_INFO(slave)->aggregator);

		ad_initialize_agg(aggregator);

		aggregator->aggregator_mac_address = *((struct mac_addr *)bond->dev->dev_addr);
		/* identifiers start at 1: the bond-wide counter is bumped first */
		aggregator->aggregator_identifier = ++BOND_AD_INFO(bond).aggregator_identifier;
		aggregator->slave = slave;
		aggregator->is_active = 0;
		aggregator->num_of_ports = 0;
	}
}

/**
 * bond_3ad_unbind_slave - deinitialize a slave's port
 * @slave: slave struct to work on
 *
 * Search for the aggregator that is related to this port, remove the
 * aggregator and assign another aggregator for other port related to it
 * (if any), and remove the port.
 *
 * The whole operation runs under bond->mode_lock (bottom halves disabled).
 * A final LACPDU with the synchronization, collecting, distributing and
 * aggregation bits cleared is sent before the port is detached.
 */
void bond_3ad_unbind_slave(struct slave *slave)
{
	struct port *port, *prev_port, *temp_port;
	struct aggregator *aggregator, *new_aggregator, *temp_aggregator;
	int select_new_active_agg = 0;
	struct bonding *bond = slave->bond;
	struct slave *slave_iter;
	struct list_head *iter;
	bool dummy_slave_update; /* Ignore this value as caller updates array */

	/* Sync against bond_3ad_state_machine_handler() */
	spin_lock_bh(&bond->mode_lock);
	aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
	port = &(SLAVE_AD_INFO(slave)->port);

	/* if slave is null, the whole port is not initialized */
	if (!port->slave) {
		slave_warn(bond->dev, slave->dev, "Trying to unbind an uninitialized port\n");
		goto out;
	}

	slave_dbg(bond->dev, slave->dev, "Unbinding Link Aggregation Group %d\n",
		  aggregator->aggregator_identifier);

	/* Tell the partner that this port is not suitable for aggregation */
	port->actor_oper_port_state &= ~LACP_STATE_SYNCHRONIZATION;
	port->actor_oper_port_state &= ~LACP_STATE_COLLECTING;
	port->actor_oper_port_state &= ~LACP_STATE_DISTRIBUTING;
	port->actor_oper_port_state &= ~LACP_STATE_AGGREGATION;
	__update_lacpdu_from_port(port);
	ad_lacpdu_send(port);

	/* check if this aggregator is occupied */
	if (aggregator->lag_ports) {
		/* check if there are other ports related to this aggregator
		 * except the port related to this slave (that ensures us that
		 * there is a reason to search for a new aggregator, and that
		 * we will find one)
		 */
		if ((aggregator->lag_ports != port) ||
		    (aggregator->lag_ports->next_port_in_aggregator)) {
			/* find new aggregator for the related port(s) */
			bond_for_each_slave(bond, slave_iter, iter) {
				new_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
				/* if the new aggregator is empty, or it is
				 * connected to our port only
				 */
				if (!new_aggregator->lag_ports ||
				    ((new_aggregator->lag_ports == port) &&
				     !new_aggregator->lag_ports->next_port_in_aggregator))
					break;
			}
			/* a NULL iterator means the loop ran to completion
			 * without finding a suitable aggregator
			 */
			if (!slave_iter)
				new_aggregator = NULL;

			/* if new aggregator found, copy the aggregator's
			 * parameters and connect the related lag_ports to the
			 * new aggregator
			 */
			if ((new_aggregator) && ((!new_aggregator->lag_ports) || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator))) {
				slave_dbg(bond->dev, slave->dev, "Some port(s) related to LAG %d - replacing with LAG %d\n",
					  aggregator->aggregator_identifier,
					  new_aggregator->aggregator_identifier);

				/* the target currently holds only our port and
				 * is active: a new active aggregator must be
				 * chosen after the move
				 */
				if ((new_aggregator->lag_ports == port) &&
				    new_aggregator->is_active) {
					slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
					select_new_active_agg = 1;
				}

				new_aggregator->is_individual = aggregator->is_individual;
				new_aggregator->actor_admin_aggregator_key = aggregator->actor_admin_aggregator_key;
				new_aggregator->actor_oper_aggregator_key = aggregator->actor_oper_aggregator_key;
				new_aggregator->partner_system = aggregator->partner_system;
				new_aggregator->partner_system_priority = aggregator->partner_system_priority;
				new_aggregator->partner_oper_aggregator_key = aggregator->partner_oper_aggregator_key;
				new_aggregator->receive_state = aggregator->receive_state;
				new_aggregator->transmit_state = aggregator->transmit_state;
				new_aggregator->lag_ports = aggregator->lag_ports;
				new_aggregator->is_active = aggregator->is_active;
				new_aggregator->num_of_ports = aggregator->num_of_ports;

				/* update the information that is written on
				 * the ports about the aggregator
				 */
				for (temp_port = aggregator->lag_ports; temp_port;
				     temp_port = temp_port->next_port_in_aggregator) {
					temp_port->aggregator = new_aggregator;
					temp_port->actor_port_aggregator_identifier = new_aggregator->aggregator_identifier;
				}

				/* the port list now belongs to new_aggregator */
				ad_clear_agg(aggregator);

				if (select_new_active_agg)
					ad_agg_selection_logic(__get_first_agg(port),
							       &dummy_slave_update);
			} else {
				slave_warn(bond->dev, slave->dev, "unbinding aggregator, and could not find a new aggregator for its ports\n");
			}
		} else {
			/* in case that the only port related to this
			 * aggregator is the one we want to remove
			 */
			/* remember the flag: ad_clear_agg() resets is_active */
			select_new_active_agg = aggregator->is_active;
			ad_clear_agg(aggregator);
			if (select_new_active_agg) {
				slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
				/* select new active aggregator */
				temp_aggregator = __get_first_agg(port);
				if (temp_aggregator)
					ad_agg_selection_logic(temp_aggregator,
							       &dummy_slave_update);
			}
		}
	}

	slave_dbg(bond->dev, slave->dev, "Unbinding port %d\n", port->actor_port_number);

	/* find the aggregator that this port is connected to */
	bond_for_each_slave(bond, slave_iter, iter) {
		temp_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
		prev_port = NULL;
		/* search the port in the aggregator's related ports */
		for (temp_port = temp_aggregator->lag_ports; temp_port;
		     prev_port = temp_port,
		     temp_port = temp_port->next_port_in_aggregator) {
			if (temp_port == port) {
				/* the aggregator found - detach the port from
				 * this aggregator
				 */
				if (prev_port)
					prev_port->next_port_in_aggregator = temp_port->next_port_in_aggregator;
				else
					temp_aggregator->lag_ports = temp_port->next_port_in_aggregator;
				temp_aggregator->num_of_ports--;
				if (__agg_active_ports(temp_aggregator) == 0) {
					/* read before a possible ad_clear_agg() */
					select_new_active_agg = temp_aggregator->is_active;
					if (temp_aggregator->num_of_ports == 0)
						ad_clear_agg(temp_aggregator);
					if (select_new_active_agg) {
						slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
						/* select new active aggregator */
						ad_agg_selection_logic(__get_first_agg(port),
								       &dummy_slave_update);
					}
				}
				break;
			}
		}
	}
	/* a NULL slave pointer marks the port as uninitialized */
	port->slave = NULL;

out:
	spin_unlock_bh(&bond->mode_lock);
}

/**
 * bond_3ad_update_ad_actor_settings - reflect change of actor settings to ports
 * @bond: bonding struct to work on
 *
 * If an ad_actor setting gets changed we need to update the individual port
 * settings so the bond device will use the new values when it gets upped.
 *
 * Must be called with RTNL held (asserted).  Every port is refreshed via
 * __ad_actor_update_port() and has its ntt flag set, under bond->mode_lock.
 */
void bond_3ad_update_ad_actor_settings(struct bonding *bond)
{
	struct list_head *iter;
	struct slave *slave;

	ASSERT_RTNL();

	BOND_AD_INFO(bond).system.sys_priority = bond->params.ad_actor_sys_prio;
	/* an all-zero ad_actor_system means "use the bond device's MAC" */
	if (is_zero_ether_addr(bond->params.ad_actor_system))
		BOND_AD_INFO(bond).system.sys_mac_addr =
		    *((struct mac_addr *)bond->dev->dev_addr);
	else
		BOND_AD_INFO(bond).system.sys_mac_addr =
		    *((struct mac_addr *)bond->params.ad_actor_system);

	spin_lock_bh(&bond->mode_lock);
	bond_for_each_slave(bond, slave, iter) {
		struct port *port = &(SLAVE_AD_INFO(slave))->port;

		__ad_actor_update_port(port);
		port->ntt = true;
	}
	spin_unlock_bh(&bond->mode_lock);
}

/**
 * bond_agg_timer_advance - advance agg_select_timer
 * @bond:	bonding structure
 *
 * Return true when agg_select_timer reaches 0.
*/
static bool bond_agg_timer_advance(struct bonding *bond)
{
	int val, nval;

	/* lock-free decrement: retry until the compare-and-exchange sees the
	 * value that was read, so a concurrent store is never overwritten
	 */
	while (1) {
		val = atomic_read(&BOND_AD_INFO(bond).agg_select_timer);
		/* timer already expired (or never armed): nothing to advance */
		if (!val)
			return false;
		nval = val - 1;
		if (atomic_cmpxchg(&BOND_AD_INFO(bond).agg_select_timer,
				   val, nval) == val)
			break;
	}
	/* true only on the tick that takes the timer from 1 to 0 */
	return nval == 0;
}

/**
 * bond_3ad_state_machine_handler - handle state machines timeout
 * @work: work context to fetch bonding struct to work on from
 *
 * The state machine handling concept in this module is to check every tick
 * which state machine should operate any function. The execution order is
 * round robin, so when we have an interaction between state machines, the
 * reply of one to each other might be delayed until next tick.
 *
 * This function also complete the initialization when the agg_select_timer
 * times out, and it selects an aggregator for the ports that are yet not
 * related to any aggregator, and selects the active aggregator for a bond.
 *
 * The work item re-queues itself on bond->wq after ad_delta_in_ticks on
 * every invocation, including the early-exit paths.
 */
void bond_3ad_state_machine_handler(struct work_struct *work)
{
	struct bonding *bond = container_of(work, struct bonding,
					    ad_work.work);
	struct aggregator *aggregator;
	struct list_head *iter;
	struct slave *slave;
	struct port *port;
	bool should_notify_rtnl = BOND_SLAVE_NOTIFY_LATER;
	bool update_slave_arr = false;

	/* Lock to protect data accessed by all (e.g., port->sm_vars) and
	 * against running with bond_3ad_unbind_slave. ad_rx_machine may run
	 * concurrently due to incoming LACPDU as well.
	 */
	spin_lock_bh(&bond->mode_lock);
	rcu_read_lock();

	/* check if there are any slaves */
	if (!bond_has_slaves(bond))
		goto re_arm;

	/* the selection timer just expired on this tick */
	if (bond_agg_timer_advance(bond)) {
		slave = bond_first_slave_rcu(bond);
		port = slave ? &(SLAVE_AD_INFO(slave)->port) : NULL;

		/* select the active aggregator for the bond */
		if (port) {
			if (!port->slave) {
				net_warn_ratelimited("%s: Warning: bond's first port is uninitialized\n",
						     bond->dev->name);
				goto re_arm;
			}

			aggregator = __get_first_agg(port);
			ad_agg_selection_logic(aggregator, &update_slave_arr);
		}
		bond_3ad_set_carrier(bond);
	}

	/* for each port run the state machines */
	bond_for_each_slave_rcu(bond, slave, iter) {
		port = &(SLAVE_AD_INFO(slave)->port);
		if (!port->slave) {
			net_warn_ratelimited("%s: Warning: Found an uninitialized port\n",
					    bond->dev->name);
			goto re_arm;
		}

		/* a NULL lacpdu makes this a timer-driven rx machine pass */
		ad_rx_machine(NULL, port);
		ad_periodic_machine(port);
		ad_port_selection_logic(port, &update_slave_arr);
		ad_mux_machine(port, &update_slave_arr);
		ad_tx_machine(port);
		ad_churn_machine(port);

		/* turn off the BEGIN bit, since we already handled it */
		if (port->sm_vars & AD_PORT_BEGIN)
			port->sm_vars &= ~AD_PORT_BEGIN;
	}

re_arm:
	/* one slave asking for notification is enough to try RTNL below */
	bond_for_each_slave_rcu(bond, slave, iter) {
		if (slave->should_notify) {
			should_notify_rtnl = BOND_SLAVE_NOTIFY_NOW;
			break;
		}
	}
	rcu_read_unlock();
	spin_unlock_bh(&bond->mode_lock);

	/* deferred to a work item; done only after mode_lock is dropped */
	if (update_slave_arr)
		bond_slave_arr_work_rearm(bond, 0);

	/* trylock: never block the worker on RTNL; if it is contended the
	 * notification is simply not sent on this tick
	 */
	if (should_notify_rtnl && rtnl_trylock()) {
		bond_slave_state_notify(bond);
		rtnl_unlock();
	}
	queue_delayed_work(bond->wq, &bond->ad_work, ad_delta_in_ticks);
}

/**
 * bond_3ad_rx_indication - handle a received frame
 * @lacpdu: received lacpdu
 * @slave: slave struct to work on
 *
 * It is assumed that frames that were sent on this NIC don't returned as new
 * received frames (loopback). Since only the payload is given to this
 * function, it check for loopback.
2561 */ 2562 static int bond_3ad_rx_indication(struct lacpdu *lacpdu, struct slave *slave) 2563 { 2564 struct bonding *bond = slave->bond; 2565 int ret = RX_HANDLER_ANOTHER; 2566 struct bond_marker *marker; 2567 struct port *port; 2568 atomic64_t *stat; 2569 2570 port = &(SLAVE_AD_INFO(slave)->port); 2571 if (!port->slave) { 2572 net_warn_ratelimited("%s: Warning: port of slave %s is uninitialized\n", 2573 slave->dev->name, slave->bond->dev->name); 2574 return ret; 2575 } 2576 2577 switch (lacpdu->subtype) { 2578 case AD_TYPE_LACPDU: 2579 ret = RX_HANDLER_CONSUMED; 2580 slave_dbg(slave->bond->dev, slave->dev, 2581 "Received LACPDU on port %d\n", 2582 port->actor_port_number); 2583 /* Protect against concurrent state machines */ 2584 spin_lock(&slave->bond->mode_lock); 2585 ad_rx_machine(lacpdu, port); 2586 spin_unlock(&slave->bond->mode_lock); 2587 break; 2588 case AD_TYPE_MARKER: 2589 ret = RX_HANDLER_CONSUMED; 2590 /* No need to convert fields to Little Endian since we 2591 * don't use the marker's fields. 
2592 */ 2593 marker = (struct bond_marker *)lacpdu; 2594 switch (marker->tlv_type) { 2595 case AD_MARKER_INFORMATION_SUBTYPE: 2596 slave_dbg(slave->bond->dev, slave->dev, "Received Marker Information on port %d\n", 2597 port->actor_port_number); 2598 ad_marker_info_received(marker, port); 2599 break; 2600 case AD_MARKER_RESPONSE_SUBTYPE: 2601 slave_dbg(slave->bond->dev, slave->dev, "Received Marker Response on port %d\n", 2602 port->actor_port_number); 2603 ad_marker_response_received(marker, port); 2604 break; 2605 default: 2606 slave_dbg(slave->bond->dev, slave->dev, "Received an unknown Marker subtype on port %d\n", 2607 port->actor_port_number); 2608 stat = &SLAVE_AD_INFO(slave)->stats.marker_unknown_rx; 2609 atomic64_inc(stat); 2610 stat = &BOND_AD_INFO(bond).stats.marker_unknown_rx; 2611 atomic64_inc(stat); 2612 } 2613 break; 2614 default: 2615 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_unknown_rx); 2616 atomic64_inc(&BOND_AD_INFO(bond).stats.lacpdu_unknown_rx); 2617 } 2618 2619 return ret; 2620 } 2621 2622 /** 2623 * ad_update_actor_keys - Update the oper / admin keys for a port based on 2624 * its current speed and duplex settings. 2625 * 2626 * @port: the port we'are looking at 2627 * @reset: Boolean to just reset the speed and the duplex part of the key 2628 * 2629 * The logic to change the oper / admin keys is: 2630 * (a) A full duplex port can participate in LACP with partner. 2631 * (b) When the speed is changed, LACP need to be reinitiated. 
2632 */ 2633 static void ad_update_actor_keys(struct port *port, bool reset) 2634 { 2635 u8 duplex = 0; 2636 u16 ospeed = 0, speed = 0; 2637 u16 old_oper_key = port->actor_oper_port_key; 2638 2639 port->actor_admin_port_key &= ~(AD_SPEED_KEY_MASKS|AD_DUPLEX_KEY_MASKS); 2640 if (!reset) { 2641 speed = __get_link_speed(port); 2642 ospeed = (old_oper_key & AD_SPEED_KEY_MASKS) >> 1; 2643 duplex = __get_duplex(port); 2644 port->actor_admin_port_key |= (speed << 1) | duplex; 2645 } 2646 port->actor_oper_port_key = port->actor_admin_port_key; 2647 2648 if (old_oper_key != port->actor_oper_port_key) { 2649 /* Only 'duplex' port participates in LACP */ 2650 if (duplex) 2651 port->sm_vars |= AD_PORT_LACP_ENABLED; 2652 else 2653 port->sm_vars &= ~AD_PORT_LACP_ENABLED; 2654 2655 if (!reset) { 2656 if (!speed) { 2657 slave_err(port->slave->bond->dev, 2658 port->slave->dev, 2659 "speed changed to 0 on port %d\n", 2660 port->actor_port_number); 2661 } else if (duplex && ospeed != speed) { 2662 /* Speed change restarts LACP state-machine */ 2663 port->sm_vars |= AD_PORT_BEGIN; 2664 } 2665 } 2666 } 2667 } 2668 2669 /** 2670 * bond_3ad_adapter_speed_duplex_changed - handle a slave's speed / duplex 2671 * change indication 2672 * 2673 * @slave: slave struct to work on 2674 * 2675 * Handle reselection of aggregator (if needed) for this port. 
2676 */ 2677 void bond_3ad_adapter_speed_duplex_changed(struct slave *slave) 2678 { 2679 struct port *port; 2680 2681 port = &(SLAVE_AD_INFO(slave)->port); 2682 2683 /* if slave is null, the whole port is not initialized */ 2684 if (!port->slave) { 2685 slave_warn(slave->bond->dev, slave->dev, 2686 "speed/duplex changed for uninitialized port\n"); 2687 return; 2688 } 2689 2690 spin_lock_bh(&slave->bond->mode_lock); 2691 ad_update_actor_keys(port, false); 2692 spin_unlock_bh(&slave->bond->mode_lock); 2693 slave_dbg(slave->bond->dev, slave->dev, "Port %d changed speed/duplex\n", 2694 port->actor_port_number); 2695 } 2696 2697 /** 2698 * bond_3ad_handle_link_change - handle a slave's link status change indication 2699 * @slave: slave struct to work on 2700 * @link: whether the link is now up or down 2701 * 2702 * Handle reselection of aggregator (if needed) for this port. 2703 */ 2704 void bond_3ad_handle_link_change(struct slave *slave, char link) 2705 { 2706 struct aggregator *agg; 2707 struct port *port; 2708 bool dummy; 2709 2710 port = &(SLAVE_AD_INFO(slave)->port); 2711 2712 /* if slave is null, the whole port is not initialized */ 2713 if (!port->slave) { 2714 slave_warn(slave->bond->dev, slave->dev, "link status changed for uninitialized port\n"); 2715 return; 2716 } 2717 2718 spin_lock_bh(&slave->bond->mode_lock); 2719 /* on link down we are zeroing duplex and speed since 2720 * some of the adaptors(ce1000.lan) report full duplex/speed 2721 * instead of N/A(duplex) / 0(speed). 2722 * 2723 * on link up we are forcing recheck on the duplex and speed since 2724 * some of he adaptors(ce1000.lan) report. 
2725 */ 2726 if (link == BOND_LINK_UP) { 2727 port->is_enabled = true; 2728 ad_update_actor_keys(port, false); 2729 } else { 2730 /* link has failed */ 2731 port->is_enabled = false; 2732 ad_update_actor_keys(port, true); 2733 } 2734 agg = __get_first_agg(port); 2735 ad_agg_selection_logic(agg, &dummy); 2736 2737 spin_unlock_bh(&slave->bond->mode_lock); 2738 2739 slave_dbg(slave->bond->dev, slave->dev, "Port %d changed link status to %s\n", 2740 port->actor_port_number, 2741 link == BOND_LINK_UP ? "UP" : "DOWN"); 2742 2743 /* RTNL is held and mode_lock is released so it's safe 2744 * to update slave_array here. 2745 */ 2746 bond_update_slave_arr(slave->bond, NULL); 2747 } 2748 2749 /** 2750 * bond_3ad_set_carrier - set link state for bonding master 2751 * @bond: bonding structure 2752 * 2753 * if we have an active aggregator, we're up, if not, we're down. 2754 * Presumes that we cannot have an active aggregator if there are 2755 * no slaves with link up. 2756 * 2757 * This behavior complies with IEEE 802.3 section 43.3.9. 2758 * 2759 * Called by bond_set_carrier(). Return zero if carrier state does not 2760 * change, nonzero if it does. 2761 */ 2762 int bond_3ad_set_carrier(struct bonding *bond) 2763 { 2764 struct aggregator *active; 2765 struct slave *first_slave; 2766 int ret = 1; 2767 2768 rcu_read_lock(); 2769 first_slave = bond_first_slave_rcu(bond); 2770 if (!first_slave) { 2771 ret = 0; 2772 goto out; 2773 } 2774 active = __get_active_agg(&(SLAVE_AD_INFO(first_slave)->aggregator)); 2775 if (active) { 2776 /* are enough slaves available to consider link up? 
*/ 2777 if (__agg_active_ports(active) < bond->params.min_links) { 2778 if (netif_carrier_ok(bond->dev)) { 2779 netif_carrier_off(bond->dev); 2780 goto out; 2781 } 2782 } else if (!netif_carrier_ok(bond->dev)) { 2783 netif_carrier_on(bond->dev); 2784 goto out; 2785 } 2786 } else if (netif_carrier_ok(bond->dev)) { 2787 netif_carrier_off(bond->dev); 2788 } 2789 out: 2790 rcu_read_unlock(); 2791 return ret; 2792 } 2793 2794 /** 2795 * __bond_3ad_get_active_agg_info - get information of the active aggregator 2796 * @bond: bonding struct to work on 2797 * @ad_info: ad_info struct to fill with the bond's info 2798 * 2799 * Returns: 0 on success 2800 * < 0 on error 2801 */ 2802 int __bond_3ad_get_active_agg_info(struct bonding *bond, 2803 struct ad_info *ad_info) 2804 { 2805 struct aggregator *aggregator = NULL; 2806 struct list_head *iter; 2807 struct slave *slave; 2808 struct port *port; 2809 2810 bond_for_each_slave_rcu(bond, slave, iter) { 2811 port = &(SLAVE_AD_INFO(slave)->port); 2812 if (port->aggregator && port->aggregator->is_active) { 2813 aggregator = port->aggregator; 2814 break; 2815 } 2816 } 2817 2818 if (!aggregator) 2819 return -1; 2820 2821 ad_info->aggregator_id = aggregator->aggregator_identifier; 2822 ad_info->ports = __agg_active_ports(aggregator); 2823 ad_info->actor_key = aggregator->actor_oper_aggregator_key; 2824 ad_info->partner_key = aggregator->partner_oper_aggregator_key; 2825 ether_addr_copy(ad_info->partner_system, 2826 aggregator->partner_system.mac_addr_value); 2827 return 0; 2828 } 2829 2830 int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info) 2831 { 2832 int ret; 2833 2834 rcu_read_lock(); 2835 ret = __bond_3ad_get_active_agg_info(bond, ad_info); 2836 rcu_read_unlock(); 2837 2838 return ret; 2839 } 2840 2841 int bond_3ad_lacpdu_recv(const struct sk_buff *skb, struct bonding *bond, 2842 struct slave *slave) 2843 { 2844 struct lacpdu *lacpdu, _lacpdu; 2845 2846 if (skb->protocol != PKT_TYPE_LACPDU) 2847 return 
RX_HANDLER_ANOTHER; 2848 2849 if (!MAC_ADDRESS_EQUAL(eth_hdr(skb)->h_dest, lacpdu_mcast_addr)) 2850 return RX_HANDLER_ANOTHER; 2851 2852 lacpdu = skb_header_pointer(skb, 0, sizeof(_lacpdu), &_lacpdu); 2853 if (!lacpdu) { 2854 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_illegal_rx); 2855 atomic64_inc(&BOND_AD_INFO(bond).stats.lacpdu_illegal_rx); 2856 return RX_HANDLER_ANOTHER; 2857 } 2858 2859 return bond_3ad_rx_indication(lacpdu, slave); 2860 } 2861 2862 /** 2863 * bond_3ad_update_lacp_rate - change the lacp rate 2864 * @bond: bonding struct 2865 * 2866 * When modify lacp_rate parameter via sysfs, 2867 * update actor_oper_port_state of each port. 2868 * 2869 * Hold bond->mode_lock, 2870 * so we can modify port->actor_oper_port_state, 2871 * no matter bond is up or down. 2872 */ 2873 void bond_3ad_update_lacp_rate(struct bonding *bond) 2874 { 2875 struct port *port = NULL; 2876 struct list_head *iter; 2877 struct slave *slave; 2878 int lacp_fast; 2879 2880 lacp_fast = bond->params.lacp_fast; 2881 spin_lock_bh(&bond->mode_lock); 2882 bond_for_each_slave(bond, slave, iter) { 2883 port = &(SLAVE_AD_INFO(slave)->port); 2884 if (lacp_fast) 2885 port->actor_oper_port_state |= LACP_STATE_LACP_TIMEOUT; 2886 else 2887 port->actor_oper_port_state &= ~LACP_STATE_LACP_TIMEOUT; 2888 } 2889 spin_unlock_bh(&bond->mode_lock); 2890 } 2891 2892 /** 2893 * bond_3ad_update_lacp_active - change the lacp active 2894 * @bond: bonding struct 2895 * 2896 * Update actor_oper_port_state when lacp_active is modified. 
2897 */ 2898 void bond_3ad_update_lacp_active(struct bonding *bond) 2899 { 2900 struct port *port = NULL; 2901 struct list_head *iter; 2902 struct slave *slave; 2903 int lacp_active; 2904 2905 lacp_active = bond->params.lacp_active; 2906 spin_lock_bh(&bond->mode_lock); 2907 bond_for_each_slave(bond, slave, iter) { 2908 port = &(SLAVE_AD_INFO(slave)->port); 2909 if (lacp_active) 2910 port->actor_oper_port_state |= LACP_STATE_LACP_ACTIVITY; 2911 else 2912 port->actor_oper_port_state &= ~LACP_STATE_LACP_ACTIVITY; 2913 } 2914 spin_unlock_bh(&bond->mode_lock); 2915 } 2916 2917 size_t bond_3ad_stats_size(void) 2918 { 2919 return nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_RX */ 2920 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_TX */ 2921 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_UNKNOWN_RX */ 2922 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_ILLEGAL_RX */ 2923 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RX */ 2924 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_TX */ 2925 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RESP_RX */ 2926 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RESP_TX */ 2927 nla_total_size_64bit(sizeof(u64)); /* BOND_3AD_STAT_MARKER_UNKNOWN_RX */ 2928 } 2929 2930 int bond_3ad_stats_fill(struct sk_buff *skb, struct bond_3ad_stats *stats) 2931 { 2932 u64 val; 2933 2934 val = atomic64_read(&stats->lacpdu_rx); 2935 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_RX, val, 2936 BOND_3AD_STAT_PAD)) 2937 return -EMSGSIZE; 2938 val = atomic64_read(&stats->lacpdu_tx); 2939 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_TX, val, 2940 BOND_3AD_STAT_PAD)) 2941 return -EMSGSIZE; 2942 val = atomic64_read(&stats->lacpdu_unknown_rx); 2943 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_UNKNOWN_RX, val, 2944 BOND_3AD_STAT_PAD)) 2945 return -EMSGSIZE; 2946 val = atomic64_read(&stats->lacpdu_illegal_rx); 2947 if (nla_put_u64_64bit(skb, 
BOND_3AD_STAT_LACPDU_ILLEGAL_RX, val, 2948 BOND_3AD_STAT_PAD)) 2949 return -EMSGSIZE; 2950 2951 val = atomic64_read(&stats->marker_rx); 2952 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RX, val, 2953 BOND_3AD_STAT_PAD)) 2954 return -EMSGSIZE; 2955 val = atomic64_read(&stats->marker_tx); 2956 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_TX, val, 2957 BOND_3AD_STAT_PAD)) 2958 return -EMSGSIZE; 2959 val = atomic64_read(&stats->marker_resp_rx); 2960 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RESP_RX, val, 2961 BOND_3AD_STAT_PAD)) 2962 return -EMSGSIZE; 2963 val = atomic64_read(&stats->marker_resp_tx); 2964 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RESP_TX, val, 2965 BOND_3AD_STAT_PAD)) 2966 return -EMSGSIZE; 2967 val = atomic64_read(&stats->marker_unknown_rx); 2968 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_UNKNOWN_RX, val, 2969 BOND_3AD_STAT_PAD)) 2970 return -EMSGSIZE; 2971 2972 return 0; 2973 } 2974