2 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms of the GNU General Public License as published by the Free
6 * Software Foundation; either version 2 of the License, or (at your option)
9 * This program is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
14 * You should have received a copy of the GNU General Public License along with
15 * this program; if not, write to the Free Software Foundation, Inc., 59
16 * Temple Place - Suite 330, Boston, MA 02111-1307, USA.
18 * The full GNU General Public License is included in this distribution in the
19 * file called LICENSE.
23 #include <linux/skbuff.h>
24 #include <linux/if_ether.h>
25 #include <linux/netdevice.h>
26 #include <linux/spinlock.h>
27 #include <linux/ethtool.h>
28 #include <linux/etherdevice.h>
29 #include <linux/if_bonding.h>
30 #include <linux/pkt_sched.h>
31 #include <net/net_namespace.h>
32 #include <net/bonding.h>
33 #include <net/bond_3ad.h>
/* General definitions */
#define AD_SHORT_TIMEOUT           1
#define AD_LONG_TIMEOUT            0
#define AD_STANDBY                 0x2
#define AD_MAX_TX_IN_SECOND        3
#define AD_COLLECTOR_MAX_DELAY     0
/* Timer definitions (43.4.4 in the 802.3ad standard), in seconds.
 * The two timeout values are defined as three times the matching periodic
 * transmission interval.
 */
#define AD_FAST_PERIODIC_TIME      1
#define AD_SLOW_PERIODIC_TIME      30
#define AD_SHORT_TIMEOUT_TIME      (3 * AD_FAST_PERIODIC_TIME)
#define AD_LONG_TIMEOUT_TIME       (3 * AD_SLOW_PERIODIC_TIME)
#define AD_CHURN_DETECTION_TIME    60
#define AD_AGGREGATE_WAIT_TIME     2
/* Port state definitions (43.4.2.2 in the 802.3ad standard).
 * One bit per flag; together they fill a single octet.
 */
#define AD_STATE_LACP_ACTIVITY   0x1
#define AD_STATE_LACP_TIMEOUT    0x2
#define AD_STATE_AGGREGATION     0x4
#define AD_STATE_SYNCHRONIZATION 0x8
#define AD_STATE_COLLECTING      0x10
#define AD_STATE_DISTRIBUTING    0x20
#define AD_STATE_DEFAULTED       0x40
#define AD_STATE_EXPIRED         0x80
/* Port Variables definitions used by the State Machines (43.4.7 in the
 * 802.3ad standard)
 */
#define AD_PORT_BEGIN           0x1
#define AD_PORT_LACP_ENABLED    0x2
#define AD_PORT_ACTOR_CHURN     0x4
#define AD_PORT_PARTNER_CHURN   0x8
#define AD_PORT_READY           0x10
#define AD_PORT_READY_N         0x20
#define AD_PORT_MATCHED         0x40
#define AD_PORT_STANDBY         0x80
#define AD_PORT_SELECTED        0x100
#define AD_PORT_MOVED           0x200
/* both churn flags at once */
#define AD_PORT_CHURNED         (AD_PORT_ACTOR_CHURN | AD_PORT_PARTNER_CHURN)
/* Port Key definitions
 * key is determined according to the link speed, duplex and
 * user key (which is not yet supported)
 *           --------------------------------------------------------------
 * Port key  | User key (10 bits)           | Speed (5 bits)      | Duplex|
 *           --------------------------------------------------------------
 *           |15                           6|5                   1|0
 */
#define AD_DUPLEX_KEY_MASKS    0x1
#define AD_SPEED_KEY_MASKS     0x3E
#define AD_USER_KEY_MASKS      0xFFC0
/* Link speed codes as returned by __get_link_speed(); 0 (not listed here)
 * is used for "link down or unknown speed".
 */
enum ad_link_speed_type {
	AD_LINK_SPEED_1MBPS = 1,
	AD_LINK_SPEED_10MBPS,
	AD_LINK_SPEED_100MBPS,
	AD_LINK_SPEED_1000MBPS,
	AD_LINK_SPEED_2500MBPS,
	AD_LINK_SPEED_10000MBPS,
	AD_LINK_SPEED_20000MBPS,
	AD_LINK_SPEED_40000MBPS,
	AD_LINK_SPEED_56000MBPS
};
/* compare MAC addresses; arguments are parenthesized so that any pointer
 * expression can be passed safely
 */
#define MAC_ADDRESS_EQUAL(A, B)	\
	ether_addr_equal_64bits((const u8 *)(A), (const u8 *)(B))
103 static struct mac_addr null_mac_addr = { { 0, 0, 0, 0, 0, 0 } };
104 static u16 ad_ticks_per_sec;
105 static const int ad_delta_in_ticks = (AD_TIMER_INTERVAL * HZ) / 1000;
107 static const u8 lacpdu_mcast_addr[ETH_ALEN] = MULTICAST_LACPDU_ADDR;
109 /* ================= main 802.3ad protocol functions ================== */
110 static int ad_lacpdu_send(struct port *port);
111 static int ad_marker_send(struct port *port, struct bond_marker *marker);
112 static void ad_mux_machine(struct port *port, bool *update_slave_arr);
113 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port);
114 static void ad_tx_machine(struct port *port);
115 static void ad_periodic_machine(struct port *port);
116 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr);
117 static void ad_agg_selection_logic(struct aggregator *aggregator,
118 bool *update_slave_arr);
119 static void ad_clear_agg(struct aggregator *aggregator);
120 static void ad_initialize_agg(struct aggregator *aggregator);
121 static void ad_initialize_port(struct port *port, int lacp_fast);
122 static void ad_enable_collecting_distributing(struct port *port,
123 bool *update_slave_arr);
124 static void ad_disable_collecting_distributing(struct port *port,
125 bool *update_slave_arr);
126 static void ad_marker_info_received(struct bond_marker *marker_info,
128 static void ad_marker_response_received(struct bond_marker *marker,
132 /* ================= api to bonding and kernel code ================== */
135 * __get_bond_by_port - get the port's bonding struct
136 * @port: the port we're looking at
138 * Return @port's bonding struct, or %NULL if it can't be found.
140 static inline struct bonding *__get_bond_by_port(struct port *port)
142 if (port->slave == NULL)
145 return bond_get_bond_by_slave(port->slave);
149 * __get_first_agg - get the first aggregator in the bond
150 * @bond: the bond we're looking at
152 * Return the aggregator of the first slave in @bond, or %NULL if it can't be
154 * The caller must hold RCU or RTNL lock.
156 static inline struct aggregator *__get_first_agg(struct port *port)
158 struct bonding *bond = __get_bond_by_port(port);
159 struct slave *first_slave;
160 struct aggregator *agg;
162 /* If there's no bond for this port, or bond has no slaves */
167 first_slave = bond_first_slave_rcu(bond);
168 agg = first_slave ? &(SLAVE_AD_INFO(first_slave)->aggregator) : NULL;
175 * __agg_has_partner - see if we have a partner
176 * @agg: the agregator we're looking at
178 * Return nonzero if aggregator has a partner (denoted by a non-zero ether
179 * address for the partner). Return 0 if not.
181 static inline int __agg_has_partner(struct aggregator *agg)
183 return !is_zero_ether_addr(agg->partner_system.mac_addr_value);
187 * __disable_port - disable the port's slave
188 * @port: the port we're looking at
190 static inline void __disable_port(struct port *port)
192 bond_set_slave_inactive_flags(port->slave, BOND_SLAVE_NOTIFY_LATER);
196 * __enable_port - enable the port's slave, if it's up
197 * @port: the port we're looking at
199 static inline void __enable_port(struct port *port)
201 struct slave *slave = port->slave;
203 if ((slave->link == BOND_LINK_UP) && bond_slave_is_up(slave))
204 bond_set_slave_active_flags(slave, BOND_SLAVE_NOTIFY_LATER);
208 * __port_is_enabled - check if the port's slave is in active state
209 * @port: the port we're looking at
211 static inline int __port_is_enabled(struct port *port)
213 return bond_is_active_slave(port->slave);
217 * __get_agg_selection_mode - get the aggregator selection mode
218 * @port: the port we're looking at
220 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT.
222 static inline u32 __get_agg_selection_mode(struct port *port)
224 struct bonding *bond = __get_bond_by_port(port);
227 return BOND_AD_STABLE;
229 return bond->params.ad_select;
233 * __check_agg_selection_timer - check if the selection timer has expired
234 * @port: the port we're looking at
236 static inline int __check_agg_selection_timer(struct port *port)
238 struct bonding *bond = __get_bond_by_port(port);
243 return BOND_AD_INFO(bond).agg_select_timer ? 1 : 0;
247 * __get_link_speed - get a port's speed
248 * @port: the port we're looking at
250 * Return @port's speed in 802.3ad enum format. i.e. one of:
252 * %AD_LINK_SPEED_10MBPS,
253 * %AD_LINK_SPEED_100MBPS,
254 * %AD_LINK_SPEED_1000MBPS,
255 * %AD_LINK_SPEED_2500MBPS,
256 * %AD_LINK_SPEED_10000MBPS
257 * %AD_LINK_SPEED_20000MBPS
258 * %AD_LINK_SPEED_40000MBPS
259 * %AD_LINK_SPEED_56000MBPS
261 static u16 __get_link_speed(struct port *port)
263 struct slave *slave = port->slave;
266 /* this if covers only a special case: when the configuration starts
267 * with link down, it sets the speed to 0.
268 * This is done in spite of the fact that the e100 driver reports 0
269 * to be compatible with MVT in the future.
271 if (slave->link != BOND_LINK_UP)
274 switch (slave->speed) {
276 speed = AD_LINK_SPEED_10MBPS;
280 speed = AD_LINK_SPEED_100MBPS;
284 speed = AD_LINK_SPEED_1000MBPS;
288 speed = AD_LINK_SPEED_2500MBPS;
292 speed = AD_LINK_SPEED_10000MBPS;
296 speed = AD_LINK_SPEED_20000MBPS;
300 speed = AD_LINK_SPEED_40000MBPS;
304 speed = AD_LINK_SPEED_56000MBPS;
308 /* unknown speed value from ethtool. shouldn't happen */
314 netdev_dbg(slave->bond->dev, "Port %d Received link speed %d update from adapter\n",
315 port->actor_port_number, speed);
320 * __get_duplex - get a port's duplex
321 * @port: the port we're looking at
323 * Return @port's duplex in 802.3ad bitmask format. i.e.:
324 * 0x01 if in full duplex
327 static u8 __get_duplex(struct port *port)
329 struct slave *slave = port->slave;
332 /* handling a special case: when the configuration starts with
333 * link down, it sets the duplex to 0.
335 if (slave->link != BOND_LINK_UP) {
338 switch (slave->duplex) {
341 netdev_dbg(slave->bond->dev, "Port %d Received status full duplex update from adapter\n",
342 port->actor_port_number);
347 netdev_dbg(slave->bond->dev, "Port %d Received status NOT full duplex update from adapter\n",
348 port->actor_port_number);
358 * __ad_timer_to_ticks - convert a given timer type to AD module ticks
359 * @timer_type: which timer to operate
360 * @par: timer parameter. see below
362 * If @timer_type is %current_while_timer, @par indicates long/short timer.
363 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME,
364 * %SLOW_PERIODIC_TIME.
366 static u16 __ad_timer_to_ticks(u16 timer_type, u16 par)
368 u16 retval = 0; /* to silence the compiler */
370 switch (timer_type) {
371 case AD_CURRENT_WHILE_TIMER: /* for rx machine usage */
373 retval = (AD_SHORT_TIMEOUT_TIME*ad_ticks_per_sec);
375 retval = (AD_LONG_TIMEOUT_TIME*ad_ticks_per_sec);
377 case AD_ACTOR_CHURN_TIMER: /* for local churn machine */
378 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
380 case AD_PERIODIC_TIMER: /* for periodic machine */
381 retval = (par*ad_ticks_per_sec); /* long timeout */
383 case AD_PARTNER_CHURN_TIMER: /* for remote churn machine */
384 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
386 case AD_WAIT_WHILE_TIMER: /* for selection machine */
387 retval = (AD_AGGREGATE_WAIT_TIME*ad_ticks_per_sec);
395 /* ================= ad_rx_machine helper functions ================== */
398 * __choose_matched - update a port's matched variable from a received lacpdu
399 * @lacpdu: the lacpdu we've received
400 * @port: the port we're looking at
402 * Update the value of the matched variable, using parameter values from a
403 * newly received lacpdu. Parameter values for the partner carried in the
404 * received PDU are compared with the corresponding operational parameter
405 * values for the actor. Matched is set to TRUE if all of these parameters
406 * match and the PDU parameter partner_state.aggregation has the same value as
407 * actor_oper_port_state.aggregation and lacp will actively maintain the link
408 * in the aggregation. Matched is also set to TRUE if the value of
409 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates
410 * an individual link and lacp will actively maintain the link. Otherwise,
411 * matched is set to FALSE. LACP is considered to be actively maintaining the
412 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both
413 * the actor's actor_oper_port_state.lacp_activity and the PDU's
414 * partner_state.lacp_activity variables are TRUE.
416 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is
417 * used here to implement the language from 802.3ad 43.4.9 that requires
418 * recordPDU to "match" the LACPDU parameters to the stored values.
420 static void __choose_matched(struct lacpdu *lacpdu, struct port *port)
422 /* check if all parameters are alike
423 * or this is individual link(aggregation == FALSE)
424 * then update the state machine Matched variable.
426 if (((ntohs(lacpdu->partner_port) == port->actor_port_number) &&
427 (ntohs(lacpdu->partner_port_priority) == port->actor_port_priority) &&
428 MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) &&
429 (ntohs(lacpdu->partner_system_priority) == port->actor_system_priority) &&
430 (ntohs(lacpdu->partner_key) == port->actor_oper_port_key) &&
431 ((lacpdu->partner_state & AD_STATE_AGGREGATION) == (port->actor_oper_port_state & AD_STATE_AGGREGATION))) ||
432 ((lacpdu->actor_state & AD_STATE_AGGREGATION) == 0)
434 port->sm_vars |= AD_PORT_MATCHED;
436 port->sm_vars &= ~AD_PORT_MATCHED;
441 * __record_pdu - record parameters from a received lacpdu
442 * @lacpdu: the lacpdu we've received
443 * @port: the port we're looking at
445 * Record the parameter values for the Actor carried in a received lacpdu as
446 * the current partner operational parameter values and sets
447 * actor_oper_port_state.defaulted to FALSE.
449 static void __record_pdu(struct lacpdu *lacpdu, struct port *port)
451 if (lacpdu && port) {
452 struct port_params *partner = &port->partner_oper;
454 __choose_matched(lacpdu, port);
455 /* record the new parameter values for the partner
458 partner->port_number = ntohs(lacpdu->actor_port);
459 partner->port_priority = ntohs(lacpdu->actor_port_priority);
460 partner->system = lacpdu->actor_system;
461 partner->system_priority = ntohs(lacpdu->actor_system_priority);
462 partner->key = ntohs(lacpdu->actor_key);
463 partner->port_state = lacpdu->actor_state;
465 /* set actor_oper_port_state.defaulted to FALSE */
466 port->actor_oper_port_state &= ~AD_STATE_DEFAULTED;
468 /* set the partner sync. to on if the partner is sync,
469 * and the port is matched
471 if ((port->sm_vars & AD_PORT_MATCHED) &&
472 (lacpdu->actor_state & AD_STATE_SYNCHRONIZATION)) {
473 partner->port_state |= AD_STATE_SYNCHRONIZATION;
474 pr_debug("%s partner sync=1\n", port->slave->dev->name);
476 partner->port_state &= ~AD_STATE_SYNCHRONIZATION;
477 pr_debug("%s partner sync=0\n", port->slave->dev->name);
483 * __record_default - record default parameters
484 * @port: the port we're looking at
486 * This function records the default parameter values for the partner carried
487 * in the Partner Admin parameters as the current partner operational parameter
488 * values and sets actor_oper_port_state.defaulted to TRUE.
490 static void __record_default(struct port *port)
493 /* record the partner admin parameters */
494 memcpy(&port->partner_oper, &port->partner_admin,
495 sizeof(struct port_params));
497 /* set actor_oper_port_state.defaulted to true */
498 port->actor_oper_port_state |= AD_STATE_DEFAULTED;
503 * __update_selected - update a port's Selected variable from a received lacpdu
504 * @lacpdu: the lacpdu we've received
505 * @port: the port we're looking at
507 * Update the value of the selected variable, using parameter values from a
508 * newly received lacpdu. The parameter values for the Actor carried in the
509 * received PDU are compared with the corresponding operational parameter
510 * values for the ports partner. If one or more of the comparisons shows that
511 * the value(s) received in the PDU differ from the current operational values,
512 * then selected is set to FALSE and actor_oper_port_state.synchronization is
513 * set to out_of_sync. Otherwise, selected remains unchanged.
515 static void __update_selected(struct lacpdu *lacpdu, struct port *port)
517 if (lacpdu && port) {
518 const struct port_params *partner = &port->partner_oper;
520 /* check if any parameter is different then
521 * update the state machine selected variable.
523 if (ntohs(lacpdu->actor_port) != partner->port_number ||
524 ntohs(lacpdu->actor_port_priority) != partner->port_priority ||
525 !MAC_ADDRESS_EQUAL(&lacpdu->actor_system, &partner->system) ||
526 ntohs(lacpdu->actor_system_priority) != partner->system_priority ||
527 ntohs(lacpdu->actor_key) != partner->key ||
528 (lacpdu->actor_state & AD_STATE_AGGREGATION) != (partner->port_state & AD_STATE_AGGREGATION)) {
529 port->sm_vars &= ~AD_PORT_SELECTED;
535 * __update_default_selected - update a port's Selected variable from Partner
536 * @port: the port we're looking at
538 * This function updates the value of the selected variable, using the partner
539 * administrative parameter values. The administrative values are compared with
540 * the corresponding operational parameter values for the partner. If one or
541 * more of the comparisons shows that the administrative value(s) differ from
542 * the current operational values, then Selected is set to FALSE and
543 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise,
544 * Selected remains unchanged.
546 static void __update_default_selected(struct port *port)
549 const struct port_params *admin = &port->partner_admin;
550 const struct port_params *oper = &port->partner_oper;
552 /* check if any parameter is different then
553 * update the state machine selected variable.
555 if (admin->port_number != oper->port_number ||
556 admin->port_priority != oper->port_priority ||
557 !MAC_ADDRESS_EQUAL(&admin->system, &oper->system) ||
558 admin->system_priority != oper->system_priority ||
559 admin->key != oper->key ||
560 (admin->port_state & AD_STATE_AGGREGATION)
561 != (oper->port_state & AD_STATE_AGGREGATION)) {
562 port->sm_vars &= ~AD_PORT_SELECTED;
568 * __update_ntt - update a port's ntt variable from a received lacpdu
569 * @lacpdu: the lacpdu we've received
570 * @port: the port we're looking at
572 * Updates the value of the ntt variable, using parameter values from a newly
573 * received lacpdu. The parameter values for the partner carried in the
574 * received PDU are compared with the corresponding operational parameter
575 * values for the Actor. If one or more of the comparisons shows that the
576 * value(s) received in the PDU differ from the current operational values,
577 * then ntt is set to TRUE. Otherwise, ntt remains unchanged.
579 static void __update_ntt(struct lacpdu *lacpdu, struct port *port)
581 /* validate lacpdu and port */
582 if (lacpdu && port) {
583 /* check if any parameter is different then
584 * update the port->ntt.
586 if ((ntohs(lacpdu->partner_port) != port->actor_port_number) ||
587 (ntohs(lacpdu->partner_port_priority) != port->actor_port_priority) ||
588 !MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) ||
589 (ntohs(lacpdu->partner_system_priority) != port->actor_system_priority) ||
590 (ntohs(lacpdu->partner_key) != port->actor_oper_port_key) ||
591 ((lacpdu->partner_state & AD_STATE_LACP_ACTIVITY) != (port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY)) ||
592 ((lacpdu->partner_state & AD_STATE_LACP_TIMEOUT) != (port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT)) ||
593 ((lacpdu->partner_state & AD_STATE_SYNCHRONIZATION) != (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) ||
594 ((lacpdu->partner_state & AD_STATE_AGGREGATION) != (port->actor_oper_port_state & AD_STATE_AGGREGATION))
602 * __agg_ports_are_ready - check if all ports in an aggregator are ready
603 * @aggregator: the aggregator we're looking at
606 static int __agg_ports_are_ready(struct aggregator *aggregator)
612 /* scan all ports in this aggregator to verfy if they are
615 for (port = aggregator->lag_ports;
617 port = port->next_port_in_aggregator) {
618 if (!(port->sm_vars & AD_PORT_READY_N)) {
629 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator
630 * @aggregator: the aggregator we're looking at
631 * @val: Should the ports' ready bit be set on or off
634 static void __set_agg_ports_ready(struct aggregator *aggregator, int val)
638 for (port = aggregator->lag_ports; port;
639 port = port->next_port_in_aggregator) {
641 port->sm_vars |= AD_PORT_READY;
643 port->sm_vars &= ~AD_PORT_READY;
648 * __get_agg_bandwidth - get the total bandwidth of an aggregator
649 * @aggregator: the aggregator we're looking at
652 static u32 __get_agg_bandwidth(struct aggregator *aggregator)
656 if (aggregator->num_of_ports) {
657 switch (__get_link_speed(aggregator->lag_ports)) {
658 case AD_LINK_SPEED_1MBPS:
659 bandwidth = aggregator->num_of_ports;
661 case AD_LINK_SPEED_10MBPS:
662 bandwidth = aggregator->num_of_ports * 10;
664 case AD_LINK_SPEED_100MBPS:
665 bandwidth = aggregator->num_of_ports * 100;
667 case AD_LINK_SPEED_1000MBPS:
668 bandwidth = aggregator->num_of_ports * 1000;
670 case AD_LINK_SPEED_2500MBPS:
671 bandwidth = aggregator->num_of_ports * 2500;
673 case AD_LINK_SPEED_10000MBPS:
674 bandwidth = aggregator->num_of_ports * 10000;
676 case AD_LINK_SPEED_20000MBPS:
677 bandwidth = aggregator->num_of_ports * 20000;
679 case AD_LINK_SPEED_40000MBPS:
680 bandwidth = aggregator->num_of_ports * 40000;
682 case AD_LINK_SPEED_56000MBPS:
683 bandwidth = aggregator->num_of_ports * 56000;
686 bandwidth = 0; /* to silence the compiler */
693 * __get_active_agg - get the current active aggregator
694 * @aggregator: the aggregator we're looking at
696 * Caller must hold RCU lock.
698 static struct aggregator *__get_active_agg(struct aggregator *aggregator)
700 struct bonding *bond = aggregator->slave->bond;
701 struct list_head *iter;
704 bond_for_each_slave_rcu(bond, slave, iter)
705 if (SLAVE_AD_INFO(slave)->aggregator.is_active)
706 return &(SLAVE_AD_INFO(slave)->aggregator);
712 * __update_lacpdu_from_port - update a port's lacpdu fields
713 * @port: the port we're looking at
715 static inline void __update_lacpdu_from_port(struct port *port)
717 struct lacpdu *lacpdu = &port->lacpdu;
718 const struct port_params *partner = &port->partner_oper;
720 /* update current actual Actor parameters
721 * lacpdu->subtype initialized
722 * lacpdu->version_number initialized
723 * lacpdu->tlv_type_actor_info initialized
724 * lacpdu->actor_information_length initialized
727 lacpdu->actor_system_priority = htons(port->actor_system_priority);
728 lacpdu->actor_system = port->actor_system;
729 lacpdu->actor_key = htons(port->actor_oper_port_key);
730 lacpdu->actor_port_priority = htons(port->actor_port_priority);
731 lacpdu->actor_port = htons(port->actor_port_number);
732 lacpdu->actor_state = port->actor_oper_port_state;
733 pr_debug("update lacpdu: %s, actor port state %x\n",
734 port->slave->dev->name, port->actor_oper_port_state);
736 /* lacpdu->reserved_3_1 initialized
737 * lacpdu->tlv_type_partner_info initialized
738 * lacpdu->partner_information_length initialized
741 lacpdu->partner_system_priority = htons(partner->system_priority);
742 lacpdu->partner_system = partner->system;
743 lacpdu->partner_key = htons(partner->key);
744 lacpdu->partner_port_priority = htons(partner->port_priority);
745 lacpdu->partner_port = htons(partner->port_number);
746 lacpdu->partner_state = partner->port_state;
748 /* lacpdu->reserved_3_2 initialized
749 * lacpdu->tlv_type_collector_info initialized
750 * lacpdu->collector_information_length initialized
751 * collector_max_delay initialized
752 * reserved_12[12] initialized
753 * tlv_type_terminator initialized
754 * terminator_length initialized
755 * reserved_50[50] initialized
759 /* ================= main 802.3ad protocol code ========================= */
762 * ad_lacpdu_send - send out a lacpdu packet on a given port
763 * @port: the port we're looking at
765 * Returns: 0 on success
768 static int ad_lacpdu_send(struct port *port)
770 struct slave *slave = port->slave;
772 struct lacpdu_header *lacpdu_header;
773 int length = sizeof(struct lacpdu_header);
775 skb = dev_alloc_skb(length);
779 skb->dev = slave->dev;
780 skb_reset_mac_header(skb);
781 skb->network_header = skb->mac_header + ETH_HLEN;
782 skb->protocol = PKT_TYPE_LACPDU;
783 skb->priority = TC_PRIO_CONTROL;
785 lacpdu_header = (struct lacpdu_header *)skb_put(skb, length);
787 ether_addr_copy(lacpdu_header->hdr.h_dest, lacpdu_mcast_addr);
788 /* Note: source address is set to be the member's PERMANENT address,
789 * because we use it to identify loopback lacpdus in receive.
791 ether_addr_copy(lacpdu_header->hdr.h_source, slave->perm_hwaddr);
792 lacpdu_header->hdr.h_proto = PKT_TYPE_LACPDU;
794 lacpdu_header->lacpdu = port->lacpdu;
802 * ad_marker_send - send marker information/response on a given port
803 * @port: the port we're looking at
804 * @marker: marker data to send
806 * Returns: 0 on success
809 static int ad_marker_send(struct port *port, struct bond_marker *marker)
811 struct slave *slave = port->slave;
813 struct bond_marker_header *marker_header;
814 int length = sizeof(struct bond_marker_header);
816 skb = dev_alloc_skb(length + 16);
820 skb_reserve(skb, 16);
822 skb->dev = slave->dev;
823 skb_reset_mac_header(skb);
824 skb->network_header = skb->mac_header + ETH_HLEN;
825 skb->protocol = PKT_TYPE_LACPDU;
827 marker_header = (struct bond_marker_header *)skb_put(skb, length);
829 ether_addr_copy(marker_header->hdr.h_dest, lacpdu_mcast_addr);
830 /* Note: source address is set to be the member's PERMANENT address,
831 * because we use it to identify loopback MARKERs in receive.
833 ether_addr_copy(marker_header->hdr.h_source, slave->perm_hwaddr);
834 marker_header->hdr.h_proto = PKT_TYPE_LACPDU;
836 marker_header->marker = *marker;
844 * ad_mux_machine - handle a port's mux state machine
845 * @port: the port we're looking at
846 * @update_slave_arr: Does slave array need update?
848 static void ad_mux_machine(struct port *port, bool *update_slave_arr)
850 mux_states_t last_state;
852 /* keep current State Machine state to compare later if it was
855 last_state = port->sm_mux_state;
857 if (port->sm_vars & AD_PORT_BEGIN) {
858 port->sm_mux_state = AD_MUX_DETACHED;
860 switch (port->sm_mux_state) {
861 case AD_MUX_DETACHED:
862 if ((port->sm_vars & AD_PORT_SELECTED)
863 || (port->sm_vars & AD_PORT_STANDBY))
864 /* if SELECTED or STANDBY */
865 port->sm_mux_state = AD_MUX_WAITING;
868 /* if SELECTED == FALSE return to DETACH state */
869 if (!(port->sm_vars & AD_PORT_SELECTED)) {
870 port->sm_vars &= ~AD_PORT_READY_N;
871 /* in order to withhold the Selection Logic to
872 * check all ports READY_N value every callback
873 * cycle to update ready variable, we check
874 * READY_N and update READY here
876 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
877 port->sm_mux_state = AD_MUX_DETACHED;
881 /* check if the wait_while_timer expired */
882 if (port->sm_mux_timer_counter
883 && !(--port->sm_mux_timer_counter))
884 port->sm_vars |= AD_PORT_READY_N;
886 /* in order to withhold the selection logic to check
887 * all ports READY_N value every callback cycle to
888 * update ready variable, we check READY_N and update
891 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
893 /* if the wait_while_timer expired, and the port is
894 * in READY state, move to ATTACHED state
896 if ((port->sm_vars & AD_PORT_READY)
897 && !port->sm_mux_timer_counter)
898 port->sm_mux_state = AD_MUX_ATTACHED;
900 case AD_MUX_ATTACHED:
901 /* check also if agg_select_timer expired (so the
902 * edable port will take place only after this timer)
904 if ((port->sm_vars & AD_PORT_SELECTED) &&
905 (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) &&
906 !__check_agg_selection_timer(port)) {
907 if (port->aggregator->is_active)
909 AD_MUX_COLLECTING_DISTRIBUTING;
910 } else if (!(port->sm_vars & AD_PORT_SELECTED) ||
911 (port->sm_vars & AD_PORT_STANDBY)) {
912 /* if UNSELECTED or STANDBY */
913 port->sm_vars &= ~AD_PORT_READY_N;
914 /* in order to withhold the selection logic to
915 * check all ports READY_N value every callback
916 * cycle to update ready variable, we check
917 * READY_N and update READY here
919 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
920 port->sm_mux_state = AD_MUX_DETACHED;
921 } else if (port->aggregator->is_active) {
922 port->actor_oper_port_state |=
923 AD_STATE_SYNCHRONIZATION;
926 case AD_MUX_COLLECTING_DISTRIBUTING:
927 if (!(port->sm_vars & AD_PORT_SELECTED) ||
928 (port->sm_vars & AD_PORT_STANDBY) ||
929 !(port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) ||
930 !(port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) {
931 port->sm_mux_state = AD_MUX_ATTACHED;
933 /* if port state hasn't changed make
934 * sure that a collecting distributing
935 * port in an active aggregator is enabled
937 if (port->aggregator &&
938 port->aggregator->is_active &&
939 !__port_is_enabled(port)) {
950 /* check if the state machine was changed */
951 if (port->sm_mux_state != last_state) {
952 pr_debug("Mux Machine: Port=%d (%s), Last State=%d, Curr State=%d\n",
953 port->actor_port_number,
954 port->slave->dev->name,
957 switch (port->sm_mux_state) {
958 case AD_MUX_DETACHED:
959 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
960 ad_disable_collecting_distributing(port,
962 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
963 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
967 port->sm_mux_timer_counter = __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER, 0);
969 case AD_MUX_ATTACHED:
970 if (port->aggregator->is_active)
971 port->actor_oper_port_state |=
972 AD_STATE_SYNCHRONIZATION;
974 port->actor_oper_port_state &=
975 ~AD_STATE_SYNCHRONIZATION;
976 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
977 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
978 ad_disable_collecting_distributing(port,
982 case AD_MUX_COLLECTING_DISTRIBUTING:
983 port->actor_oper_port_state |= AD_STATE_COLLECTING;
984 port->actor_oper_port_state |= AD_STATE_DISTRIBUTING;
985 port->actor_oper_port_state |= AD_STATE_SYNCHRONIZATION;
986 ad_enable_collecting_distributing(port,
997 * ad_rx_machine - handle a port's rx State Machine
998 * @lacpdu: the lacpdu we've received
999 * @port: the port we're looking at
1001 * If lacpdu arrived, stop previous timer (if exists) and set the next state as
1002 * CURRENT. If timer expired set the state machine in the proper state.
1003 * In other cases, this function checks if we need to switch to other state.
1005 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port)
1007 rx_states_t last_state;
1009 /* keep current State Machine state to compare later if it was
1012 last_state = port->sm_rx_state;
1014 /* check if state machine should change state */
1016 /* first, check if port was reinitialized */
1017 if (port->sm_vars & AD_PORT_BEGIN) {
1018 port->sm_rx_state = AD_RX_INITIALIZE;
1019 port->sm_vars |= AD_PORT_CHURNED;
1020 /* check if port is not enabled */
1021 } else if (!(port->sm_vars & AD_PORT_BEGIN)
1022 && !port->is_enabled && !(port->sm_vars & AD_PORT_MOVED))
1023 port->sm_rx_state = AD_RX_PORT_DISABLED;
1024 /* check if new lacpdu arrived */
1025 else if (lacpdu && ((port->sm_rx_state == AD_RX_EXPIRED) ||
1026 (port->sm_rx_state == AD_RX_DEFAULTED) ||
1027 (port->sm_rx_state == AD_RX_CURRENT))) {
1028 if (port->sm_rx_state != AD_RX_CURRENT)
1029 port->sm_vars |= AD_PORT_CHURNED;
1030 port->sm_rx_timer_counter = 0;
1031 port->sm_rx_state = AD_RX_CURRENT;
1033 /* if timer is on, and if it is expired */
1034 if (port->sm_rx_timer_counter &&
1035 !(--port->sm_rx_timer_counter)) {
1036 switch (port->sm_rx_state) {
1038 port->sm_rx_state = AD_RX_DEFAULTED;
1041 port->sm_rx_state = AD_RX_EXPIRED;
1047 /* if no lacpdu arrived and no timer is on */
1048 switch (port->sm_rx_state) {
1049 case AD_RX_PORT_DISABLED:
1050 if (port->sm_vars & AD_PORT_MOVED)
1051 port->sm_rx_state = AD_RX_INITIALIZE;
1052 else if (port->is_enabled
1054 & AD_PORT_LACP_ENABLED))
1055 port->sm_rx_state = AD_RX_EXPIRED;
1056 else if (port->is_enabled
1058 & AD_PORT_LACP_ENABLED) == 0))
1059 port->sm_rx_state = AD_RX_LACP_DISABLED;
1068 /* check if the State machine was changed or new lacpdu arrived */
1069 if ((port->sm_rx_state != last_state) || (lacpdu)) {
1070 pr_debug("Rx Machine: Port=%d (%s), Last State=%d, Curr State=%d\n",
1071 port->actor_port_number,
1072 port->slave->dev->name,
1075 switch (port->sm_rx_state) {
1076 case AD_RX_INITIALIZE:
1077 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS))
1078 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1080 port->sm_vars |= AD_PORT_LACP_ENABLED;
1081 port->sm_vars &= ~AD_PORT_SELECTED;
1082 __record_default(port);
1083 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1084 port->sm_vars &= ~AD_PORT_MOVED;
1085 port->sm_rx_state = AD_RX_PORT_DISABLED;
1088 case AD_RX_PORT_DISABLED:
1089 port->sm_vars &= ~AD_PORT_MATCHED;
1091 case AD_RX_LACP_DISABLED:
1092 port->sm_vars &= ~AD_PORT_SELECTED;
1093 __record_default(port);
1094 port->partner_oper.port_state &= ~AD_STATE_AGGREGATION;
1095 port->sm_vars |= AD_PORT_MATCHED;
1096 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1099 /* Reset of the Synchronization flag (Standard 43.4.12)
1100 * This reset cause to disable this port in the
1101 * COLLECTING_DISTRIBUTING state of the mux machine in
1102 * case of EXPIRED even if LINK_DOWN didn't arrive for
1105 port->partner_oper.port_state &= ~AD_STATE_SYNCHRONIZATION;
1106 port->sm_vars &= ~AD_PORT_MATCHED;
1107 port->partner_oper.port_state |= AD_STATE_LACP_TIMEOUT;
1108 port->partner_oper.port_state |= AD_STATE_LACP_ACTIVITY;
1109 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT));
1110 port->actor_oper_port_state |= AD_STATE_EXPIRED;
1111 port->sm_vars |= AD_PORT_CHURNED;
1113 case AD_RX_DEFAULTED:
1114 __update_default_selected(port);
1115 __record_default(port);
1116 port->sm_vars |= AD_PORT_MATCHED;
1117 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1120 /* detect loopback situation */
1121 if (MAC_ADDRESS_EQUAL(&(lacpdu->actor_system),
1122 &(port->actor_system))) {
1123 netdev_err(port->slave->bond->dev, "An illegal loopback occurred on adapter (%s)\n"
1124 "Check the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n",
1125 port->slave->dev->name);
1128 __update_selected(lacpdu, port);
1129 __update_ntt(lacpdu, port);
1130 __record_pdu(lacpdu, port);
1131 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT));
1132 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1141 * ad_churn_machine - handle port churn's state machine
1142 * @port: the port we're looking at
1145 static void ad_churn_machine(struct port *port)
1147 if (port->sm_vars & AD_PORT_CHURNED) {
1148 port->sm_vars &= ~AD_PORT_CHURNED;
1149 port->sm_churn_actor_state = AD_CHURN_MONITOR;
1150 port->sm_churn_partner_state = AD_CHURN_MONITOR;
1151 port->sm_churn_actor_timer_counter =
1152 __ad_timer_to_ticks(AD_ACTOR_CHURN_TIMER, 0);
1153 port->sm_churn_partner_timer_counter =
1154 __ad_timer_to_ticks(AD_PARTNER_CHURN_TIMER, 0);
1157 if (port->sm_churn_actor_timer_counter &&
1158 !(--port->sm_churn_actor_timer_counter) &&
1159 port->sm_churn_actor_state == AD_CHURN_MONITOR) {
1160 if (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION) {
1161 port->sm_churn_actor_state = AD_NO_CHURN;
1163 port->churn_actor_count++;
1164 port->sm_churn_actor_state = AD_CHURN;
1167 if (port->sm_churn_partner_timer_counter &&
1168 !(--port->sm_churn_partner_timer_counter) &&
1169 port->sm_churn_partner_state == AD_CHURN_MONITOR) {
1170 if (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) {
1171 port->sm_churn_partner_state = AD_NO_CHURN;
1173 port->churn_partner_count++;
1174 port->sm_churn_partner_state = AD_CHURN;
1180 * ad_tx_machine - handle a port's tx state machine
1181 * @port: the port we're looking at
1183 static void ad_tx_machine(struct port *port)
1185 /* check if tx timer expired, to verify that we do not send more than
1186 * 3 packets per second
1188 if (port->sm_tx_timer_counter && !(--port->sm_tx_timer_counter)) {
1189 /* check if there is something to send */
1190 if (port->ntt && (port->sm_vars & AD_PORT_LACP_ENABLED)) {
1191 __update_lacpdu_from_port(port);
1193 if (ad_lacpdu_send(port) >= 0) {
1194 pr_debug("Sent LACPDU on port %d\n",
1195 port->actor_port_number);
1197 /* mark ntt as false, so it will not be sent
1198 * again until demanded
1203 /* restart tx timer(to verify that we will not exceed
1204 * AD_MAX_TX_IN_SECOND
1206 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1211 * ad_periodic_machine - handle a port's periodic state machine
1212 * @port: the port we're looking at
1214 * Turn ntt flag on priodically to perform periodic transmission of lacpdu's.
1216 static void ad_periodic_machine(struct port *port)
1218 periodic_states_t last_state;
1220 /* keep current state machine state to compare later if it was changed */
1221 last_state = port->sm_periodic_state;
1223 /* check if port was reinitialized */
1224 if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) ||
1225 (!(port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & AD_STATE_LACP_ACTIVITY))
1227 port->sm_periodic_state = AD_NO_PERIODIC;
1229 /* check if state machine should change state */
1230 else if (port->sm_periodic_timer_counter) {
1231 /* check if periodic state machine expired */
1232 if (!(--port->sm_periodic_timer_counter)) {
1233 /* if expired then do tx */
1234 port->sm_periodic_state = AD_PERIODIC_TX;
1236 /* If not expired, check if there is some new timeout
1237 * parameter from the partner state
1239 switch (port->sm_periodic_state) {
1240 case AD_FAST_PERIODIC:
1241 if (!(port->partner_oper.port_state
1242 & AD_STATE_LACP_TIMEOUT))
1243 port->sm_periodic_state = AD_SLOW_PERIODIC;
1245 case AD_SLOW_PERIODIC:
1246 if ((port->partner_oper.port_state & AD_STATE_LACP_TIMEOUT)) {
1247 port->sm_periodic_timer_counter = 0;
1248 port->sm_periodic_state = AD_PERIODIC_TX;
1256 switch (port->sm_periodic_state) {
1257 case AD_NO_PERIODIC:
1258 port->sm_periodic_state = AD_FAST_PERIODIC;
1260 case AD_PERIODIC_TX:
1261 if (!(port->partner_oper.port_state &
1262 AD_STATE_LACP_TIMEOUT))
1263 port->sm_periodic_state = AD_SLOW_PERIODIC;
1265 port->sm_periodic_state = AD_FAST_PERIODIC;
1272 /* check if the state machine was changed */
1273 if (port->sm_periodic_state != last_state) {
1274 pr_debug("Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n",
1275 port->actor_port_number, last_state,
1276 port->sm_periodic_state);
1277 switch (port->sm_periodic_state) {
1278 case AD_NO_PERIODIC:
1279 port->sm_periodic_timer_counter = 0;
1281 case AD_FAST_PERIODIC:
1282 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1283 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_FAST_PERIODIC_TIME))-1;
1285 case AD_SLOW_PERIODIC:
1286 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1287 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_SLOW_PERIODIC_TIME))-1;
1289 case AD_PERIODIC_TX:
1299 * ad_port_selection_logic - select aggregation groups
1300 * @port: the port we're looking at
1301 * @update_slave_arr: Does slave array need update?
1303 * Select aggregation groups, and assign each port for it's aggregetor. The
1304 * selection logic is called in the inititalization (after all the handshkes),
1305 * and after every lacpdu receive (if selected is off).
1307 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr)
1309 struct aggregator *aggregator, *free_aggregator = NULL, *temp_aggregator;
1310 struct port *last_port = NULL, *curr_port;
1311 struct list_head *iter;
1312 struct bonding *bond;
1313 struct slave *slave;
1316 /* if the port is already Selected, do nothing */
1317 if (port->sm_vars & AD_PORT_SELECTED)
1320 bond = __get_bond_by_port(port);
1322 /* if the port is connected to other aggregator, detach it */
1323 if (port->aggregator) {
1324 /* detach the port from its former aggregator */
1325 temp_aggregator = port->aggregator;
1326 for (curr_port = temp_aggregator->lag_ports; curr_port;
1327 last_port = curr_port,
1328 curr_port = curr_port->next_port_in_aggregator) {
1329 if (curr_port == port) {
1330 temp_aggregator->num_of_ports--;
1331 /* if it is the first port attached to the
1335 temp_aggregator->lag_ports =
1336 port->next_port_in_aggregator;
1338 /* not the first port attached to the
1341 last_port->next_port_in_aggregator =
1342 port->next_port_in_aggregator;
1345 /* clear the port's relations to this
1348 port->aggregator = NULL;
1349 port->next_port_in_aggregator = NULL;
1350 port->actor_port_aggregator_identifier = 0;
1352 netdev_dbg(bond->dev, "Port %d left LAG %d\n",
1353 port->actor_port_number,
1354 temp_aggregator->aggregator_identifier);
1355 /* if the aggregator is empty, clear its
1356 * parameters, and set it ready to be attached
1358 if (!temp_aggregator->lag_ports)
1359 ad_clear_agg(temp_aggregator);
1364 /* meaning: the port was related to an aggregator
1365 * but was not on the aggregator port list
1367 net_warn_ratelimited("%s: Warning: Port %d (on %s) was related to aggregator %d but was not on its port list\n",
1368 port->slave->bond->dev->name,
1369 port->actor_port_number,
1370 port->slave->dev->name,
1371 port->aggregator->aggregator_identifier);
1374 /* search on all aggregators for a suitable aggregator for this port */
1375 bond_for_each_slave(bond, slave, iter) {
1376 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
1378 /* keep a free aggregator for later use(if needed) */
1379 if (!aggregator->lag_ports) {
1380 if (!free_aggregator)
1381 free_aggregator = aggregator;
1384 /* check if current aggregator suits us */
1385 if (((aggregator->actor_oper_aggregator_key == port->actor_oper_port_key) && /* if all parameters match AND */
1386 MAC_ADDRESS_EQUAL(&(aggregator->partner_system), &(port->partner_oper.system)) &&
1387 (aggregator->partner_system_priority == port->partner_oper.system_priority) &&
1388 (aggregator->partner_oper_aggregator_key == port->partner_oper.key)
1390 ((!MAC_ADDRESS_EQUAL(&(port->partner_oper.system), &(null_mac_addr)) && /* partner answers */
1391 !aggregator->is_individual) /* but is not individual OR */
1394 /* attach to the founded aggregator */
1395 port->aggregator = aggregator;
1396 port->actor_port_aggregator_identifier =
1397 port->aggregator->aggregator_identifier;
1398 port->next_port_in_aggregator = aggregator->lag_ports;
1399 port->aggregator->num_of_ports++;
1400 aggregator->lag_ports = port;
1401 netdev_dbg(bond->dev, "Port %d joined LAG %d(existing LAG)\n",
1402 port->actor_port_number,
1403 port->aggregator->aggregator_identifier);
1405 /* mark this port as selected */
1406 port->sm_vars |= AD_PORT_SELECTED;
1412 /* the port couldn't find an aggregator - attach it to a new
1416 if (free_aggregator) {
1417 /* assign port a new aggregator */
1418 port->aggregator = free_aggregator;
1419 port->actor_port_aggregator_identifier =
1420 port->aggregator->aggregator_identifier;
1422 /* update the new aggregator's parameters
1423 * if port was responsed from the end-user
1425 if (port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS)
1426 /* if port is full duplex */
1427 port->aggregator->is_individual = false;
1429 port->aggregator->is_individual = true;
1431 port->aggregator->actor_admin_aggregator_key =
1432 port->actor_admin_port_key;
1433 port->aggregator->actor_oper_aggregator_key =
1434 port->actor_oper_port_key;
1435 port->aggregator->partner_system =
1436 port->partner_oper.system;
1437 port->aggregator->partner_system_priority =
1438 port->partner_oper.system_priority;
1439 port->aggregator->partner_oper_aggregator_key = port->partner_oper.key;
1440 port->aggregator->receive_state = 1;
1441 port->aggregator->transmit_state = 1;
1442 port->aggregator->lag_ports = port;
1443 port->aggregator->num_of_ports++;
1445 /* mark this port as selected */
1446 port->sm_vars |= AD_PORT_SELECTED;
1448 netdev_dbg(bond->dev, "Port %d joined LAG %d(new LAG)\n",
1449 port->actor_port_number,
1450 port->aggregator->aggregator_identifier);
1452 netdev_err(bond->dev, "Port %d (on %s) did not find a suitable aggregator\n",
1453 port->actor_port_number, port->slave->dev->name);
1456 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE
1457 * in all aggregator's ports, else set ready=FALSE in all
1458 * aggregator's ports
1460 __set_agg_ports_ready(port->aggregator,
1461 __agg_ports_are_ready(port->aggregator));
1463 aggregator = __get_first_agg(port);
1464 ad_agg_selection_logic(aggregator, update_slave_arr);
1466 if (!port->aggregator->is_active)
1467 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
1470 /* Decide if "agg" is a better choice for the new active aggregator that
1471 * the current best, according to the ad_select policy.
1473 static struct aggregator *ad_agg_selection_test(struct aggregator *best,
1474 struct aggregator *curr)
1476 /* 0. If no best, select current.
1478 * 1. If the current agg is not individual, and the best is
1479 * individual, select current.
1481 * 2. If current agg is individual and the best is not, keep best.
1483 * 3. Therefore, current and best are both individual or both not
1486 * 3a. If current agg partner replied, and best agg partner did not,
1489 * 3b. If current agg partner did not reply and best agg partner
1490 * did reply, keep best.
1492 * 4. Therefore, current and best both have partner replies or
1493 * both do not, so perform selection policy:
1495 * BOND_AD_COUNT: Select by count of ports. If count is equal,
1496 * select by bandwidth.
1498 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth.
1503 if (!curr->is_individual && best->is_individual)
1506 if (curr->is_individual && !best->is_individual)
1509 if (__agg_has_partner(curr) && !__agg_has_partner(best))
1512 if (!__agg_has_partner(curr) && __agg_has_partner(best))
1515 switch (__get_agg_selection_mode(curr->lag_ports)) {
1517 if (curr->num_of_ports > best->num_of_ports)
1520 if (curr->num_of_ports < best->num_of_ports)
1524 case BOND_AD_STABLE:
1525 case BOND_AD_BANDWIDTH:
1526 if (__get_agg_bandwidth(curr) > __get_agg_bandwidth(best))
1532 net_warn_ratelimited("%s: Impossible agg select mode %d\n",
1533 curr->slave->bond->dev->name,
1534 __get_agg_selection_mode(curr->lag_ports));
1541 static int agg_device_up(const struct aggregator *agg)
1543 struct port *port = agg->lag_ports;
1548 return netif_running(port->slave->dev) &&
1549 netif_carrier_ok(port->slave->dev);
1553 * ad_agg_selection_logic - select an aggregation group for a team
1554 * @aggregator: the aggregator we're looking at
1555 * @update_slave_arr: Does slave array need update?
1557 * It is assumed that only one aggregator may be selected for a team.
1559 * The logic of this function is to select the aggregator according to
1560 * the ad_select policy:
1562 * BOND_AD_STABLE: select the aggregator with the most ports attached to
1563 * it, and to reselect the active aggregator only if the previous
1564 * aggregator has no more ports related to it.
1566 * BOND_AD_BANDWIDTH: select the aggregator with the highest total
1567 * bandwidth, and reselect whenever a link state change takes place or the
1568 * set of slaves in the bond changes.
1570 * BOND_AD_COUNT: select the aggregator with largest number of ports
1571 * (slaves), and reselect whenever a link state change takes place or the
1572 * set of slaves in the bond changes.
1574 * FIXME: this function MUST be called with the first agg in the bond, or
1575 * __get_active_agg() won't work correctly. This function should be better
1576 * called with the bond itself, and retrieve the first agg from it.
1578 static void ad_agg_selection_logic(struct aggregator *agg,
1579 bool *update_slave_arr)
1581 struct aggregator *best, *active, *origin;
1582 struct bonding *bond = agg->slave->bond;
1583 struct list_head *iter;
1584 struct slave *slave;
1589 active = __get_active_agg(agg);
1590 best = (active && agg_device_up(active)) ? active : NULL;
1592 bond_for_each_slave_rcu(bond, slave, iter) {
1593 agg = &(SLAVE_AD_INFO(slave)->aggregator);
1597 if (agg->num_of_ports && agg_device_up(agg))
1598 best = ad_agg_selection_test(best, agg);
1602 __get_agg_selection_mode(best->lag_ports) == BOND_AD_STABLE) {
1603 /* For the STABLE policy, don't replace the old active
1604 * aggregator if it's still active (it has an answering
1605 * partner) or if both the best and active don't have an
1606 * answering partner.
1608 if (active && active->lag_ports &&
1609 active->lag_ports->is_enabled &&
1610 (__agg_has_partner(active) ||
1611 (!__agg_has_partner(active) &&
1612 !__agg_has_partner(best)))) {
1613 if (!(!active->actor_oper_aggregator_key &&
1614 best->actor_oper_aggregator_key)) {
1616 active->is_active = 1;
1621 if (best && (best == active)) {
1623 active->is_active = 1;
1626 /* if there is new best aggregator, activate it */
1628 netdev_dbg(bond->dev, "best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1629 best->aggregator_identifier, best->num_of_ports,
1630 best->actor_oper_aggregator_key,
1631 best->partner_oper_aggregator_key,
1632 best->is_individual, best->is_active);
1633 netdev_dbg(bond->dev, "best ports %p slave %p %s\n",
1634 best->lag_ports, best->slave,
1635 best->slave ? best->slave->dev->name : "NULL");
1637 bond_for_each_slave_rcu(bond, slave, iter) {
1638 agg = &(SLAVE_AD_INFO(slave)->aggregator);
1640 netdev_dbg(bond->dev, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1641 agg->aggregator_identifier, agg->num_of_ports,
1642 agg->actor_oper_aggregator_key,
1643 agg->partner_oper_aggregator_key,
1644 agg->is_individual, agg->is_active);
1647 /* check if any partner replys */
1648 if (best->is_individual) {
1649 net_warn_ratelimited("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n",
1651 best->slave->bond->dev->name : "NULL");
1654 best->is_active = 1;
1655 netdev_dbg(bond->dev, "LAG %d chosen as the active LAG\n",
1656 best->aggregator_identifier);
1657 netdev_dbg(bond->dev, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1658 best->aggregator_identifier, best->num_of_ports,
1659 best->actor_oper_aggregator_key,
1660 best->partner_oper_aggregator_key,
1661 best->is_individual, best->is_active);
1663 /* disable the ports that were related to the former
1667 for (port = active->lag_ports; port;
1668 port = port->next_port_in_aggregator) {
1669 __disable_port(port);
1672 /* Slave array needs update. */
1673 *update_slave_arr = true;
1676 /* if the selected aggregator is of join individuals
1677 * (partner_system is NULL), enable their ports
1679 active = __get_active_agg(origin);
1682 if (!__agg_has_partner(active)) {
1683 for (port = active->lag_ports; port;
1684 port = port->next_port_in_aggregator) {
1685 __enable_port(port);
1692 bond_3ad_set_carrier(bond);
1696 * ad_clear_agg - clear a given aggregator's parameters
1697 * @aggregator: the aggregator we're looking at
1699 static void ad_clear_agg(struct aggregator *aggregator)
1702 aggregator->is_individual = false;
1703 aggregator->actor_admin_aggregator_key = 0;
1704 aggregator->actor_oper_aggregator_key = 0;
1705 aggregator->partner_system = null_mac_addr;
1706 aggregator->partner_system_priority = 0;
1707 aggregator->partner_oper_aggregator_key = 0;
1708 aggregator->receive_state = 0;
1709 aggregator->transmit_state = 0;
1710 aggregator->lag_ports = NULL;
1711 aggregator->is_active = 0;
1712 aggregator->num_of_ports = 0;
1713 pr_debug("LAG %d was cleared\n",
1714 aggregator->aggregator_identifier);
1719 * ad_initialize_agg - initialize a given aggregator's parameters
1720 * @aggregator: the aggregator we're looking at
1722 static void ad_initialize_agg(struct aggregator *aggregator)
1725 ad_clear_agg(aggregator);
1727 aggregator->aggregator_mac_address = null_mac_addr;
1728 aggregator->aggregator_identifier = 0;
1729 aggregator->slave = NULL;
1734 * ad_initialize_port - initialize a given port's parameters
1735 * @aggregator: the aggregator we're looking at
1736 * @lacp_fast: boolean. whether fast periodic should be used
1738 static void ad_initialize_port(struct port *port, int lacp_fast)
1740 static const struct port_params tmpl = {
1741 .system_priority = 0xffff,
1744 .port_priority = 0xff,
1747 static const struct lacpdu lacpdu = {
1749 .version_number = 0x01,
1750 .tlv_type_actor_info = 0x01,
1751 .actor_information_length = 0x14,
1752 .tlv_type_partner_info = 0x02,
1753 .partner_information_length = 0x14,
1754 .tlv_type_collector_info = 0x03,
1755 .collector_information_length = 0x10,
1756 .collector_max_delay = htons(AD_COLLECTOR_MAX_DELAY),
1760 port->actor_port_priority = 0xff;
1761 port->actor_port_aggregator_identifier = 0;
1763 port->actor_admin_port_state = AD_STATE_AGGREGATION |
1764 AD_STATE_LACP_ACTIVITY;
1765 port->actor_oper_port_state = AD_STATE_AGGREGATION |
1766 AD_STATE_LACP_ACTIVITY;
1769 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
1771 memcpy(&port->partner_admin, &tmpl, sizeof(tmpl));
1772 memcpy(&port->partner_oper, &tmpl, sizeof(tmpl));
1774 port->is_enabled = true;
1775 /* private parameters */
1776 port->sm_vars = AD_PORT_BEGIN | AD_PORT_LACP_ENABLED;
1777 port->sm_rx_state = 0;
1778 port->sm_rx_timer_counter = 0;
1779 port->sm_periodic_state = 0;
1780 port->sm_periodic_timer_counter = 0;
1781 port->sm_mux_state = 0;
1782 port->sm_mux_timer_counter = 0;
1783 port->sm_tx_state = 0;
1784 port->aggregator = NULL;
1785 port->next_port_in_aggregator = NULL;
1786 port->transaction_id = 0;
1788 port->sm_churn_actor_timer_counter = 0;
1789 port->sm_churn_actor_state = 0;
1790 port->churn_actor_count = 0;
1791 port->sm_churn_partner_timer_counter = 0;
1792 port->sm_churn_partner_state = 0;
1793 port->churn_partner_count = 0;
1795 memcpy(&port->lacpdu, &lacpdu, sizeof(lacpdu));
1800 * ad_enable_collecting_distributing - enable a port's transmit/receive
1801 * @port: the port we're looking at
1802 * @update_slave_arr: Does slave array need update?
1804 * Enable @port if it's in an active aggregator
1806 static void ad_enable_collecting_distributing(struct port *port,
1807 bool *update_slave_arr)
1809 if (port->aggregator->is_active) {
1810 pr_debug("Enabling port %d(LAG %d)\n",
1811 port->actor_port_number,
1812 port->aggregator->aggregator_identifier);
1813 __enable_port(port);
1814 /* Slave array needs update */
1815 *update_slave_arr = true;
1820 * ad_disable_collecting_distributing - disable a port's transmit/receive
1821 * @port: the port we're looking at
1822 * @update_slave_arr: Does slave array need update?
1824 static void ad_disable_collecting_distributing(struct port *port,
1825 bool *update_slave_arr)
1827 if (port->aggregator &&
1828 !MAC_ADDRESS_EQUAL(&(port->aggregator->partner_system),
1829 &(null_mac_addr))) {
1830 pr_debug("Disabling port %d(LAG %d)\n",
1831 port->actor_port_number,
1832 port->aggregator->aggregator_identifier);
1833 __disable_port(port);
1834 /* Slave array needs an update */
1835 *update_slave_arr = true;
1840 * ad_marker_info_received - handle receive of a Marker information frame
1841 * @marker_info: Marker info received
1842 * @port: the port we're looking at
1844 static void ad_marker_info_received(struct bond_marker *marker_info,
1847 struct bond_marker marker;
1849 /* copy the received marker data to the response marker */
1850 memcpy(&marker, marker_info, sizeof(struct bond_marker));
1851 /* change the marker subtype to marker response */
1852 marker.tlv_type = AD_MARKER_RESPONSE_SUBTYPE;
1854 /* send the marker response */
1855 if (ad_marker_send(port, &marker) >= 0) {
1856 pr_debug("Sent Marker Response on port %d\n",
1857 port->actor_port_number);
/**
 * ad_marker_response_received - handle receive of a marker response frame
 * @marker: marker PDU received
 * @port: the port we're looking at
 *
 * Intentionally empty: this module only answers marker information frames.
 * It never sends marker PDUs of its own, so there is no response to handle
 * at this stage.
 */
static void ad_marker_response_received(struct bond_marker *marker,
					struct port *port)
{
	/* nothing to do: handling of marker responses is not implemented */
}

/* ========= AD exported functions to the main bonding code ========= */

/* Check the status of the aggregators in the team every T seconds */
#define AD_AGGREGATOR_SELECTION_TIMER  8

1882 * bond_3ad_initiate_agg_selection - initate aggregator selection
1883 * @bond: bonding struct
1885 * Set the aggregation selection timer, to initiate an agg selection in
1886 * the very near future. Called during first initialization, and during
1887 * any down to up transitions of the bond.
1889 void bond_3ad_initiate_agg_selection(struct bonding *bond, int timeout)
1891 BOND_AD_INFO(bond).agg_select_timer = timeout;
1895 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures
1896 * @bond: bonding struct to work on
1897 * @tick_resolution: tick duration (millisecond resolution)
1899 * Can be called only after the mac address of the bond is set.
1901 void bond_3ad_initialize(struct bonding *bond, u16 tick_resolution)
1903 /* check that the bond is not initialized yet */
1904 if (!MAC_ADDRESS_EQUAL(&(BOND_AD_INFO(bond).system.sys_mac_addr),
1905 bond->dev->dev_addr)) {
1907 BOND_AD_INFO(bond).aggregator_identifier = 0;
1909 BOND_AD_INFO(bond).system.sys_priority =
1910 bond->params.ad_actor_sys_prio;
1911 if (is_zero_ether_addr(bond->params.ad_actor_system))
1912 BOND_AD_INFO(bond).system.sys_mac_addr =
1913 *((struct mac_addr *)bond->dev->dev_addr);
1915 BOND_AD_INFO(bond).system.sys_mac_addr =
1916 *((struct mac_addr *)bond->params.ad_actor_system);
1918 /* initialize how many times this module is called in one
1919 * second (should be about every 100ms)
1921 ad_ticks_per_sec = tick_resolution;
1923 bond_3ad_initiate_agg_selection(bond,
1924 AD_AGGREGATOR_SELECTION_TIMER *
1930 * bond_3ad_bind_slave - initialize a slave's port
1931 * @slave: slave struct to work on
1933 * Returns: 0 on success
1936 void bond_3ad_bind_slave(struct slave *slave)
1938 struct bonding *bond = bond_get_bond_by_slave(slave);
1940 struct aggregator *aggregator;
1942 /* check that the slave has not been initialized yet. */
1943 if (SLAVE_AD_INFO(slave)->port.slave != slave) {
1945 /* port initialization */
1946 port = &(SLAVE_AD_INFO(slave)->port);
1948 ad_initialize_port(port, bond->params.lacp_fast);
1950 port->slave = slave;
1951 port->actor_port_number = SLAVE_AD_INFO(slave)->id;
1952 /* key is determined according to the link speed, duplex and
1955 port->actor_admin_port_key = bond->params.ad_user_port_key << 6;
1956 port->actor_admin_port_key |= __get_duplex(port);
1957 port->actor_admin_port_key |= (__get_link_speed(port) << 1);
1958 port->actor_oper_port_key = port->actor_admin_port_key;
1959 /* if the port is not full duplex, then the port should be not
1962 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS))
1963 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1964 /* actor system is the bond's system */
1965 port->actor_system = BOND_AD_INFO(bond).system.sys_mac_addr;
1966 port->actor_system_priority =
1967 BOND_AD_INFO(bond).system.sys_priority;
1968 /* tx timer(to verify that no more than MAX_TX_IN_SECOND
1969 * lacpdu's are sent in one second)
1971 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1973 __disable_port(port);
1975 /* aggregator initialization */
1976 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
1978 ad_initialize_agg(aggregator);
1980 aggregator->aggregator_mac_address = *((struct mac_addr *)bond->dev->dev_addr);
1981 aggregator->aggregator_identifier = ++BOND_AD_INFO(bond).aggregator_identifier;
1982 aggregator->slave = slave;
1983 aggregator->is_active = 0;
1984 aggregator->num_of_ports = 0;
1989 * bond_3ad_unbind_slave - deinitialize a slave's port
1990 * @slave: slave struct to work on
1992 * Search for the aggregator that is related to this port, remove the
1993 * aggregator and assign another aggregator for other port related to it
1994 * (if any), and remove the port.
1996 void bond_3ad_unbind_slave(struct slave *slave)
1998 struct port *port, *prev_port, *temp_port;
1999 struct aggregator *aggregator, *new_aggregator, *temp_aggregator;
2000 int select_new_active_agg = 0;
2001 struct bonding *bond = slave->bond;
2002 struct slave *slave_iter;
2003 struct list_head *iter;
2004 bool dummy_slave_update; /* Ignore this value as caller updates array */
2006 /* Sync against bond_3ad_state_machine_handler() */
2007 spin_lock_bh(&bond->mode_lock);
2008 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
2009 port = &(SLAVE_AD_INFO(slave)->port);
2011 /* if slave is null, the whole port is not initialized */
2013 netdev_warn(bond->dev, "Trying to unbind an uninitialized port on %s\n",
2018 netdev_dbg(bond->dev, "Unbinding Link Aggregation Group %d\n",
2019 aggregator->aggregator_identifier);
2021 /* Tell the partner that this port is not suitable for aggregation */
2022 port->actor_oper_port_state &= ~AD_STATE_AGGREGATION;
2023 __update_lacpdu_from_port(port);
2024 ad_lacpdu_send(port);
2026 /* check if this aggregator is occupied */
2027 if (aggregator->lag_ports) {
2028 /* check if there are other ports related to this aggregator
2029 * except the port related to this slave(thats ensure us that
2030 * there is a reason to search for new aggregator, and that we
2033 if ((aggregator->lag_ports != port) ||
2034 (aggregator->lag_ports->next_port_in_aggregator)) {
2035 /* find new aggregator for the related port(s) */
2036 bond_for_each_slave(bond, slave_iter, iter) {
2037 new_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
2038 /* if the new aggregator is empty, or it is
2039 * connected to our port only
2041 if (!new_aggregator->lag_ports ||
2042 ((new_aggregator->lag_ports == port) &&
2043 !new_aggregator->lag_ports->next_port_in_aggregator))
2047 new_aggregator = NULL;
2049 /* if new aggregator found, copy the aggregator's
2050 * parameters and connect the related lag_ports to the
2053 if ((new_aggregator) && ((!new_aggregator->lag_ports) || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator))) {
2054 netdev_dbg(bond->dev, "Some port(s) related to LAG %d - replacing with LAG %d\n",
2055 aggregator->aggregator_identifier,
2056 new_aggregator->aggregator_identifier);
2058 if ((new_aggregator->lag_ports == port) &&
2059 new_aggregator->is_active) {
2060 netdev_info(bond->dev, "Removing an active aggregator\n");
2061 select_new_active_agg = 1;
2064 new_aggregator->is_individual = aggregator->is_individual;
2065 new_aggregator->actor_admin_aggregator_key = aggregator->actor_admin_aggregator_key;
2066 new_aggregator->actor_oper_aggregator_key = aggregator->actor_oper_aggregator_key;
2067 new_aggregator->partner_system = aggregator->partner_system;
2068 new_aggregator->partner_system_priority = aggregator->partner_system_priority;
2069 new_aggregator->partner_oper_aggregator_key = aggregator->partner_oper_aggregator_key;
2070 new_aggregator->receive_state = aggregator->receive_state;
2071 new_aggregator->transmit_state = aggregator->transmit_state;
2072 new_aggregator->lag_ports = aggregator->lag_ports;
2073 new_aggregator->is_active = aggregator->is_active;
2074 new_aggregator->num_of_ports = aggregator->num_of_ports;
2076 /* update the information that is written on
2077 * the ports about the aggregator
2079 for (temp_port = aggregator->lag_ports; temp_port;
2080 temp_port = temp_port->next_port_in_aggregator) {
2081 temp_port->aggregator = new_aggregator;
2082 temp_port->actor_port_aggregator_identifier = new_aggregator->aggregator_identifier;
2085 ad_clear_agg(aggregator);
2087 if (select_new_active_agg)
2088 ad_agg_selection_logic(__get_first_agg(port),
2089 &dummy_slave_update);
2091 netdev_warn(bond->dev, "unbinding aggregator, and could not find a new aggregator for its ports\n");
2094 /* in case that the only port related to this
2095 * aggregator is the one we want to remove
2097 select_new_active_agg = aggregator->is_active;
2098 ad_clear_agg(aggregator);
2099 if (select_new_active_agg) {
2100 netdev_info(bond->dev, "Removing an active aggregator\n");
2101 /* select new active aggregator */
2102 temp_aggregator = __get_first_agg(port);
2103 if (temp_aggregator)
2104 ad_agg_selection_logic(temp_aggregator,
2105 &dummy_slave_update);
2110 netdev_dbg(bond->dev, "Unbinding port %d\n", port->actor_port_number);
2112 /* find the aggregator that this port is connected to */
2113 bond_for_each_slave(bond, slave_iter, iter) {
2114 temp_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
2116 /* search the port in the aggregator's related ports */
2117 for (temp_port = temp_aggregator->lag_ports; temp_port;
2118 prev_port = temp_port,
2119 temp_port = temp_port->next_port_in_aggregator) {
2120 if (temp_port == port) {
2121 /* the aggregator found - detach the port from
2125 prev_port->next_port_in_aggregator = temp_port->next_port_in_aggregator;
2127 temp_aggregator->lag_ports = temp_port->next_port_in_aggregator;
2128 temp_aggregator->num_of_ports--;
2129 if (temp_aggregator->num_of_ports == 0) {
2130 select_new_active_agg = temp_aggregator->is_active;
2131 ad_clear_agg(temp_aggregator);
2132 if (select_new_active_agg) {
2133 netdev_info(bond->dev, "Removing an active aggregator\n");
2134 /* select new active aggregator */
2135 ad_agg_selection_logic(__get_first_agg(port),
2136 &dummy_slave_update);
2146 spin_unlock_bh(&bond->mode_lock);
2150 * bond_3ad_state_machine_handler - handle state machines timeout
2151 * @bond: bonding struct to work on
2153 * The state machine handling concept in this module is to check every tick
2154 * which state machine should operate any function. The execution order is
2155 * round robin, so when we have an interaction between state machines, the
2156 * reply of one to each other might be delayed until next tick.
2158 * This function also complete the initialization when the agg_select_timer
2159 * times out, and it selects an aggregator for the ports that are yet not
2160 * related to any aggregator, and selects the active aggregator for a bond.
2162 void bond_3ad_state_machine_handler(struct work_struct *work)
2164 struct bonding *bond = container_of(work, struct bonding,
2166 struct aggregator *aggregator;
2167 struct list_head *iter;
2168 struct slave *slave;
2170 bool should_notify_rtnl = BOND_SLAVE_NOTIFY_LATER;
2171 bool update_slave_arr = false;
2173 /* Lock to protect data accessed by all (e.g., port->sm_vars) and
2174 * against running with bond_3ad_unbind_slave. ad_rx_machine may run
2175 * concurrently due to incoming LACPDU as well.
2177 spin_lock_bh(&bond->mode_lock);
2180 /* check if there are any slaves */
2181 if (!bond_has_slaves(bond))
2184 /* check if agg_select_timer timer after initialize is timed out */
2185 if (BOND_AD_INFO(bond).agg_select_timer &&
2186 !(--BOND_AD_INFO(bond).agg_select_timer)) {
2187 slave = bond_first_slave_rcu(bond);
2188 port = slave ? &(SLAVE_AD_INFO(slave)->port) : NULL;
2190 /* select the active aggregator for the bond */
2193 net_warn_ratelimited("%s: Warning: bond's first port is uninitialized\n",
2198 aggregator = __get_first_agg(port);
2199 ad_agg_selection_logic(aggregator, &update_slave_arr);
2201 bond_3ad_set_carrier(bond);
2204 /* for each port run the state machines */
2205 bond_for_each_slave_rcu(bond, slave, iter) {
2206 port = &(SLAVE_AD_INFO(slave)->port);
2208 net_warn_ratelimited("%s: Warning: Found an uninitialized port\n",
2213 ad_rx_machine(NULL, port);
2214 ad_periodic_machine(port);
2215 ad_port_selection_logic(port, &update_slave_arr);
2216 ad_mux_machine(port, &update_slave_arr);
2217 ad_tx_machine(port);
2218 ad_churn_machine(port);
2220 /* turn off the BEGIN bit, since we already handled it */
2221 if (port->sm_vars & AD_PORT_BEGIN)
2222 port->sm_vars &= ~AD_PORT_BEGIN;
2226 bond_for_each_slave_rcu(bond, slave, iter) {
2227 if (slave->should_notify) {
2228 should_notify_rtnl = BOND_SLAVE_NOTIFY_NOW;
2233 spin_unlock_bh(&bond->mode_lock);
2235 if (update_slave_arr)
2236 bond_slave_arr_work_rearm(bond, 0);
2238 if (should_notify_rtnl && rtnl_trylock()) {
2239 bond_slave_state_notify(bond);
2242 queue_delayed_work(bond->wq, &bond->ad_work, ad_delta_in_ticks);
2246 * bond_3ad_rx_indication - handle a received frame
2247 * @lacpdu: received lacpdu
2248 * @slave: slave struct to work on
2249 * @length: length of the data received
2251 * It is assumed that frames that were sent on this NIC don't returned as new
2252 * received frames (loopback). Since only the payload is given to this
2253 * function, it check for loopback.
2255 static int bond_3ad_rx_indication(struct lacpdu *lacpdu, struct slave *slave,
2259 int ret = RX_HANDLER_ANOTHER;
2261 if (length >= sizeof(struct lacpdu)) {
2263 port = &(SLAVE_AD_INFO(slave)->port);
2266 net_warn_ratelimited("%s: Warning: port of slave %s is uninitialized\n",
2267 slave->dev->name, slave->bond->dev->name);
2271 switch (lacpdu->subtype) {
2272 case AD_TYPE_LACPDU:
2273 ret = RX_HANDLER_CONSUMED;
2274 netdev_dbg(slave->bond->dev,
2275 "Received LACPDU on port %d slave %s\n",
2276 port->actor_port_number,
2278 /* Protect against concurrent state machines */
2279 spin_lock(&slave->bond->mode_lock);
2280 ad_rx_machine(lacpdu, port);
2281 spin_unlock(&slave->bond->mode_lock);
2284 case AD_TYPE_MARKER:
2285 ret = RX_HANDLER_CONSUMED;
2286 /* No need to convert fields to Little Endian since we
2287 * don't use the marker's fields.
2290 switch (((struct bond_marker *)lacpdu)->tlv_type) {
2291 case AD_MARKER_INFORMATION_SUBTYPE:
2292 netdev_dbg(slave->bond->dev, "Received Marker Information on port %d\n",
2293 port->actor_port_number);
2294 ad_marker_info_received((struct bond_marker *)lacpdu, port);
2297 case AD_MARKER_RESPONSE_SUBTYPE:
2298 netdev_dbg(slave->bond->dev, "Received Marker Response on port %d\n",
2299 port->actor_port_number);
2300 ad_marker_response_received((struct bond_marker *)lacpdu, port);
2304 netdev_dbg(slave->bond->dev, "Received an unknown Marker subtype on slot %d\n",
2305 port->actor_port_number);
2313 * bond_3ad_adapter_speed_changed - handle a slave's speed change indication
2314 * @slave: slave struct to work on
2316 * Handle reselection of aggregator (if needed) for this port.
2318 void bond_3ad_adapter_speed_changed(struct slave *slave)
2322 port = &(SLAVE_AD_INFO(slave)->port);
2324 /* if slave is null, the whole port is not initialized */
2326 netdev_warn(slave->bond->dev, "speed changed for uninitialized port on %s\n",
2331 spin_lock_bh(&slave->bond->mode_lock);
2333 port->actor_admin_port_key &= ~AD_SPEED_KEY_MASKS;
2334 port->actor_admin_port_key |= __get_link_speed(port) << 1;
2335 port->actor_oper_port_key = port->actor_admin_port_key;
2336 netdev_dbg(slave->bond->dev, "Port %d changed speed\n", port->actor_port_number);
2337 /* there is no need to reselect a new aggregator, just signal the
2338 * state machines to reinitialize
2340 port->sm_vars |= AD_PORT_BEGIN;
2342 spin_unlock_bh(&slave->bond->mode_lock);
2346 * bond_3ad_adapter_duplex_changed - handle a slave's duplex change indication
2347 * @slave: slave struct to work on
2349 * Handle reselection of aggregator (if needed) for this port.
2351 void bond_3ad_adapter_duplex_changed(struct slave *slave)
2355 port = &(SLAVE_AD_INFO(slave)->port);
2357 /* if slave is null, the whole port is not initialized */
2359 netdev_warn(slave->bond->dev, "duplex changed for uninitialized port on %s\n",
2364 spin_lock_bh(&slave->bond->mode_lock);
2366 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_MASKS;
2367 port->actor_admin_port_key |= __get_duplex(port);
2368 port->actor_oper_port_key = port->actor_admin_port_key;
2369 netdev_dbg(slave->bond->dev, "Port %d slave %s changed duplex\n",
2370 port->actor_port_number, slave->dev->name);
2371 if (port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS)
2372 port->sm_vars |= AD_PORT_LACP_ENABLED;
2373 /* there is no need to reselect a new aggregator, just signal the
2374 * state machines to reinitialize
2376 port->sm_vars |= AD_PORT_BEGIN;
2378 spin_unlock_bh(&slave->bond->mode_lock);
2382 * bond_3ad_handle_link_change - handle a slave's link status change indication
2383 * @slave: slave struct to work on
2384 * @status: whether the link is now up or down
2386 * Handle reselection of aggregator (if needed) for this port.
2388 void bond_3ad_handle_link_change(struct slave *slave, char link)
2392 port = &(SLAVE_AD_INFO(slave)->port);
2394 /* if slave is null, the whole port is not initialized */
2396 netdev_warn(slave->bond->dev, "link status changed for uninitialized port on %s\n",
2401 spin_lock_bh(&slave->bond->mode_lock);
2402 /* on link down we are zeroing duplex and speed since
2403 * some of the adaptors(ce1000.lan) report full duplex/speed
2404 * instead of N/A(duplex) / 0(speed).
2406 * on link up we are forcing recheck on the duplex and speed since
2407 * some of he adaptors(ce1000.lan) report.
2409 port->actor_admin_port_key &= ~(AD_DUPLEX_KEY_MASKS|AD_SPEED_KEY_MASKS);
2410 if (link == BOND_LINK_UP) {
2411 port->is_enabled = true;
2412 port->actor_admin_port_key |=
2413 (__get_link_speed(port) << 1) | __get_duplex(port);
2414 if (port->actor_admin_port_key & AD_DUPLEX_KEY_MASKS)
2415 port->sm_vars |= AD_PORT_LACP_ENABLED;
2417 /* link has failed */
2418 port->is_enabled = false;
2419 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
2421 port->actor_oper_port_key = port->actor_admin_port_key;
2422 netdev_dbg(slave->bond->dev, "Port %d changed link status to %s\n",
2423 port->actor_port_number,
2424 link == BOND_LINK_UP ? "UP" : "DOWN");
2425 /* there is no need to reselect a new aggregator, just signal the
2426 * state machines to reinitialize
2428 port->sm_vars |= AD_PORT_BEGIN;
2430 spin_unlock_bh(&slave->bond->mode_lock);
2432 /* RTNL is held and mode_lock is released so it's safe
2433 * to update slave_array here.
2435 bond_update_slave_arr(slave->bond, NULL);
2439 * bond_3ad_set_carrier - set link state for bonding master
2440 * @bond - bonding structure
2442 * if we have an active aggregator, we're up, if not, we're down.
2443 * Presumes that we cannot have an active aggregator if there are
2444 * no slaves with link up.
2446 * This behavior complies with IEEE 802.3 section 43.3.9.
2448 * Called by bond_set_carrier(). Return zero if carrier state does not
2449 * change, nonzero if it does.
2451 int bond_3ad_set_carrier(struct bonding *bond)
2453 struct aggregator *active;
2454 struct slave *first_slave;
2458 first_slave = bond_first_slave_rcu(bond);
2463 active = __get_active_agg(&(SLAVE_AD_INFO(first_slave)->aggregator));
2465 /* are enough slaves available to consider link up? */
2466 if (active->num_of_ports < bond->params.min_links) {
2467 if (netif_carrier_ok(bond->dev)) {
2468 netif_carrier_off(bond->dev);
2471 } else if (!netif_carrier_ok(bond->dev)) {
2472 netif_carrier_on(bond->dev);
2475 } else if (netif_carrier_ok(bond->dev)) {
2476 netif_carrier_off(bond->dev);
2484 * __bond_3ad_get_active_agg_info - get information of the active aggregator
2485 * @bond: bonding struct to work on
2486 * @ad_info: ad_info struct to fill with the bond's info
2488 * Returns: 0 on success
2491 int __bond_3ad_get_active_agg_info(struct bonding *bond,
2492 struct ad_info *ad_info)
2494 struct aggregator *aggregator = NULL;
2495 struct list_head *iter;
2496 struct slave *slave;
2499 bond_for_each_slave_rcu(bond, slave, iter) {
2500 port = &(SLAVE_AD_INFO(slave)->port);
2501 if (port->aggregator && port->aggregator->is_active) {
2502 aggregator = port->aggregator;
2510 ad_info->aggregator_id = aggregator->aggregator_identifier;
2511 ad_info->ports = aggregator->num_of_ports;
2512 ad_info->actor_key = aggregator->actor_oper_aggregator_key;
2513 ad_info->partner_key = aggregator->partner_oper_aggregator_key;
2514 ether_addr_copy(ad_info->partner_system,
2515 aggregator->partner_system.mac_addr_value);
/* Wrapper around __bond_3ad_get_active_agg_info() that provides the RCU
 * read-side section itself; returns whatever the helper returns.
 */
int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info)
{
	int ret;

	rcu_read_lock();
	ret = __bond_3ad_get_active_agg_info(bond, ad_info);
	rcu_read_unlock();

	return ret;
}
2530 int bond_3ad_lacpdu_recv(const struct sk_buff *skb, struct bonding *bond,
2531 struct slave *slave)
2533 struct lacpdu *lacpdu, _lacpdu;
2535 if (skb->protocol != PKT_TYPE_LACPDU)
2536 return RX_HANDLER_ANOTHER;
2538 if (!MAC_ADDRESS_EQUAL(eth_hdr(skb)->h_dest, lacpdu_mcast_addr))
2539 return RX_HANDLER_ANOTHER;
2541 lacpdu = skb_header_pointer(skb, 0, sizeof(_lacpdu), &_lacpdu);
2543 return RX_HANDLER_ANOTHER;
2545 return bond_3ad_rx_indication(lacpdu, slave, skb->len);
2549 * bond_3ad_update_lacp_rate - change the lacp rate
2550 * @bond - bonding struct
2552 * When modify lacp_rate parameter via sysfs,
2553 * update actor_oper_port_state of each port.
2555 * Hold bond->mode_lock,
2556 * so we can modify port->actor_oper_port_state,
2557 * no matter bond is up or down.
2559 void bond_3ad_update_lacp_rate(struct bonding *bond)
2561 struct port *port = NULL;
2562 struct list_head *iter;
2563 struct slave *slave;
2566 lacp_fast = bond->params.lacp_fast;
2567 spin_lock_bh(&bond->mode_lock);
2568 bond_for_each_slave(bond, slave, iter) {
2569 port = &(SLAVE_AD_INFO(slave)->port);
2571 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
2573 port->actor_oper_port_state &= ~AD_STATE_LACP_TIMEOUT;
2575 spin_unlock_bh(&bond->mode_lock);