1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
6 #include <linux/skbuff.h>
7 #include <linux/if_ether.h>
8 #include <linux/netdevice.h>
9 #include <linux/spinlock.h>
10 #include <linux/ethtool.h>
11 #include <linux/etherdevice.h>
12 #include <linux/if_bonding.h>
13 #include <linux/pkt_sched.h>
14 #include <net/net_namespace.h>
15 #include <net/bonding.h>
16 #include <net/bond_3ad.h>
17 #include <net/netlink.h>
/* General definitions */
#define AD_SHORT_TIMEOUT           1
#define AD_LONG_TIMEOUT            0
#define AD_STANDBY                 0x2
#define AD_MAX_TX_IN_SECOND        3
#define AD_COLLECTOR_MAX_DELAY     0

/* Timer definitions (43.4.4 in the 802.3ad standard) */
#define AD_FAST_PERIODIC_TIME      1
#define AD_SLOW_PERIODIC_TIME      30
#define AD_SHORT_TIMEOUT_TIME      (3*AD_FAST_PERIODIC_TIME)
#define AD_LONG_TIMEOUT_TIME       (3*AD_SLOW_PERIODIC_TIME)
#define AD_CHURN_DETECTION_TIME    60
#define AD_AGGREGATE_WAIT_TIME     2

/* Port Variables definitions used by the State Machines (43.4.7 in the
 * 802.3ad standard)
 *
 * These are bit flags stored together in a port's sm_vars field.
 */
#define AD_PORT_BEGIN           0x1
#define AD_PORT_LACP_ENABLED    0x2
#define AD_PORT_ACTOR_CHURN     0x4
#define AD_PORT_PARTNER_CHURN   0x8
#define AD_PORT_READY           0x10
#define AD_PORT_READY_N         0x20
#define AD_PORT_MATCHED         0x40
#define AD_PORT_STANDBY         0x80
#define AD_PORT_SELECTED        0x100
#define AD_PORT_MOVED           0x200
#define AD_PORT_CHURNED         (AD_PORT_ACTOR_CHURN | AD_PORT_PARTNER_CHURN)

/* Port Key definitions
 * key is determined according to the link speed, duplex and
 * user key (which is not yet supported)
 *           --------------------------------------------------------------
 * Port key  | User key (10 bits)           | Speed (5 bits)      | Duplex|
 *           --------------------------------------------------------------
 *           |15                           6|5                   1|0
 */
#define  AD_DUPLEX_KEY_MASKS    0x1
#define  AD_SPEED_KEY_MASKS     0x3E
#define  AD_USER_KEY_MASKS      0xFFC0
/* Link speed codes used by the 802.3ad code in this file.
 *
 * Values are assigned consecutively starting at 1, so 0 is left free to
 * mean "no/unknown speed" (see __get_link_speed()).
 */
enum ad_link_speed_type {
	AD_LINK_SPEED_1MBPS = 1,
	AD_LINK_SPEED_10MBPS,
	AD_LINK_SPEED_100MBPS,
	AD_LINK_SPEED_1000MBPS,
	AD_LINK_SPEED_2500MBPS,
	AD_LINK_SPEED_5000MBPS,
	AD_LINK_SPEED_10000MBPS,
	AD_LINK_SPEED_14000MBPS,
	AD_LINK_SPEED_20000MBPS,
	AD_LINK_SPEED_25000MBPS,
	AD_LINK_SPEED_40000MBPS,
	AD_LINK_SPEED_50000MBPS,
	AD_LINK_SPEED_56000MBPS,
	AD_LINK_SPEED_100000MBPS,
	AD_LINK_SPEED_200000MBPS,
	AD_LINK_SPEED_400000MBPS,
	AD_LINK_SPEED_800000MBPS,
};
81 /* compare MAC addresses */
82 #define MAC_ADDRESS_EQUAL(A, B) \
83 ether_addr_equal_64bits((const u8 *)A, (const u8 *)B)
85 static const u8 null_mac_addr[ETH_ALEN + 2] __long_aligned = {
89 static const u16 ad_ticks_per_sec = 1000 / AD_TIMER_INTERVAL;
90 static const int ad_delta_in_ticks = (AD_TIMER_INTERVAL * HZ) / 1000;
92 const u8 lacpdu_mcast_addr[ETH_ALEN + 2] __long_aligned = {
93 0x01, 0x80, 0xC2, 0x00, 0x00, 0x02
96 /* ================= main 802.3ad protocol functions ================== */
97 static int ad_lacpdu_send(struct port *port);
98 static int ad_marker_send(struct port *port, struct bond_marker *marker);
99 static void ad_mux_machine(struct port *port, bool *update_slave_arr);
100 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port);
101 static void ad_tx_machine(struct port *port);
102 static void ad_periodic_machine(struct port *port, struct bond_params *bond_params);
103 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr);
104 static void ad_agg_selection_logic(struct aggregator *aggregator,
105 bool *update_slave_arr);
106 static void ad_clear_agg(struct aggregator *aggregator);
107 static void ad_initialize_agg(struct aggregator *aggregator);
108 static void ad_initialize_port(struct port *port, int lacp_fast);
109 static void ad_enable_collecting_distributing(struct port *port,
110 bool *update_slave_arr);
111 static void ad_disable_collecting_distributing(struct port *port,
112 bool *update_slave_arr);
113 static void ad_marker_info_received(struct bond_marker *marker_info,
115 static void ad_marker_response_received(struct bond_marker *marker,
117 static void ad_update_actor_keys(struct port *port, bool reset);
120 /* ================= api to bonding and kernel code ================== */
123 * __get_bond_by_port - get the port's bonding struct
124 * @port: the port we're looking at
126 * Return @port's bonding struct, or %NULL if it can't be found.
128 static inline struct bonding *__get_bond_by_port(struct port *port)
130 if (port->slave == NULL)
133 return bond_get_bond_by_slave(port->slave);
137 * __get_first_agg - get the first aggregator in the bond
138 * @port: the port we're looking at
140 * Return the aggregator of the first slave in @bond, or %NULL if it can't be
142 * The caller must hold RCU or RTNL lock.
144 static inline struct aggregator *__get_first_agg(struct port *port)
146 struct bonding *bond = __get_bond_by_port(port);
147 struct slave *first_slave;
148 struct aggregator *agg;
150 /* If there's no bond for this port, or bond has no slaves */
155 first_slave = bond_first_slave_rcu(bond);
156 agg = first_slave ? &(SLAVE_AD_INFO(first_slave)->aggregator) : NULL;
163 * __agg_has_partner - see if we have a partner
164 * @agg: the agregator we're looking at
166 * Return nonzero if aggregator has a partner (denoted by a non-zero ether
167 * address for the partner). Return 0 if not.
169 static inline int __agg_has_partner(struct aggregator *agg)
171 return !is_zero_ether_addr(agg->partner_system.mac_addr_value);
175 * __disable_port - disable the port's slave
176 * @port: the port we're looking at
178 static inline void __disable_port(struct port *port)
180 bond_set_slave_inactive_flags(port->slave, BOND_SLAVE_NOTIFY_LATER);
184 * __enable_port - enable the port's slave, if it's up
185 * @port: the port we're looking at
187 static inline void __enable_port(struct port *port)
189 struct slave *slave = port->slave;
191 if ((slave->link == BOND_LINK_UP) && bond_slave_is_up(slave))
192 bond_set_slave_active_flags(slave, BOND_SLAVE_NOTIFY_LATER);
196 * __port_is_enabled - check if the port's slave is in active state
197 * @port: the port we're looking at
199 static inline int __port_is_enabled(struct port *port)
201 return bond_is_active_slave(port->slave);
205 * __get_agg_selection_mode - get the aggregator selection mode
206 * @port: the port we're looking at
208 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT.
210 static inline u32 __get_agg_selection_mode(struct port *port)
212 struct bonding *bond = __get_bond_by_port(port);
215 return BOND_AD_STABLE;
217 return bond->params.ad_select;
221 * __check_agg_selection_timer - check if the selection timer has expired
222 * @port: the port we're looking at
224 static inline int __check_agg_selection_timer(struct port *port)
226 struct bonding *bond = __get_bond_by_port(port);
231 return atomic_read(&BOND_AD_INFO(bond).agg_select_timer) ? 1 : 0;
235 * __get_link_speed - get a port's speed
236 * @port: the port we're looking at
238 * Return @port's speed in 802.3ad enum format. i.e. one of:
240 * %AD_LINK_SPEED_10MBPS,
241 * %AD_LINK_SPEED_100MBPS,
242 * %AD_LINK_SPEED_1000MBPS,
243 * %AD_LINK_SPEED_2500MBPS,
244 * %AD_LINK_SPEED_5000MBPS,
245 * %AD_LINK_SPEED_10000MBPS
246 * %AD_LINK_SPEED_14000MBPS,
247 * %AD_LINK_SPEED_20000MBPS
248 * %AD_LINK_SPEED_25000MBPS
249 * %AD_LINK_SPEED_40000MBPS
250 * %AD_LINK_SPEED_50000MBPS
251 * %AD_LINK_SPEED_56000MBPS
252 * %AD_LINK_SPEED_100000MBPS
253 * %AD_LINK_SPEED_200000MBPS
254 * %AD_LINK_SPEED_400000MBPS
255 * %AD_LINK_SPEED_800000MBPS
257 static u16 __get_link_speed(struct port *port)
259 struct slave *slave = port->slave;
262 /* this if covers only a special case: when the configuration starts
263 * with link down, it sets the speed to 0.
264 * This is done in spite of the fact that the e100 driver reports 0
265 * to be compatible with MVT in the future.
267 if (slave->link != BOND_LINK_UP)
270 switch (slave->speed) {
272 speed = AD_LINK_SPEED_10MBPS;
276 speed = AD_LINK_SPEED_100MBPS;
280 speed = AD_LINK_SPEED_1000MBPS;
284 speed = AD_LINK_SPEED_2500MBPS;
288 speed = AD_LINK_SPEED_5000MBPS;
292 speed = AD_LINK_SPEED_10000MBPS;
296 speed = AD_LINK_SPEED_14000MBPS;
300 speed = AD_LINK_SPEED_20000MBPS;
304 speed = AD_LINK_SPEED_25000MBPS;
308 speed = AD_LINK_SPEED_40000MBPS;
312 speed = AD_LINK_SPEED_50000MBPS;
316 speed = AD_LINK_SPEED_56000MBPS;
320 speed = AD_LINK_SPEED_100000MBPS;
324 speed = AD_LINK_SPEED_200000MBPS;
328 speed = AD_LINK_SPEED_400000MBPS;
332 speed = AD_LINK_SPEED_800000MBPS;
336 /* unknown speed value from ethtool. shouldn't happen */
337 if (slave->speed != SPEED_UNKNOWN)
338 pr_err_once("%s: (slave %s): unknown ethtool speed (%d) for port %d (set it to 0)\n",
339 slave->bond->dev->name,
340 slave->dev->name, slave->speed,
341 port->actor_port_number);
347 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received link speed %d update from adapter\n",
348 port->actor_port_number, speed);
353 * __get_duplex - get a port's duplex
354 * @port: the port we're looking at
356 * Return @port's duplex in 802.3ad bitmask format. i.e.:
357 * 0x01 if in full duplex
360 static u8 __get_duplex(struct port *port)
362 struct slave *slave = port->slave;
365 /* handling a special case: when the configuration starts with
366 * link down, it sets the duplex to 0.
368 if (slave->link == BOND_LINK_UP) {
369 switch (slave->duplex) {
372 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received status full duplex update from adapter\n",
373 port->actor_port_number);
378 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received status NOT full duplex update from adapter\n",
379 port->actor_port_number);
386 static void __ad_actor_update_port(struct port *port)
388 const struct bonding *bond = bond_get_bond_by_slave(port->slave);
390 port->actor_system = BOND_AD_INFO(bond).system.sys_mac_addr;
391 port->actor_system_priority = BOND_AD_INFO(bond).system.sys_priority;
397 * __ad_timer_to_ticks - convert a given timer type to AD module ticks
398 * @timer_type: which timer to operate
399 * @par: timer parameter. see below
401 * If @timer_type is %current_while_timer, @par indicates long/short timer.
402 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME,
403 * %SLOW_PERIODIC_TIME.
405 static u16 __ad_timer_to_ticks(u16 timer_type, u16 par)
407 u16 retval = 0; /* to silence the compiler */
409 switch (timer_type) {
410 case AD_CURRENT_WHILE_TIMER: /* for rx machine usage */
412 retval = (AD_SHORT_TIMEOUT_TIME*ad_ticks_per_sec);
414 retval = (AD_LONG_TIMEOUT_TIME*ad_ticks_per_sec);
416 case AD_ACTOR_CHURN_TIMER: /* for local churn machine */
417 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
419 case AD_PERIODIC_TIMER: /* for periodic machine */
420 retval = (par*ad_ticks_per_sec); /* long timeout */
422 case AD_PARTNER_CHURN_TIMER: /* for remote churn machine */
423 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
425 case AD_WAIT_WHILE_TIMER: /* for selection machine */
426 retval = (AD_AGGREGATE_WAIT_TIME*ad_ticks_per_sec);
434 /* ================= ad_rx_machine helper functions ================== */
437 * __choose_matched - update a port's matched variable from a received lacpdu
438 * @lacpdu: the lacpdu we've received
439 * @port: the port we're looking at
441 * Update the value of the matched variable, using parameter values from a
442 * newly received lacpdu. Parameter values for the partner carried in the
443 * received PDU are compared with the corresponding operational parameter
444 * values for the actor. Matched is set to TRUE if all of these parameters
445 * match and the PDU parameter partner_state.aggregation has the same value as
446 * actor_oper_port_state.aggregation and lacp will actively maintain the link
447 * in the aggregation. Matched is also set to TRUE if the value of
448 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates
449 * an individual link and lacp will actively maintain the link. Otherwise,
450 * matched is set to FALSE. LACP is considered to be actively maintaining the
451 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both
452 * the actor's actor_oper_port_state.lacp_activity and the PDU's
453 * partner_state.lacp_activity variables are TRUE.
455 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is
456 * used here to implement the language from 802.3ad 43.4.9 that requires
457 * recordPDU to "match" the LACPDU parameters to the stored values.
459 static void __choose_matched(struct lacpdu *lacpdu, struct port *port)
461 /* check if all parameters are alike
462 * or this is individual link(aggregation == FALSE)
463 * then update the state machine Matched variable.
465 if (((ntohs(lacpdu->partner_port) == port->actor_port_number) &&
466 (ntohs(lacpdu->partner_port_priority) == port->actor_port_priority) &&
467 MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) &&
468 (ntohs(lacpdu->partner_system_priority) == port->actor_system_priority) &&
469 (ntohs(lacpdu->partner_key) == port->actor_oper_port_key) &&
470 ((lacpdu->partner_state & LACP_STATE_AGGREGATION) == (port->actor_oper_port_state & LACP_STATE_AGGREGATION))) ||
471 ((lacpdu->actor_state & LACP_STATE_AGGREGATION) == 0)
473 port->sm_vars |= AD_PORT_MATCHED;
475 port->sm_vars &= ~AD_PORT_MATCHED;
480 * __record_pdu - record parameters from a received lacpdu
481 * @lacpdu: the lacpdu we've received
482 * @port: the port we're looking at
484 * Record the parameter values for the Actor carried in a received lacpdu as
485 * the current partner operational parameter values and sets
486 * actor_oper_port_state.defaulted to FALSE.
488 static void __record_pdu(struct lacpdu *lacpdu, struct port *port)
490 if (lacpdu && port) {
491 struct port_params *partner = &port->partner_oper;
493 __choose_matched(lacpdu, port);
494 /* record the new parameter values for the partner
497 partner->port_number = ntohs(lacpdu->actor_port);
498 partner->port_priority = ntohs(lacpdu->actor_port_priority);
499 partner->system = lacpdu->actor_system;
500 partner->system_priority = ntohs(lacpdu->actor_system_priority);
501 partner->key = ntohs(lacpdu->actor_key);
502 partner->port_state = lacpdu->actor_state;
504 /* set actor_oper_port_state.defaulted to FALSE */
505 port->actor_oper_port_state &= ~LACP_STATE_DEFAULTED;
507 /* set the partner sync. to on if the partner is sync,
508 * and the port is matched
510 if ((port->sm_vars & AD_PORT_MATCHED) &&
511 (lacpdu->actor_state & LACP_STATE_SYNCHRONIZATION)) {
512 partner->port_state |= LACP_STATE_SYNCHRONIZATION;
513 slave_dbg(port->slave->bond->dev, port->slave->dev,
516 partner->port_state &= ~LACP_STATE_SYNCHRONIZATION;
517 slave_dbg(port->slave->bond->dev, port->slave->dev,
524 * __record_default - record default parameters
525 * @port: the port we're looking at
527 * This function records the default parameter values for the partner carried
528 * in the Partner Admin parameters as the current partner operational parameter
529 * values and sets actor_oper_port_state.defaulted to TRUE.
531 static void __record_default(struct port *port)
534 /* record the partner admin parameters */
535 memcpy(&port->partner_oper, &port->partner_admin,
536 sizeof(struct port_params));
538 /* set actor_oper_port_state.defaulted to true */
539 port->actor_oper_port_state |= LACP_STATE_DEFAULTED;
544 * __update_selected - update a port's Selected variable from a received lacpdu
545 * @lacpdu: the lacpdu we've received
546 * @port: the port we're looking at
548 * Update the value of the selected variable, using parameter values from a
549 * newly received lacpdu. The parameter values for the Actor carried in the
550 * received PDU are compared with the corresponding operational parameter
551 * values for the ports partner. If one or more of the comparisons shows that
552 * the value(s) received in the PDU differ from the current operational values,
553 * then selected is set to FALSE and actor_oper_port_state.synchronization is
554 * set to out_of_sync. Otherwise, selected remains unchanged.
556 static void __update_selected(struct lacpdu *lacpdu, struct port *port)
558 if (lacpdu && port) {
559 const struct port_params *partner = &port->partner_oper;
561 /* check if any parameter is different then
562 * update the state machine selected variable.
564 if (ntohs(lacpdu->actor_port) != partner->port_number ||
565 ntohs(lacpdu->actor_port_priority) != partner->port_priority ||
566 !MAC_ADDRESS_EQUAL(&lacpdu->actor_system, &partner->system) ||
567 ntohs(lacpdu->actor_system_priority) != partner->system_priority ||
568 ntohs(lacpdu->actor_key) != partner->key ||
569 (lacpdu->actor_state & LACP_STATE_AGGREGATION) != (partner->port_state & LACP_STATE_AGGREGATION)) {
570 port->sm_vars &= ~AD_PORT_SELECTED;
576 * __update_default_selected - update a port's Selected variable from Partner
577 * @port: the port we're looking at
579 * This function updates the value of the selected variable, using the partner
580 * administrative parameter values. The administrative values are compared with
581 * the corresponding operational parameter values for the partner. If one or
582 * more of the comparisons shows that the administrative value(s) differ from
583 * the current operational values, then Selected is set to FALSE and
584 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise,
585 * Selected remains unchanged.
587 static void __update_default_selected(struct port *port)
590 const struct port_params *admin = &port->partner_admin;
591 const struct port_params *oper = &port->partner_oper;
593 /* check if any parameter is different then
594 * update the state machine selected variable.
596 if (admin->port_number != oper->port_number ||
597 admin->port_priority != oper->port_priority ||
598 !MAC_ADDRESS_EQUAL(&admin->system, &oper->system) ||
599 admin->system_priority != oper->system_priority ||
600 admin->key != oper->key ||
601 (admin->port_state & LACP_STATE_AGGREGATION)
602 != (oper->port_state & LACP_STATE_AGGREGATION)) {
603 port->sm_vars &= ~AD_PORT_SELECTED;
609 * __update_ntt - update a port's ntt variable from a received lacpdu
610 * @lacpdu: the lacpdu we've received
611 * @port: the port we're looking at
613 * Updates the value of the ntt variable, using parameter values from a newly
614 * received lacpdu. The parameter values for the partner carried in the
615 * received PDU are compared with the corresponding operational parameter
616 * values for the Actor. If one or more of the comparisons shows that the
617 * value(s) received in the PDU differ from the current operational values,
618 * then ntt is set to TRUE. Otherwise, ntt remains unchanged.
620 static void __update_ntt(struct lacpdu *lacpdu, struct port *port)
622 /* validate lacpdu and port */
623 if (lacpdu && port) {
624 /* check if any parameter is different then
625 * update the port->ntt.
627 if ((ntohs(lacpdu->partner_port) != port->actor_port_number) ||
628 (ntohs(lacpdu->partner_port_priority) != port->actor_port_priority) ||
629 !MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) ||
630 (ntohs(lacpdu->partner_system_priority) != port->actor_system_priority) ||
631 (ntohs(lacpdu->partner_key) != port->actor_oper_port_key) ||
632 ((lacpdu->partner_state & LACP_STATE_LACP_ACTIVITY) != (port->actor_oper_port_state & LACP_STATE_LACP_ACTIVITY)) ||
633 ((lacpdu->partner_state & LACP_STATE_LACP_TIMEOUT) != (port->actor_oper_port_state & LACP_STATE_LACP_TIMEOUT)) ||
634 ((lacpdu->partner_state & LACP_STATE_SYNCHRONIZATION) != (port->actor_oper_port_state & LACP_STATE_SYNCHRONIZATION)) ||
635 ((lacpdu->partner_state & LACP_STATE_AGGREGATION) != (port->actor_oper_port_state & LACP_STATE_AGGREGATION))
643 * __agg_ports_are_ready - check if all ports in an aggregator are ready
644 * @aggregator: the aggregator we're looking at
647 static int __agg_ports_are_ready(struct aggregator *aggregator)
653 /* scan all ports in this aggregator to verfy if they are
656 for (port = aggregator->lag_ports;
658 port = port->next_port_in_aggregator) {
659 if (!(port->sm_vars & AD_PORT_READY_N)) {
670 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator
671 * @aggregator: the aggregator we're looking at
672 * @val: Should the ports' ready bit be set on or off
675 static void __set_agg_ports_ready(struct aggregator *aggregator, int val)
679 for (port = aggregator->lag_ports; port;
680 port = port->next_port_in_aggregator) {
682 port->sm_vars |= AD_PORT_READY;
684 port->sm_vars &= ~AD_PORT_READY;
688 static int __agg_active_ports(struct aggregator *agg)
693 for (port = agg->lag_ports; port;
694 port = port->next_port_in_aggregator) {
695 if (port->is_enabled)
703 * __get_agg_bandwidth - get the total bandwidth of an aggregator
704 * @aggregator: the aggregator we're looking at
707 static u32 __get_agg_bandwidth(struct aggregator *aggregator)
709 int nports = __agg_active_ports(aggregator);
713 switch (__get_link_speed(aggregator->lag_ports)) {
714 case AD_LINK_SPEED_1MBPS:
717 case AD_LINK_SPEED_10MBPS:
718 bandwidth = nports * 10;
720 case AD_LINK_SPEED_100MBPS:
721 bandwidth = nports * 100;
723 case AD_LINK_SPEED_1000MBPS:
724 bandwidth = nports * 1000;
726 case AD_LINK_SPEED_2500MBPS:
727 bandwidth = nports * 2500;
729 case AD_LINK_SPEED_5000MBPS:
730 bandwidth = nports * 5000;
732 case AD_LINK_SPEED_10000MBPS:
733 bandwidth = nports * 10000;
735 case AD_LINK_SPEED_14000MBPS:
736 bandwidth = nports * 14000;
738 case AD_LINK_SPEED_20000MBPS:
739 bandwidth = nports * 20000;
741 case AD_LINK_SPEED_25000MBPS:
742 bandwidth = nports * 25000;
744 case AD_LINK_SPEED_40000MBPS:
745 bandwidth = nports * 40000;
747 case AD_LINK_SPEED_50000MBPS:
748 bandwidth = nports * 50000;
750 case AD_LINK_SPEED_56000MBPS:
751 bandwidth = nports * 56000;
753 case AD_LINK_SPEED_100000MBPS:
754 bandwidth = nports * 100000;
756 case AD_LINK_SPEED_200000MBPS:
757 bandwidth = nports * 200000;
759 case AD_LINK_SPEED_400000MBPS:
760 bandwidth = nports * 400000;
762 case AD_LINK_SPEED_800000MBPS:
763 bandwidth = nports * 800000;
766 bandwidth = 0; /* to silence the compiler */
773 * __get_active_agg - get the current active aggregator
774 * @aggregator: the aggregator we're looking at
776 * Caller must hold RCU lock.
778 static struct aggregator *__get_active_agg(struct aggregator *aggregator)
780 struct bonding *bond = aggregator->slave->bond;
781 struct list_head *iter;
784 bond_for_each_slave_rcu(bond, slave, iter)
785 if (SLAVE_AD_INFO(slave)->aggregator.is_active)
786 return &(SLAVE_AD_INFO(slave)->aggregator);
792 * __update_lacpdu_from_port - update a port's lacpdu fields
793 * @port: the port we're looking at
795 static inline void __update_lacpdu_from_port(struct port *port)
797 struct lacpdu *lacpdu = &port->lacpdu;
798 const struct port_params *partner = &port->partner_oper;
800 /* update current actual Actor parameters
801 * lacpdu->subtype initialized
802 * lacpdu->version_number initialized
803 * lacpdu->tlv_type_actor_info initialized
804 * lacpdu->actor_information_length initialized
807 lacpdu->actor_system_priority = htons(port->actor_system_priority);
808 lacpdu->actor_system = port->actor_system;
809 lacpdu->actor_key = htons(port->actor_oper_port_key);
810 lacpdu->actor_port_priority = htons(port->actor_port_priority);
811 lacpdu->actor_port = htons(port->actor_port_number);
812 lacpdu->actor_state = port->actor_oper_port_state;
813 slave_dbg(port->slave->bond->dev, port->slave->dev,
814 "update lacpdu: actor port state %x\n",
815 port->actor_oper_port_state);
817 /* lacpdu->reserved_3_1 initialized
818 * lacpdu->tlv_type_partner_info initialized
819 * lacpdu->partner_information_length initialized
822 lacpdu->partner_system_priority = htons(partner->system_priority);
823 lacpdu->partner_system = partner->system;
824 lacpdu->partner_key = htons(partner->key);
825 lacpdu->partner_port_priority = htons(partner->port_priority);
826 lacpdu->partner_port = htons(partner->port_number);
827 lacpdu->partner_state = partner->port_state;
829 /* lacpdu->reserved_3_2 initialized
830 * lacpdu->tlv_type_collector_info initialized
831 * lacpdu->collector_information_length initialized
832 * collector_max_delay initialized
833 * reserved_12[12] initialized
834 * tlv_type_terminator initialized
835 * terminator_length initialized
836 * reserved_50[50] initialized
840 /* ================= main 802.3ad protocol code ========================= */
843 * ad_lacpdu_send - send out a lacpdu packet on a given port
844 * @port: the port we're looking at
846 * Returns: 0 on success
849 static int ad_lacpdu_send(struct port *port)
851 struct slave *slave = port->slave;
853 struct lacpdu_header *lacpdu_header;
854 int length = sizeof(struct lacpdu_header);
856 skb = dev_alloc_skb(length);
860 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_tx);
861 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.lacpdu_tx);
863 skb->dev = slave->dev;
864 skb_reset_mac_header(skb);
865 skb->network_header = skb->mac_header + ETH_HLEN;
866 skb->protocol = PKT_TYPE_LACPDU;
867 skb->priority = TC_PRIO_CONTROL;
869 lacpdu_header = skb_put(skb, length);
871 ether_addr_copy(lacpdu_header->hdr.h_dest, lacpdu_mcast_addr);
872 /* Note: source address is set to be the member's PERMANENT address,
873 * because we use it to identify loopback lacpdus in receive.
875 ether_addr_copy(lacpdu_header->hdr.h_source, slave->perm_hwaddr);
876 lacpdu_header->hdr.h_proto = PKT_TYPE_LACPDU;
878 lacpdu_header->lacpdu = port->lacpdu;
886 * ad_marker_send - send marker information/response on a given port
887 * @port: the port we're looking at
888 * @marker: marker data to send
890 * Returns: 0 on success
893 static int ad_marker_send(struct port *port, struct bond_marker *marker)
895 struct slave *slave = port->slave;
897 struct bond_marker_header *marker_header;
898 int length = sizeof(struct bond_marker_header);
900 skb = dev_alloc_skb(length + 16);
904 switch (marker->tlv_type) {
905 case AD_MARKER_INFORMATION_SUBTYPE:
906 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.marker_tx);
907 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.marker_tx);
909 case AD_MARKER_RESPONSE_SUBTYPE:
910 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.marker_resp_tx);
911 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.marker_resp_tx);
915 skb_reserve(skb, 16);
917 skb->dev = slave->dev;
918 skb_reset_mac_header(skb);
919 skb->network_header = skb->mac_header + ETH_HLEN;
920 skb->protocol = PKT_TYPE_LACPDU;
922 marker_header = skb_put(skb, length);
924 ether_addr_copy(marker_header->hdr.h_dest, lacpdu_mcast_addr);
925 /* Note: source address is set to be the member's PERMANENT address,
926 * because we use it to identify loopback MARKERs in receive.
928 ether_addr_copy(marker_header->hdr.h_source, slave->perm_hwaddr);
929 marker_header->hdr.h_proto = PKT_TYPE_LACPDU;
931 marker_header->marker = *marker;
939 * ad_mux_machine - handle a port's mux state machine
940 * @port: the port we're looking at
941 * @update_slave_arr: Does slave array need update?
943 static void ad_mux_machine(struct port *port, bool *update_slave_arr)
945 mux_states_t last_state;
947 /* keep current State Machine state to compare later if it was
950 last_state = port->sm_mux_state;
952 if (port->sm_vars & AD_PORT_BEGIN) {
953 port->sm_mux_state = AD_MUX_DETACHED;
955 switch (port->sm_mux_state) {
956 case AD_MUX_DETACHED:
957 if ((port->sm_vars & AD_PORT_SELECTED)
958 || (port->sm_vars & AD_PORT_STANDBY))
959 /* if SELECTED or STANDBY */
960 port->sm_mux_state = AD_MUX_WAITING;
963 /* if SELECTED == FALSE return to DETACH state */
964 if (!(port->sm_vars & AD_PORT_SELECTED)) {
965 port->sm_vars &= ~AD_PORT_READY_N;
966 /* in order to withhold the Selection Logic to
967 * check all ports READY_N value every callback
968 * cycle to update ready variable, we check
969 * READY_N and update READY here
971 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
972 port->sm_mux_state = AD_MUX_DETACHED;
976 /* check if the wait_while_timer expired */
977 if (port->sm_mux_timer_counter
978 && !(--port->sm_mux_timer_counter))
979 port->sm_vars |= AD_PORT_READY_N;
981 /* in order to withhold the selection logic to check
982 * all ports READY_N value every callback cycle to
983 * update ready variable, we check READY_N and update
986 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
988 /* if the wait_while_timer expired, and the port is
989 * in READY state, move to ATTACHED state
991 if ((port->sm_vars & AD_PORT_READY)
992 && !port->sm_mux_timer_counter)
993 port->sm_mux_state = AD_MUX_ATTACHED;
995 case AD_MUX_ATTACHED:
996 /* check also if agg_select_timer expired (so the
997 * edable port will take place only after this timer)
999 if ((port->sm_vars & AD_PORT_SELECTED) &&
1000 (port->partner_oper.port_state & LACP_STATE_SYNCHRONIZATION) &&
1001 !__check_agg_selection_timer(port)) {
1002 if (port->aggregator->is_active)
1003 port->sm_mux_state =
1004 AD_MUX_COLLECTING_DISTRIBUTING;
1005 } else if (!(port->sm_vars & AD_PORT_SELECTED) ||
1006 (port->sm_vars & AD_PORT_STANDBY)) {
1007 /* if UNSELECTED or STANDBY */
1008 port->sm_vars &= ~AD_PORT_READY_N;
1009 /* in order to withhold the selection logic to
1010 * check all ports READY_N value every callback
1011 * cycle to update ready variable, we check
1012 * READY_N and update READY here
1014 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
1015 port->sm_mux_state = AD_MUX_DETACHED;
1016 } else if (port->aggregator->is_active) {
1017 port->actor_oper_port_state |=
1018 LACP_STATE_SYNCHRONIZATION;
1021 case AD_MUX_COLLECTING_DISTRIBUTING:
1022 if (!(port->sm_vars & AD_PORT_SELECTED) ||
1023 (port->sm_vars & AD_PORT_STANDBY) ||
1024 !(port->partner_oper.port_state & LACP_STATE_SYNCHRONIZATION) ||
1025 !(port->actor_oper_port_state & LACP_STATE_SYNCHRONIZATION)) {
1026 port->sm_mux_state = AD_MUX_ATTACHED;
1028 /* if port state hasn't changed make
1029 * sure that a collecting distributing
1030 * port in an active aggregator is enabled
1032 if (port->aggregator &&
1033 port->aggregator->is_active &&
1034 !__port_is_enabled(port)) {
1035 __enable_port(port);
1036 *update_slave_arr = true;
1045 /* check if the state machine was changed */
1046 if (port->sm_mux_state != last_state) {
1047 slave_dbg(port->slave->bond->dev, port->slave->dev,
1048 "Mux Machine: Port=%d, Last State=%d, Curr State=%d\n",
1049 port->actor_port_number,
1051 port->sm_mux_state);
1052 switch (port->sm_mux_state) {
1053 case AD_MUX_DETACHED:
1054 port->actor_oper_port_state &= ~LACP_STATE_SYNCHRONIZATION;
1055 ad_disable_collecting_distributing(port,
1057 port->actor_oper_port_state &= ~LACP_STATE_COLLECTING;
1058 port->actor_oper_port_state &= ~LACP_STATE_DISTRIBUTING;
1061 case AD_MUX_WAITING:
1062 port->sm_mux_timer_counter = __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER, 0);
1064 case AD_MUX_ATTACHED:
1065 if (port->aggregator->is_active)
1066 port->actor_oper_port_state |=
1067 LACP_STATE_SYNCHRONIZATION;
1069 port->actor_oper_port_state &=
1070 ~LACP_STATE_SYNCHRONIZATION;
1071 port->actor_oper_port_state &= ~LACP_STATE_COLLECTING;
1072 port->actor_oper_port_state &= ~LACP_STATE_DISTRIBUTING;
1073 ad_disable_collecting_distributing(port,
1077 case AD_MUX_COLLECTING_DISTRIBUTING:
1078 port->actor_oper_port_state |= LACP_STATE_COLLECTING;
1079 port->actor_oper_port_state |= LACP_STATE_DISTRIBUTING;
1080 port->actor_oper_port_state |= LACP_STATE_SYNCHRONIZATION;
1081 ad_enable_collecting_distributing(port,
1092 * ad_rx_machine - handle a port's rx State Machine
1093 * @lacpdu: the lacpdu we've received
1094 * @port: the port we're looking at
1096 * If lacpdu arrived, stop previous timer (if exists) and set the next state as
1097 * CURRENT. If timer expired set the state machine in the proper state.
1098 * In other cases, this function checks if we need to switch to other state.
// Receive (RX) state machine step for one port.
// @lacpdu: LACPDU handed in by the caller; it is tested for NULL below, so
//          NULL means that no PDU accompanies this call.
// @port:   port whose sm_rx_state, sm_vars and rx timer are updated.
// Phase 1 picks the next sm_rx_state; phase 2 runs the entry actions of the
// resulting state when the state changed or a PDU was supplied.
// NOTE(review): this listing omits some source lines (braces, else, break and
// a few case labels); the notes below describe only what is visible.
1100 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port)
1102 rx_states_t last_state;
1104 /* keep current State Machine state to compare later if it was
1107 last_state = port->sm_rx_state;
// Count the PDU in the per-slave and the per-bond statistics.
// NOTE(review): the line just before these two is elided; presumably it
// guards them with a non-NULL lacpdu test - confirm.
1110 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.lacpdu_rx);
1111 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.lacpdu_rx);
1113 /* check if state machine should change state */
1115 /* first, check if port was reinitialized */
1116 if (port->sm_vars & AD_PORT_BEGIN) {
1117 port->sm_rx_state = AD_RX_INITIALIZE;
// AD_PORT_CHURNED is both churn bits (actor and partner) at once.
1118 port->sm_vars |= AD_PORT_CHURNED;
1119 /* check if port is not enabled */
// NOTE(review): the BEGIN test below is always true here, because this is the
// else-branch of the BEGIN check above; only is_enabled decides.
1120 } else if (!(port->sm_vars & AD_PORT_BEGIN) && !port->is_enabled)
1121 port->sm_rx_state = AD_RX_PORT_DISABLED;
1122 /* check if new lacpdu arrived */
1123 else if (lacpdu && ((port->sm_rx_state == AD_RX_EXPIRED) ||
1124 (port->sm_rx_state == AD_RX_DEFAULTED) ||
1125 (port->sm_rx_state == AD_RX_CURRENT))) {
// Entering CURRENT from EXPIRED or DEFAULTED raises the churn flags.
1126 if (port->sm_rx_state != AD_RX_CURRENT)
1127 port->sm_vars |= AD_PORT_CHURNED;
// Stop the rx timer; it is loaded again further down where the PDU is
// recorded.
1128 port->sm_rx_timer_counter = 0;
1129 port->sm_rx_state = AD_RX_CURRENT;
1131 /* if timer is on, and if it is expired */
// A non-zero timer is decremented on this call; the switch below runs only on
// the call where it reaches zero.
1132 if (port->sm_rx_timer_counter &&
1133 !(--port->sm_rx_timer_counter)) {
1134 switch (port->sm_rx_state) {
// The case labels selecting the next two assignments are elided here.
1136 port->sm_rx_state = AD_RX_DEFAULTED;
1139 port->sm_rx_state = AD_RX_EXPIRED;
1145 /* if no lacpdu arrived and no timer is on */
1146 switch (port->sm_rx_state) {
1147 case AD_RX_PORT_DISABLED:
// An enabled port leaves PORT_DISABLED: to EXPIRED when LACP is enabled for
// it, to LACP_DISABLED when it is not.
1148 if (port->is_enabled &&
1149 (port->sm_vars & AD_PORT_LACP_ENABLED))
1150 port->sm_rx_state = AD_RX_EXPIRED;
1151 else if (port->is_enabled
1153 & AD_PORT_LACP_ENABLED) == 0))
1154 port->sm_rx_state = AD_RX_LACP_DISABLED;
1163 /* check if the State machine was changed or new lacpdu arrived */
1164 if ((port->sm_rx_state != last_state) || (lacpdu)) {
1165 slave_dbg(port->slave->bond->dev, port->slave->dev,
1166 "Rx Machine: Port=%d, Last State=%d, Curr State=%d\n",
1167 port->actor_port_number,
1170 switch (port->sm_rx_state) {
1171 case AD_RX_INITIALIZE:
// The lowest bit of the port key is the duplex bit (AD_DUPLEX_KEY_MASKS).
// With it clear LACP is switched off for the port; the set on the line after
// next presumably sits under an elided else - confirm.
1172 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS))
1173 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1175 port->sm_vars |= AD_PORT_LACP_ENABLED;
1176 port->sm_vars &= ~AD_PORT_SELECTED;
1177 __record_default(port);
1178 port->actor_oper_port_state &= ~LACP_STATE_EXPIRED;
// INITIALIZE is left at once: the state is moved on to PORT_DISABLED.
// Whether control also continues into the next case depends on lines that
// are not shown here.
1179 port->sm_rx_state = AD_RX_PORT_DISABLED;
1182 case AD_RX_PORT_DISABLED:
1183 port->sm_vars &= ~AD_PORT_MATCHED;
1185 case AD_RX_LACP_DISABLED:
1186 port->sm_vars &= ~AD_PORT_SELECTED;
1187 __record_default(port);
1188 port->partner_oper.port_state &= ~LACP_STATE_AGGREGATION;
1189 port->sm_vars |= AD_PORT_MATCHED;
1190 port->actor_oper_port_state &= ~LACP_STATE_EXPIRED;
1193 /* Reset of the Synchronization flag (Standard 43.4.12)
1194 * This reset cause to disable this port in the
1195 * COLLECTING_DISTRIBUTING state of the mux machine in
1196 * case of EXPIRED even if LINK_DOWN didn't arrive for
1199 port->partner_oper.port_state &= ~LACP_STATE_SYNCHRONIZATION;
1200 port->sm_vars &= ~AD_PORT_MATCHED;
1201 port->partner_oper.port_state |= LACP_STATE_LACP_TIMEOUT;
1202 port->partner_oper.port_state |= LACP_STATE_LACP_ACTIVITY;
// Load the rx timer using the short timeout selector.
1203 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT));
1204 port->actor_oper_port_state |= LACP_STATE_EXPIRED;
1205 port->sm_vars |= AD_PORT_CHURNED;
1207 case AD_RX_DEFAULTED:
1208 __update_default_selected(port);
1209 __record_default(port);
1210 port->sm_vars |= AD_PORT_MATCHED;
1211 port->actor_oper_port_state &= ~LACP_STATE_EXPIRED;
1214 /* detect loopback situation */
// lacpdu is dereferenced from here on. The PDU is treated as looped back when
// its actor system equals the actor system of this port.
1215 if (MAC_ADDRESS_EQUAL(&(lacpdu->actor_system),
1216 &(port->actor_system))) {
1217 slave_err(port->slave->bond->dev, port->slave->dev, "An illegal loopback occurred on slave\n"
1218 "Check the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n");
1221 __update_selected(lacpdu, port);
1222 __update_ntt(lacpdu, port);
1223 __record_pdu(lacpdu, port);
// Reload the rx timer; the timeout selector is the LACP_TIMEOUT bit of the
// actor operational state.
1224 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(port->actor_oper_port_state & LACP_STATE_LACP_TIMEOUT));
1225 port->actor_oper_port_state &= ~LACP_STATE_EXPIRED;
1234 * ad_churn_machine - handle port churn's state machine
1235 * @port: the port we're looking at
// Churn detection step for one port.
// When AD_PORT_CHURNED is set in sm_vars, monitoring is restarted for both
// the actor and the partner side. Otherwise each running churn timer is
// counted down, and on expiry the side is classified from its
// SYNCHRONIZATION bit.
// NOTE(review): lines closing the first branch and the else lines of the two
// classifications are elided in this listing.
1238 static void ad_churn_machine(struct port *port)
1240 if (port->sm_vars & AD_PORT_CHURNED) {
// Consume the request, then put both sides into MONITOR with fresh timers.
1241 port->sm_vars &= ~AD_PORT_CHURNED;
1242 port->sm_churn_actor_state = AD_CHURN_MONITOR;
1243 port->sm_churn_partner_state = AD_CHURN_MONITOR;
1244 port->sm_churn_actor_timer_counter =
1245 __ad_timer_to_ticks(AD_ACTOR_CHURN_TIMER, 0);
1246 port->sm_churn_partner_timer_counter =
1247 __ad_timer_to_ticks(AD_PARTNER_CHURN_TIMER, 0);
// Evaluation order matters: a non-zero timer is decremented on every call,
// whatever the churn state is; the state is only looked at on the call where
// the timer reaches zero.
1250 if (port->sm_churn_actor_timer_counter &&
1251 !(--port->sm_churn_actor_timer_counter) &&
1252 port->sm_churn_actor_state == AD_CHURN_MONITOR) {
// Actor in sync at expiry means no churn; the counter increment and the
// CHURN state below presumably belong to the elided else - confirm.
1253 if (port->actor_oper_port_state & LACP_STATE_SYNCHRONIZATION) {
1254 port->sm_churn_actor_state = AD_NO_CHURN;
1256 port->churn_actor_count++;
1257 port->sm_churn_actor_state = AD_CHURN;
// Same check for the partner side, using the partner operational state.
1260 if (port->sm_churn_partner_timer_counter &&
1261 !(--port->sm_churn_partner_timer_counter) &&
1262 port->sm_churn_partner_state == AD_CHURN_MONITOR) {
1263 if (port->partner_oper.port_state & LACP_STATE_SYNCHRONIZATION) {
1264 port->sm_churn_partner_state = AD_NO_CHURN;
1266 port->churn_partner_count++;
1267 port->sm_churn_partner_state = AD_CHURN;
1273 * ad_tx_machine - handle a port's tx state machine
1274 * @port: the port we're looking at
// Transmit step for one port: when the tx timer expires, send a LACPDU if one
// is pending (port->ntt) and LACP is enabled for the port, then restart the
// timer.
1276 static void ad_tx_machine(struct port *port)
1278 /* check if tx timer expired, to verify that we do not send more than
1279 * 3 packets per second
// A non-zero timer is decremented on each call; the body runs only on the
// call where it reaches zero.
1281 if (port->sm_tx_timer_counter && !(--port->sm_tx_timer_counter)) {
1282 /* check if there is something to send */
1283 if (port->ntt && (port->sm_vars & AD_PORT_LACP_ENABLED)) {
// Refresh the PDU image kept in the port before handing it to the sender.
1284 __update_lacpdu_from_port(port);
// A negative return from ad_lacpdu_send skips the debug message.
1286 if (ad_lacpdu_send(port) >= 0) {
1287 slave_dbg(port->slave->bond->dev,
1289 "Sent LACPDU on port %d\n",
1290 port->actor_port_number);
1292 /* mark ntt as false, so it will not be sent
1293 * again until demanded
// NOTE(review): the statement that clears ntt is elided in this listing.
1298 /* restart tx timer(to verify that we will not exceed
1299 * AD_MAX_TX_IN_SECOND
// AD_MAX_TX_IN_SECOND is 3, so the timer spans a third of ad_ticks_per_sec
// (integer division).
1301 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1306 * ad_periodic_machine - handle a port's periodic state machine
1307 * @port: the port we're looking at
1308 * @bond_params: bond parameters we will use
1310 * Turn ntt flag on periodically to perform periodic transmission of lacpdu's.
// Periodic state machine step for one port.
// @port:        port whose sm_periodic_state and periodic timer are updated.
// @bond_params: only lacp_active is read here.
// Phase 1 picks the next periodic state; phase 2 runs the entry actions when
// the state changed.
// NOTE(review): braces, else, break and default lines are elided in this
// listing, as is the body of the final PERIODIC_TX case.
1312 static void ad_periodic_machine(struct port *port, struct bond_params *bond_params)
1314 periodic_states_t last_state;
1316 /* keep current state machine state to compare later if it was changed */
1317 last_state = port->sm_periodic_state;
1319 /* check if port was reinitialized */
// NO_PERIODIC is forced when any of these holds: BEGIN is set, LACP is
// disabled for the port, the port is not enabled, neither actor nor partner
// has LACP_ACTIVITY set, or lacp_active is off in the bond parameters.
1320 if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) ||
1321 (!(port->actor_oper_port_state & LACP_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & LACP_STATE_LACP_ACTIVITY)) ||
1322 !bond_params->lacp_active) {
1323 port->sm_periodic_state = AD_NO_PERIODIC;
1325 /* check if state machine should change state */
1326 else if (port->sm_periodic_timer_counter) {
1327 /* check if periodic state machine expired */
// The timer is decremented here; reaching zero selects PERIODIC_TX.
1328 if (!(--port->sm_periodic_timer_counter)) {
1329 /* if expired then do tx */
1330 port->sm_periodic_state = AD_PERIODIC_TX;
1332 /* If not expired, check if there is some new timeout
1333 * parameter from the partner state
1335 switch (port->sm_periodic_state) {
1336 case AD_FAST_PERIODIC:
// Partner LACP_TIMEOUT bit clear while in FAST: drop to SLOW.
1337 if (!(port->partner_oper.port_state
1338 & LACP_STATE_LACP_TIMEOUT))
1339 port->sm_periodic_state = AD_SLOW_PERIODIC;
1341 case AD_SLOW_PERIODIC:
// Partner LACP_TIMEOUT bit set while in SLOW: cancel the running timer and
// go to PERIODIC_TX right away.
1342 if ((port->partner_oper.port_state & LACP_STATE_LACP_TIMEOUT)) {
1343 port->sm_periodic_timer_counter = 0;
1344 port->sm_periodic_state = AD_PERIODIC_TX;
// Second switch: presumably the branch taken when no timer is running (its
// else line is elided) - confirm.
1352 switch (port->sm_periodic_state) {
1353 case AD_NO_PERIODIC:
1354 port->sm_periodic_state = AD_FAST_PERIODIC;
1356 case AD_PERIODIC_TX:
// After a transmit the partner LACP_TIMEOUT bit picks the next period: SLOW
// when clear; the FAST assignment presumably sits under an elided else.
1357 if (!(port->partner_oper.port_state &
1358 LACP_STATE_LACP_TIMEOUT))
1359 port->sm_periodic_state = AD_SLOW_PERIODIC;
1361 port->sm_periodic_state = AD_FAST_PERIODIC;
1368 /* check if the state machine was changed */
1369 if (port->sm_periodic_state != last_state) {
1370 slave_dbg(port->slave->bond->dev, port->slave->dev,
1371 "Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n",
1372 port->actor_port_number, last_state,
1373 port->sm_periodic_state);
1374 switch (port->sm_periodic_state) {
1375 case AD_NO_PERIODIC:
1376 port->sm_periodic_timer_counter = 0;
1378 case AD_FAST_PERIODIC:
1379 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1380 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_FAST_PERIODIC_TIME))-1;
1382 case AD_SLOW_PERIODIC:
1383 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1384 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_SLOW_PERIODIC_TIME))-1;
// NOTE(review): the statements of this case are not visible in the listing.
1386 case AD_PERIODIC_TX:
1396 * ad_port_selection_logic - select aggregation groups
1397 * @port: the port we're looking at
1398 * @update_slave_arr: Does slave array need update?
1400 * Select aggregation groups, and assign each port to its aggregator. The
1401 * selection logic is called in the initialization (after all the handshakes),
1402 * and after every lacpdu receive (if selected is off).
// Attach an unselected port to an aggregator.
// @port:             port to place; nothing is done when it is already
//                    marked AD_PORT_SELECTED.
// @update_slave_arr: passed on to ad_agg_selection_logic.
// Steps: unlink the port from its former aggregator, look for an aggregator
// whose keys and partner identity match, otherwise claim the first empty
// aggregator, then refresh the ready flags and rerun aggregator selection.
// NOTE(review): return, else, break and brace lines are elided in this
// listing; the notes describe only visible statements.
1404 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr)
1406 struct aggregator *aggregator, *free_aggregator = NULL, *temp_aggregator;
1407 struct port *last_port = NULL, *curr_port;
1408 struct list_head *iter;
1409 struct bonding *bond;
1410 struct slave *slave;
1413 /* if the port is already Selected, do nothing */
1414 if (port->sm_vars & AD_PORT_SELECTED)
1417 bond = __get_bond_by_port(port);
1419 /* if the port is connected to other aggregator, detach it */
1420 if (port->aggregator) {
1421 /* detach the port from its former aggregator */
1422 temp_aggregator = port->aggregator;
// Walk the singly linked lag_ports list; last_port trails one node behind so
// the port can be unlinked from the middle of the list.
1423 for (curr_port = temp_aggregator->lag_ports; curr_port;
1424 last_port = curr_port,
1425 curr_port = curr_port->next_port_in_aggregator) {
1426 if (curr_port == port) {
1427 temp_aggregator->num_of_ports--;
1428 /* if it is the first port attached to the
1432 temp_aggregator->lag_ports =
1433 port->next_port_in_aggregator;
1435 /* not the first port attached to the
1438 last_port->next_port_in_aggregator =
1439 port->next_port_in_aggregator;
1442 /* clear the port's relations to this
1445 port->aggregator = NULL;
1446 port->next_port_in_aggregator = NULL;
1447 port->actor_port_aggregator_identifier = 0;
1449 slave_dbg(bond->dev, port->slave->dev, "Port %d left LAG %d\n",
1450 port->actor_port_number,
1451 temp_aggregator->aggregator_identifier);
1452 /* if the aggregator is empty, clear its
1453 * parameters, and set it ready to be attached
1455 if (!temp_aggregator->lag_ports)
1456 ad_clear_agg(temp_aggregator);
1461 /* meaning: the port was related to an aggregator
1462 * but was not on the aggregator port list
// port->aggregator is still set on this path, so the dereference in the
// warning arguments is safe.
1464 net_warn_ratelimited("%s: (slave %s): Warning: Port %d was related to aggregator %d but was not on its port list\n",
1465 port->slave->bond->dev->name,
1466 port->slave->dev->name,
1467 port->actor_port_number,
1468 port->aggregator->aggregator_identifier);
1471 /* search on all aggregators for a suitable aggregator for this port */
1472 bond_for_each_slave(bond, slave, iter) {
1473 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
1475 /* keep a free aggregator for later use(if needed) */
// Only the first empty aggregator met is remembered.
1476 if (!aggregator->lag_ports) {
1477 if (!free_aggregator)
1478 free_aggregator = aggregator;
1481 /* check if current aggregator suits us */
// Visible match criteria: equal operational key, equal partner system MAC,
// equal partner system priority and equal partner key, combined with a
// partner MAC that is not the null address and an aggregator that is not
// individual. Part of this condition is elided in the listing.
1482 if (((aggregator->actor_oper_aggregator_key == port->actor_oper_port_key) && /* if all parameters match AND */
1483 MAC_ADDRESS_EQUAL(&(aggregator->partner_system), &(port->partner_oper.system)) &&
1484 (aggregator->partner_system_priority == port->partner_oper.system_priority) &&
1485 (aggregator->partner_oper_aggregator_key == port->partner_oper.key)
1487 ((!MAC_ADDRESS_EQUAL(&(port->partner_oper.system), &(null_mac_addr)) && /* partner answers */
1488 !aggregator->is_individual) /* but is not individual OR */
1491 /* attach to the founded aggregator */
// The port is pushed onto the head of the aggregator port list.
1492 port->aggregator = aggregator;
1493 port->actor_port_aggregator_identifier =
1494 port->aggregator->aggregator_identifier;
1495 port->next_port_in_aggregator = aggregator->lag_ports;
1496 port->aggregator->num_of_ports++;
1497 aggregator->lag_ports = port;
1498 slave_dbg(bond->dev, slave->dev, "Port %d joined LAG %d (existing LAG)\n",
1499 port->actor_port_number,
1500 port->aggregator->aggregator_identifier);
1502 /* mark this port as selected */
1503 port->sm_vars |= AD_PORT_SELECTED;
1509 /* the port couldn't find an aggregator - attach it to a new
1513 if (free_aggregator) {
1514 /* assign port a new aggregator */
1515 port->aggregator = free_aggregator;
1516 port->actor_port_aggregator_identifier =
1517 port->aggregator->aggregator_identifier;
1519 /* update the new aggregator's parameters
1520 * if port was responsed from the end-user
// The duplex bit of the port key decides is_individual: false when the bit
// is set; the true assignment presumably sits under an elided else.
1522 if (port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS)
1523 /* if port is full duplex */
1524 port->aggregator->is_individual = false;
1526 port->aggregator->is_individual = true;
// The new aggregator takes over the keys and partner identity of the port.
1528 port->aggregator->actor_admin_aggregator_key =
1529 port->actor_admin_port_key;
1530 port->aggregator->actor_oper_aggregator_key =
1531 port->actor_oper_port_key;
1532 port->aggregator->partner_system =
1533 port->partner_oper.system;
1534 port->aggregator->partner_system_priority =
1535 port->partner_oper.system_priority;
1536 port->aggregator->partner_oper_aggregator_key = port->partner_oper.key;
1537 port->aggregator->receive_state = 1;
1538 port->aggregator->transmit_state = 1;
1539 port->aggregator->lag_ports = port;
1540 port->aggregator->num_of_ports++;
1542 /* mark this port as selected */
1543 port->sm_vars |= AD_PORT_SELECTED;
1545 slave_dbg(bond->dev, port->slave->dev, "Port %d joined LAG %d (new LAG)\n",
1546 port->actor_port_number,
1547 port->aggregator->aggregator_identifier);
// No match and no empty aggregator: report it.
// NOTE(review): the code after this point dereferences port->aggregator, so
// this path presumably returns on an elided line - confirm.
1549 slave_err(bond->dev, port->slave->dev,
1550 "Port %d did not find a suitable aggregator\n",
1551 port->actor_port_number);
1555 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE
1556 * in all aggregator's ports, else set ready=FALSE in all
1557 * aggregator's ports
1559 __set_agg_ports_ready(port->aggregator,
1560 __agg_ports_are_ready(port->aggregator));
// Aggregator selection is started from the aggregator returned by
// __get_first_agg for this port.
1562 aggregator = __get_first_agg(port);
1563 ad_agg_selection_logic(aggregator, update_slave_arr);
// A port whose aggregator did not become active must not report itself as
// in sync.
1565 if (!port->aggregator->is_active)
1566 port->actor_oper_port_state &= ~LACP_STATE_SYNCHRONIZATION;
1569 /* Decide if "curr" is a better choice for the new active aggregator than
1570 * the current best, according to the ad_select policy.
// Compare a candidate aggregator against the best one found so far and
// return the one to prefer.
// @best: best aggregator so far; the rule list below has a step 0 for the
//        case of no best, but its code is elided in this listing.
// @curr: candidate aggregator.
// NOTE(review): every return statement and some case labels are elided here,
// so the outcome of each test is taken from the numbered rules in the
// comment below - confirm against the full source.
1572 static struct aggregator *ad_agg_selection_test(struct aggregator *best,
1573 struct aggregator *curr)
1575 /* 0. If no best, select current.
1577 * 1. If the current agg is not individual, and the best is
1578 * individual, select current.
1580 * 2. If current agg is individual and the best is not, keep best.
1582 * 3. Therefore, current and best are both individual or both not
1585 * 3a. If current agg partner replied, and best agg partner did not,
1588 * 3b. If current agg partner did not reply and best agg partner
1589 * did reply, keep best.
1591 * 4. Therefore, current and best both have partner replies or
1592 * both do not, so perform selection policy:
1594 * BOND_AD_COUNT: Select by count of ports. If count is equal,
1595 * select by bandwidth.
1597 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth.
// Rule 1.
1602 if (!curr->is_individual && best->is_individual)
// Rule 2.
1605 if (curr->is_individual && !best->is_individual)
// Rule 3a.
1608 if (__agg_has_partner(curr) && !__agg_has_partner(best))
// Rule 3b.
1611 if (!__agg_has_partner(curr) && __agg_has_partner(best))
// Rule 4: the policy is read through the first port of curr.
1614 switch (__get_agg_selection_mode(curr->lag_ports)) {
// Comparison by number of active ports; the case label is elided
// (presumably BOND_AD_COUNT, per rule 4).
1616 if (__agg_active_ports(curr) > __agg_active_ports(best))
1619 if (__agg_active_ports(curr) < __agg_active_ports(best))
1623 case BOND_AD_STABLE:
1624 case BOND_AD_BANDWIDTH:
1625 if (__get_agg_bandwidth(curr) > __get_agg_bandwidth(best))
// Unknown policy value: only a rate-limited warning is visible here.
1631 net_warn_ratelimited("%s: (slave %s): Impossible agg select mode %d\n",
1632 curr->slave->bond->dev->name,
1633 curr->slave->dev->name,
1634 __get_agg_selection_mode(curr->lag_ports));
// Scan the port list of an aggregator for a port whose slave device is both
// running and has carrier.
// NOTE(review): the return statements are elided in this listing; presumably
// the int result says whether such a port exists - confirm.
1641 static int agg_device_up(const struct aggregator *agg)
// port gets the list head here and again in the init clause of the loop.
1643 struct port *port = agg->lag_ports;
1648 for (port = agg->lag_ports; port;
1649 port = port->next_port_in_aggregator) {
1650 if (netif_running(port->slave->dev) &&
1651 netif_carrier_ok(port->slave->dev))
1659 * ad_agg_selection_logic - select an aggregation group for a team
1660 * @agg: the aggregator we're looking at
1661 * @update_slave_arr: Does slave array need update?
1663 * It is assumed that only one aggregator may be selected for a team.
1665 * The logic of this function is to select the aggregator according to
1666 * the ad_select policy:
1668 * BOND_AD_STABLE: select the aggregator with the most ports attached to
1669 * it, and to reselect the active aggregator only if the previous
1670 * aggregator has no more ports related to it.
1672 * BOND_AD_BANDWIDTH: select the aggregator with the highest total
1673 * bandwidth, and reselect whenever a link state change takes place or the
1674 * set of slaves in the bond changes.
1676 * BOND_AD_COUNT: select the aggregator with largest number of ports
1677 * (slaves), and reselect whenever a link state change takes place or the
1678 * set of slaves in the bond changes.
1680 * FIXME: this function MUST be called with the first agg in the bond, or
1681 * __get_active_agg() won't work correctly. This function should be better
1682 * called with the bond itself, and retrieve the first agg from it.
// Choose the active aggregator of a bond and switch ports accordingly.
// @agg:              aggregator used to reach the bond and as the starting
//                    point for __get_active_agg; it is reused as a loop
//                    cursor further down.
// @update_slave_arr: set to true where ports get enabled or disabled.
// NOTE(review): several lines are elided in this listing (among them the
// declaration of port, the assignment of origin, the first half of some
// conditions, else lines and braces); the notes cover only visible
// statements.
1684 static void ad_agg_selection_logic(struct aggregator *agg,
1685 bool *update_slave_arr)
1687 struct aggregator *best, *active, *origin;
1688 struct bonding *bond = agg->slave->bond;
1689 struct list_head *iter;
1690 struct slave *slave;
// The current active aggregator stays the initial best only while one of its
// devices is up.
1695 active = __get_active_agg(agg);
1696 best = (active && agg_device_up(active)) ? active : NULL;
// Every aggregator that has active ports and a device that is up competes
// for best.
1698 bond_for_each_slave_rcu(bond, slave, iter) {
1699 agg = &(SLAVE_AD_INFO(slave)->aggregator);
1703 if (__agg_active_ports(agg) && agg_device_up(agg))
1704 best = ad_agg_selection_test(best, agg);
1708 __get_agg_selection_mode(best->lag_ports) == BOND_AD_STABLE) {
1709 /* For the STABLE policy, don't replace the old active
1710 * aggregator if it's still active (it has an answering
1711 * partner) or if both the best and active don't have an
1712 * answering partner.
1714 if (active && active->lag_ports &&
1715 __agg_active_ports(active) &&
1716 (__agg_has_partner(active) ||
1717 (!__agg_has_partner(active) &&
1718 !__agg_has_partner(best)))) {
// Exception: an active aggregator with a zero operational key does not win
// against a best that has a non-zero key.
1719 if (!(!active->actor_oper_aggregator_key &&
1720 best->actor_oper_aggregator_key)) {
1722 active->is_active = 1;
1727 if (best && (best == active)) {
1729 active->is_active = 1;
1732 /* if there is new best aggregator, activate it */
1734 netdev_dbg(bond->dev, "(slave %s): best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1735 best->slave ? best->slave->dev->name : "NULL",
1736 best->aggregator_identifier, best->num_of_ports,
1737 best->actor_oper_aggregator_key,
1738 best->partner_oper_aggregator_key,
1739 best->is_individual, best->is_active);
1740 netdev_dbg(bond->dev, "(slave %s): best ports %p slave %p\n",
1741 best->slave ? best->slave->dev->name : "NULL",
1742 best->lag_ports, best->slave);
// Debug dump of every aggregator in the bond.
1744 bond_for_each_slave_rcu(bond, slave, iter) {
1745 agg = &(SLAVE_AD_INFO(slave)->aggregator);
1747 slave_dbg(bond->dev, slave->dev, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1748 agg->aggregator_identifier, agg->num_of_ports,
1749 agg->actor_oper_aggregator_key,
1750 agg->partner_oper_aggregator_key,
1751 agg->is_individual, agg->is_active);
1754 /* check if any partner replies */
1755 if (best->is_individual)
1756 net_warn_ratelimited("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n",
1759 best->is_active = 1;
1760 netdev_dbg(bond->dev, "(slave %s): LAG %d chosen as the active LAG\n",
1761 best->slave ? best->slave->dev->name : "NULL",
1762 best->aggregator_identifier);
1763 netdev_dbg(bond->dev, "(slave %s): Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1764 best->slave ? best->slave->dev->name : "NULL",
1765 best->aggregator_identifier, best->num_of_ports,
1766 best->actor_oper_aggregator_key,
1767 best->partner_oper_aggregator_key,
1768 best->is_individual, best->is_active);
1770 /* disable the ports that were related to the former
// NOTE(review): active is dereferenced in the loop below; a guard for a NULL
// active is presumably on an elided line - confirm.
1774 for (port = active->lag_ports; port;
1775 port = port->next_port_in_aggregator) {
1776 __disable_port(port);
1779 /* Slave array needs update. */
1780 *update_slave_arr = true;
1783 /* if the selected aggregator is of join individuals
1784 * (partner_system is NULL), enable their ports
// Looked up again through origin because agg was reused as a loop cursor
// above.
1786 active = __get_active_agg(origin);
1789 if (!__agg_has_partner(active)) {
1790 for (port = active->lag_ports; port;
1791 port = port->next_port_in_aggregator) {
1792 __enable_port(port);
1794 *update_slave_arr = true;
// Let the bond carrier state follow the new selection.
1800 bond_3ad_set_carrier(bond);
1804 * ad_clear_agg - clear a given aggregator's parameters
1805 * @aggregator: the aggregator we're looking at
// Reset the negotiated state of an aggregator so that it is empty again:
// keys, partner identity, rx and tx state, port list, active flag and port
// count. The aggregator identifier, its MAC address and its slave pointer
// are not written by any visible line here.
// NOTE(review): the lines between the signature and the first assignment are
// elided; they may hold a NULL guard - confirm.
1807 static void ad_clear_agg(struct aggregator *aggregator)
1810 aggregator->is_individual = false;
1811 aggregator->actor_admin_aggregator_key = 0;
1812 aggregator->actor_oper_aggregator_key = 0;
1813 eth_zero_addr(aggregator->partner_system.mac_addr_value);
1814 aggregator->partner_system_priority = 0;
1815 aggregator->partner_oper_aggregator_key = 0;
1816 aggregator->receive_state = 0;
1817 aggregator->transmit_state = 0;
1818 aggregator->lag_ports = NULL;
1819 aggregator->is_active = 0;
1820 aggregator->num_of_ports = 0;
// The slave name argument falls back to the literal NULL string; the test
// that selects it is on an elided line.
1821 pr_debug("%s: LAG %d was cleared\n",
1823 aggregator->slave->dev->name : "NULL",
1824 aggregator->aggregator_identifier);
1829 * ad_initialize_agg - initialize a given aggregator's parameters
1830 * @aggregator: the aggregator we're looking at
// Full reset of an aggregator: everything ad_clear_agg resets, plus the
// aggregator MAC address, its identifier and its slave pointer.
// NOTE(review): the lines around the first call are elided; they may hold a
// NULL guard - confirm.
1832 static void ad_initialize_agg(struct aggregator *aggregator)
1835 ad_clear_agg(aggregator);
1837 eth_zero_addr(aggregator->aggregator_mac_address.mac_addr_value);
1838 aggregator->aggregator_identifier = 0;
1839 aggregator->slave = NULL;
1844 * ad_initialize_port - initialize a given port's parameters
1845 * @port: the port we're looking at
1846 * @lacp_fast: boolean. whether fast periodic should be used
// Put a port into its initial 802.3ad state.
// @port:      port to initialise.
// @lacp_fast: per the header comment, whether fast periodic should be used;
//             the line that tests it is elided in this listing.
// Partner parameters and the PDU image kept in the port are copied from the
// two static templates below; all state machine variables are zeroed except
// sm_vars.
1848 static void ad_initialize_port(struct port *port, int lacp_fast)
// Default partner parameters (only two initialisers are visible here).
1850 static const struct port_params tmpl = {
1851 .system_priority = 0xffff,
1854 .port_priority = 0xff,
// Constant part of an outgoing LACPDU: version, the three TLV types with
// their lengths (0x14 is 20, 0x10 is 16) and the collector max delay.
1857 static const struct lacpdu lacpdu = {
1859 .version_number = 0x01,
1860 .tlv_type_actor_info = 0x01,
1861 .actor_information_length = 0x14,
1862 .tlv_type_partner_info = 0x02,
1863 .partner_information_length = 0x14,
1864 .tlv_type_collector_info = 0x03,
1865 .collector_information_length = 0x10,
1866 .collector_max_delay = htons(AD_COLLECTOR_MAX_DELAY),
1870 port->actor_port_priority = 0xff;
1871 port->actor_port_aggregator_identifier = 0;
// Admin and operational actor state both start as AGGREGATION plus
// LACP_ACTIVITY.
1873 port->actor_admin_port_state = LACP_STATE_AGGREGATION |
1874 LACP_STATE_LACP_ACTIVITY;
1875 port->actor_oper_port_state = LACP_STATE_AGGREGATION |
1876 LACP_STATE_LACP_ACTIVITY;
// NOTE(review): the guard of the next statement is elided; presumably it is
// applied only when lacp_fast is non-zero - confirm.
1879 port->actor_oper_port_state |= LACP_STATE_LACP_TIMEOUT;
1881 memcpy(&port->partner_admin, &tmpl, sizeof(tmpl));
1882 memcpy(&port->partner_oper, &tmpl, sizeof(tmpl));
1884 port->is_enabled = true;
1885 /* private parameters */
// BEGIN makes the state machines treat the port as freshly initialised; see
// the AD_PORT_BEGIN tests in the rx and periodic machines.
1886 port->sm_vars = AD_PORT_BEGIN | AD_PORT_LACP_ENABLED;
1887 port->sm_rx_state = 0;
1888 port->sm_rx_timer_counter = 0;
1889 port->sm_periodic_state = 0;
1890 port->sm_periodic_timer_counter = 0;
1891 port->sm_mux_state = 0;
1892 port->sm_mux_timer_counter = 0;
1893 port->sm_tx_state = 0;
1894 port->aggregator = NULL;
1895 port->next_port_in_aggregator = NULL;
1896 port->transaction_id = 0;
1898 port->sm_churn_actor_timer_counter = 0;
1899 port->sm_churn_actor_state = 0;
1900 port->churn_actor_count = 0;
1901 port->sm_churn_partner_timer_counter = 0;
1902 port->sm_churn_partner_state = 0;
1903 port->churn_partner_count = 0;
1905 memcpy(&port->lacpdu, &lacpdu, sizeof(lacpdu));
1910 * ad_enable_collecting_distributing - enable a port's transmit/receive
1911 * @port: the port we're looking at
1912 * @update_slave_arr: Does slave array need update?
1914 * Enable @port if it's in an active aggregator
// Enable a port for traffic, but only when its aggregator is the active one.
// @port:             port to enable.
// @update_slave_arr: set to true when the port was enabled.
// NOTE(review): port->aggregator is dereferenced without a NULL test, unlike
// ad_disable_collecting_distributing; callers must guarantee that it is set.
1916 static void ad_enable_collecting_distributing(struct port *port,
1917 bool *update_slave_arr)
1919 if (port->aggregator->is_active) {
1920 slave_dbg(port->slave->bond->dev, port->slave->dev,
1921 "Enabling port %d (LAG %d)\n",
1922 port->actor_port_number,
1923 port->aggregator->aggregator_identifier);
1924 __enable_port(port);
1925 /* Slave array needs update */
1926 *update_slave_arr = true;
1931 * ad_disable_collecting_distributing - disable a port's transmit/receive
1932 * @port: the port we're looking at
1933 * @update_slave_arr: Does slave array need update?
// Disable a port for traffic.
// @port:             port to disable.
// @update_slave_arr: set to true when the port was disabled.
// Nothing happens unless the port has an aggregator and the partner system
// address of that aggregator differs from the null MAC address.
1935 static void ad_disable_collecting_distributing(struct port *port,
1936 bool *update_slave_arr)
1938 if (port->aggregator &&
1939 !MAC_ADDRESS_EQUAL(&(port->aggregator->partner_system),
1940 &(null_mac_addr))) {
1941 slave_dbg(port->slave->bond->dev, port->slave->dev,
1942 "Disabling port %d (LAG %d)\n",
1943 port->actor_port_number,
1944 port->aggregator->aggregator_identifier);
1945 __disable_port(port);
1946 /* Slave array needs an update */
1947 *update_slave_arr = true;
1952 * ad_marker_info_received - handle receive of a Marker information frame
1953 * @marker_info: Marker info received
1954 * @port: the port we're looking at
// Answer a received Marker information frame: count it, copy it, turn the
// copy into a Marker response and send that on the same port.
// The second parameter line of the signature is elided in this listing; the
// body uses it as port.
1956 static void ad_marker_info_received(struct bond_marker *marker_info,
1959 struct bond_marker marker;
// Statistics are kept per slave and per bond.
1961 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.marker_rx);
1962 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.marker_rx);
1964 /* copy the received marker data to the response marker */
1965 memcpy(&marker, marker_info, sizeof(struct bond_marker));
1966 /* change the marker subtype to marker response */
1967 marker.tlv_type = AD_MARKER_RESPONSE_SUBTYPE;
1969 /* send the marker response */
// A negative return from ad_marker_send is not reported; only the debug
// message is skipped.
1970 if (ad_marker_send(port, &marker) >= 0)
1971 slave_dbg(port->slave->bond->dev, port->slave->dev,
1972 "Sent Marker Response on port %d\n",
1973 port->actor_port_number);
1977 * ad_marker_response_received - handle receive of a marker response frame
1978 * @marker: marker PDU received
1979 * @port: the port we're looking at
1981 * This function does nothing since we decided not to implement send and handle
1982 * response for marker PDU's, in this stage, but only to respond to marker
// Account for a received Marker response frame. Only the per-slave and
// per-bond marker_resp_rx counters are incremented; no visible line reads
// the frame itself.
// The second parameter line of the signature is elided in this listing; the
// body uses it as port.
1985 static void ad_marker_response_received(struct bond_marker *marker,
1988 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.marker_resp_rx);
1989 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.marker_resp_rx);
1991 /* DO NOTHING, SINCE WE DECIDED NOT TO IMPLEMENT THIS FEATURE FOR NOW */
1994 /* ========= AD exported functions to the main bonding code ========= */
1996 /* Check aggregators status in team every T seconds */
// T from the comment above. bond_3ad_initialize uses this value as one factor
// of the timeout it passes to bond_3ad_initiate_agg_selection.
1997 #define AD_AGGREGATOR_SELECTION_TIMER 8
2000 * bond_3ad_initiate_agg_selection - initiate aggregator selection
2001 * @bond: bonding struct
2002 * @timeout: timeout value to set
2004 * Set the aggregation selection timer, to initiate an agg selection in
2005 * the very near future. Called during first initialization, and during
2006 * any down to up transitions of the bond.
// Store @timeout in the agg_select_timer of the bond with an atomic write.
// Nothing else happens here; whoever reads the timer acts on it.
2008 void bond_3ad_initiate_agg_selection(struct bonding *bond, int timeout)
2010 atomic_set(&BOND_AD_INFO(bond).agg_select_timer, timeout);
2014 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures
2015 * @bond: bonding struct to work on
2017 * Can be called only after the mac address of the bond is set.
// Set up the bond-wide 802.3ad data: restart aggregator numbering, take the
// system priority from the bond parameters, choose the system MAC address
// and arm the aggregator selection timer.
2019 void bond_3ad_initialize(struct bonding *bond)
// Identifiers are handed out by pre-increment in bond_3ad_bind_slave, so the
// first aggregator gets 1.
2021 BOND_AD_INFO(bond).aggregator_identifier = 0;
2022 BOND_AD_INFO(bond).system.sys_priority =
2023 bond->params.ad_actor_sys_prio;
// With an all-zero ad_actor_system parameter the device address of the bond
// is used; the second assignment presumably sits under an elided else and
// takes the configured address instead.
2024 if (is_zero_ether_addr(bond->params.ad_actor_system))
2025 BOND_AD_INFO(bond).system.sys_mac_addr =
2026 *((struct mac_addr *)bond->dev->dev_addr);
2028 BOND_AD_INFO(bond).system.sys_mac_addr =
2029 *((struct mac_addr *)bond->params.ad_actor_system);
// NOTE(review): the second factor of the timeout is on an elided line.
2031 bond_3ad_initiate_agg_selection(bond,
2032 AD_AGGREGATOR_SELECTION_TIMER *
2037 * bond_3ad_bind_slave - initialize a slave's port
2038 * @slave: slave struct to work on
2040 * Returns: 0 on success
// Initialise the port and the aggregator embedded in the 802.3ad info of a
// slave. Nothing is done when the port already points back at this slave.
// NOTE(review): the header comment above advertises a return value, but the
// function is declared void; that Returns text looks stale.
2043 void bond_3ad_bind_slave(struct slave *slave)
2045 struct bonding *bond = bond_get_bond_by_slave(slave);
2047 struct aggregator *aggregator;
2049 /* check that the slave has not been initialized yet. */
2050 if (SLAVE_AD_INFO(slave)->port.slave != slave) {
2052 /* port initialization */
2053 port = &(SLAVE_AD_INFO(slave)->port);
2055 ad_initialize_port(port, bond->params.lacp_fast);
2057 port->slave = slave;
2058 port->actor_port_number = SLAVE_AD_INFO(slave)->id;
2059 /* key is determined according to the link speed, duplex and
// The user key sits above the duplex bit and the five speed bits of the port
// key, hence the shift by 6 (AD_USER_KEY_MASKS is 0xFFC0).
2062 port->actor_admin_port_key = bond->params.ad_user_port_key << 6;
2063 ad_update_actor_keys(port, false);
2064 /* actor system is the bond's system */
2065 __ad_actor_update_port(port);
2066 /* tx timer(to verify that no more than MAX_TX_IN_SECOND
2067 * lacpdu's are sent in one second)
2069 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
// The port starts disabled; the enable calls visible in this file are in the
// mux and aggregator selection code.
2071 __disable_port(port);
2073 /* aggregator initialization */
2074 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
2076 ad_initialize_agg(aggregator);
2078 aggregator->aggregator_mac_address = *((struct mac_addr *)bond->dev->dev_addr);
// Pre-increment: identifiers start at 1 after bond_3ad_initialize reset the
// counter to 0.
2079 aggregator->aggregator_identifier = ++BOND_AD_INFO(bond).aggregator_identifier;
2080 aggregator->slave = slave;
// NOTE(review): the two assignments below repeat what ad_clear_agg (called
// through ad_initialize_agg) has already done.
2081 aggregator->is_active = 0;
2082 aggregator->num_of_ports = 0;
2087 * bond_3ad_unbind_slave - deinitialize a slave's port
2088 * @slave: slave struct to work on
2090 * Search for the aggregator that is related to this port, remove the
2091 * aggregator and assign another aggregator for other port related to it
2092 * (if any), and remove the port.
2094 void bond_3ad_unbind_slave(struct slave *slave)
2096 struct port *port, *prev_port, *temp_port;
2097 struct aggregator *aggregator, *new_aggregator, *temp_aggregator;
2098 int select_new_active_agg = 0;
2099 struct bonding *bond = slave->bond;
2100 struct slave *slave_iter;
2101 struct list_head *iter;
2102 bool dummy_slave_update; /* Ignore this value as caller updates array */
2104 /* Sync against bond_3ad_state_machine_handler() */
2105 spin_lock_bh(&bond->mode_lock);
2106 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
2107 port = &(SLAVE_AD_INFO(slave)->port);
2109 /* if slave is null, the whole port is not initialized */
2111 slave_warn(bond->dev, slave->dev, "Trying to unbind an uninitialized port\n");
2115 slave_dbg(bond->dev, slave->dev, "Unbinding Link Aggregation Group %d\n",
2116 aggregator->aggregator_identifier);
2118 /* Tell the partner that this port is not suitable for aggregation */
2119 port->actor_oper_port_state &= ~LACP_STATE_SYNCHRONIZATION;
2120 port->actor_oper_port_state &= ~LACP_STATE_COLLECTING;
2121 port->actor_oper_port_state &= ~LACP_STATE_DISTRIBUTING;
2122 port->actor_oper_port_state &= ~LACP_STATE_AGGREGATION;
2123 __update_lacpdu_from_port(port);
2124 ad_lacpdu_send(port);
2126 /* check if this aggregator is occupied */
2127 if (aggregator->lag_ports) {
2128 /* check if there are other ports related to this aggregator
2129 * except the port related to this slave(thats ensure us that
2130 * there is a reason to search for new aggregator, and that we
2133 if ((aggregator->lag_ports != port) ||
2134 (aggregator->lag_ports->next_port_in_aggregator)) {
2135 /* find new aggregator for the related port(s) */
2136 bond_for_each_slave(bond, slave_iter, iter) {
2137 new_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
2138 /* if the new aggregator is empty, or it is
2139 * connected to our port only
2141 if (!new_aggregator->lag_ports ||
2142 ((new_aggregator->lag_ports == port) &&
2143 !new_aggregator->lag_ports->next_port_in_aggregator))
2147 new_aggregator = NULL;
2149 /* if new aggregator found, copy the aggregator's
2150 * parameters and connect the related lag_ports to the
2153 if ((new_aggregator) && ((!new_aggregator->lag_ports) || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator))) {
2154 slave_dbg(bond->dev, slave->dev, "Some port(s) related to LAG %d - replacing with LAG %d\n",
2155 aggregator->aggregator_identifier,
2156 new_aggregator->aggregator_identifier);
2158 if ((new_aggregator->lag_ports == port) &&
2159 new_aggregator->is_active) {
2160 slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
2161 select_new_active_agg = 1;
2164 new_aggregator->is_individual = aggregator->is_individual;
2165 new_aggregator->actor_admin_aggregator_key = aggregator->actor_admin_aggregator_key;
2166 new_aggregator->actor_oper_aggregator_key = aggregator->actor_oper_aggregator_key;
2167 new_aggregator->partner_system = aggregator->partner_system;
2168 new_aggregator->partner_system_priority = aggregator->partner_system_priority;
2169 new_aggregator->partner_oper_aggregator_key = aggregator->partner_oper_aggregator_key;
2170 new_aggregator->receive_state = aggregator->receive_state;
2171 new_aggregator->transmit_state = aggregator->transmit_state;
2172 new_aggregator->lag_ports = aggregator->lag_ports;
2173 new_aggregator->is_active = aggregator->is_active;
2174 new_aggregator->num_of_ports = aggregator->num_of_ports;
2176 /* update the information that is written on
2177 * the ports about the aggregator
2179 for (temp_port = aggregator->lag_ports; temp_port;
2180 temp_port = temp_port->next_port_in_aggregator) {
2181 temp_port->aggregator = new_aggregator;
2182 temp_port->actor_port_aggregator_identifier = new_aggregator->aggregator_identifier;
2185 ad_clear_agg(aggregator);
2187 if (select_new_active_agg)
2188 ad_agg_selection_logic(__get_first_agg(port),
2189 &dummy_slave_update);
2191 slave_warn(bond->dev, slave->dev, "unbinding aggregator, and could not find a new aggregator for its ports\n");
2194 /* in case that the only port related to this
2195 * aggregator is the one we want to remove
2197 select_new_active_agg = aggregator->is_active;
2198 ad_clear_agg(aggregator);
2199 if (select_new_active_agg) {
2200 slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
2201 /* select new active aggregator */
2202 temp_aggregator = __get_first_agg(port);
2203 if (temp_aggregator)
2204 ad_agg_selection_logic(temp_aggregator,
2205 &dummy_slave_update);
2210 slave_dbg(bond->dev, slave->dev, "Unbinding port %d\n", port->actor_port_number);
2212 /* find the aggregator that this port is connected to */
2213 bond_for_each_slave(bond, slave_iter, iter) {
2214 temp_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
2216 /* search the port in the aggregator's related ports */
2217 for (temp_port = temp_aggregator->lag_ports; temp_port;
2218 prev_port = temp_port,
2219 temp_port = temp_port->next_port_in_aggregator) {
2220 if (temp_port == port) {
2221 /* the aggregator found - detach the port from
2225 prev_port->next_port_in_aggregator = temp_port->next_port_in_aggregator;
2227 temp_aggregator->lag_ports = temp_port->next_port_in_aggregator;
2228 temp_aggregator->num_of_ports--;
2229 if (__agg_active_ports(temp_aggregator) == 0) {
2230 select_new_active_agg = temp_aggregator->is_active;
2231 if (temp_aggregator->num_of_ports == 0)
2232 ad_clear_agg(temp_aggregator);
2233 if (select_new_active_agg) {
2234 slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
2235 /* select new active aggregator */
2236 ad_agg_selection_logic(__get_first_agg(port),
2237 &dummy_slave_update);
2247 spin_unlock_bh(&bond->mode_lock);
2251 * bond_3ad_update_ad_actor_settings - reflect change of actor settings to ports
2252 * @bond: bonding struct to work on
2254 * If an ad_actor setting gets changed we need to update the individual port
2255 * settings so the bond device will use the new values when it gets upped.
2257 void bond_3ad_update_ad_actor_settings(struct bonding *bond)
2259 struct list_head *iter;
2260 struct slave *slave;
2264 BOND_AD_INFO(bond).system.sys_priority = bond->params.ad_actor_sys_prio;
2265 if (is_zero_ether_addr(bond->params.ad_actor_system))
2266 BOND_AD_INFO(bond).system.sys_mac_addr =
2267 *((struct mac_addr *)bond->dev->dev_addr);
2269 BOND_AD_INFO(bond).system.sys_mac_addr =
2270 *((struct mac_addr *)bond->params.ad_actor_system);
2272 spin_lock_bh(&bond->mode_lock);
2273 bond_for_each_slave(bond, slave, iter) {
2274 struct port *port = &(SLAVE_AD_INFO(slave))->port;
2276 __ad_actor_update_port(port);
2279 spin_unlock_bh(&bond->mode_lock);
2283 * bond_agg_timer_advance - advance agg_select_timer
2284 * @bond: bonding structure
2286 * Return true when agg_select_timer reaches 0.
2288 static bool bond_agg_timer_advance(struct bonding *bond)
2293 val = atomic_read(&BOND_AD_INFO(bond).agg_select_timer);
2297 if (atomic_cmpxchg(&BOND_AD_INFO(bond).agg_select_timer,
2305 * bond_3ad_state_machine_handler - handle state machines timeout
2306 * @work: work context to fetch bonding struct to work on from
2308 * The state machine handling concept in this module is to check every tick
2309 * which state machine should operate any function. The execution order is
2310 * round robin, so when we have an interaction between state machines, the
2311 * reply of one to each other might be delayed until next tick.
2313 * This function also complete the initialization when the agg_select_timer
2314 * times out, and it selects an aggregator for the ports that are yet not
2315 * related to any aggregator, and selects the active aggregator for a bond.
2317 void bond_3ad_state_machine_handler(struct work_struct *work)
2319 struct bonding *bond = container_of(work, struct bonding,
2321 struct aggregator *aggregator;
2322 struct list_head *iter;
2323 struct slave *slave;
2325 bool should_notify_rtnl = BOND_SLAVE_NOTIFY_LATER;
2326 bool update_slave_arr = false;
2328 /* Lock to protect data accessed by all (e.g., port->sm_vars) and
2329 * against running with bond_3ad_unbind_slave. ad_rx_machine may run
2330 * concurrently due to incoming LACPDU as well.
2332 spin_lock_bh(&bond->mode_lock);
2335 /* check if there are any slaves */
2336 if (!bond_has_slaves(bond))
2339 if (bond_agg_timer_advance(bond)) {
2340 slave = bond_first_slave_rcu(bond);
2341 port = slave ? &(SLAVE_AD_INFO(slave)->port) : NULL;
2343 /* select the active aggregator for the bond */
2346 net_warn_ratelimited("%s: Warning: bond's first port is uninitialized\n",
2351 aggregator = __get_first_agg(port);
2352 ad_agg_selection_logic(aggregator, &update_slave_arr);
2354 bond_3ad_set_carrier(bond);
2357 /* for each port run the state machines */
2358 bond_for_each_slave_rcu(bond, slave, iter) {
2359 port = &(SLAVE_AD_INFO(slave)->port);
2361 net_warn_ratelimited("%s: Warning: Found an uninitialized port\n",
2366 ad_rx_machine(NULL, port);
2367 ad_periodic_machine(port, &bond->params);
2368 ad_port_selection_logic(port, &update_slave_arr);
2369 ad_mux_machine(port, &update_slave_arr);
2370 ad_tx_machine(port);
2371 ad_churn_machine(port);
2373 /* turn off the BEGIN bit, since we already handled it */
2374 if (port->sm_vars & AD_PORT_BEGIN)
2375 port->sm_vars &= ~AD_PORT_BEGIN;
2379 bond_for_each_slave_rcu(bond, slave, iter) {
2380 if (slave->should_notify) {
2381 should_notify_rtnl = BOND_SLAVE_NOTIFY_NOW;
2386 spin_unlock_bh(&bond->mode_lock);
2388 if (update_slave_arr)
2389 bond_slave_arr_work_rearm(bond, 0);
2391 if (should_notify_rtnl && rtnl_trylock()) {
2392 bond_slave_state_notify(bond);
2395 queue_delayed_work(bond->wq, &bond->ad_work, ad_delta_in_ticks);
2399 * bond_3ad_rx_indication - handle a received frame
2400 * @lacpdu: received lacpdu
2401 * @slave: slave struct to work on
2403 * It is assumed that frames that were sent on this NIC don't returned as new
2404 * received frames (loopback). Since only the payload is given to this
2405 * function, it check for loopback.
2407 static int bond_3ad_rx_indication(struct lacpdu *lacpdu, struct slave *slave)
2409 struct bonding *bond = slave->bond;
2410 int ret = RX_HANDLER_ANOTHER;
2411 struct bond_marker *marker;
2415 port = &(SLAVE_AD_INFO(slave)->port);
2417 net_warn_ratelimited("%s: Warning: port of slave %s is uninitialized\n",
2418 slave->dev->name, slave->bond->dev->name);
2422 switch (lacpdu->subtype) {
2423 case AD_TYPE_LACPDU:
2424 ret = RX_HANDLER_CONSUMED;
2425 slave_dbg(slave->bond->dev, slave->dev,
2426 "Received LACPDU on port %d\n",
2427 port->actor_port_number);
2428 /* Protect against concurrent state machines */
2429 spin_lock(&slave->bond->mode_lock);
2430 ad_rx_machine(lacpdu, port);
2431 spin_unlock(&slave->bond->mode_lock);
2433 case AD_TYPE_MARKER:
2434 ret = RX_HANDLER_CONSUMED;
2435 /* No need to convert fields to Little Endian since we
2436 * don't use the marker's fields.
2438 marker = (struct bond_marker *)lacpdu;
2439 switch (marker->tlv_type) {
2440 case AD_MARKER_INFORMATION_SUBTYPE:
2441 slave_dbg(slave->bond->dev, slave->dev, "Received Marker Information on port %d\n",
2442 port->actor_port_number);
2443 ad_marker_info_received(marker, port);
2445 case AD_MARKER_RESPONSE_SUBTYPE:
2446 slave_dbg(slave->bond->dev, slave->dev, "Received Marker Response on port %d\n",
2447 port->actor_port_number);
2448 ad_marker_response_received(marker, port);
2451 slave_dbg(slave->bond->dev, slave->dev, "Received an unknown Marker subtype on port %d\n",
2452 port->actor_port_number);
2453 stat = &SLAVE_AD_INFO(slave)->stats.marker_unknown_rx;
2455 stat = &BOND_AD_INFO(bond).stats.marker_unknown_rx;
2460 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_unknown_rx);
2461 atomic64_inc(&BOND_AD_INFO(bond).stats.lacpdu_unknown_rx);
2468 * ad_update_actor_keys - Update the oper / admin keys for a port based on
2469 * its current speed and duplex settings.
2471 * @port: the port we'are looking at
2472 * @reset: Boolean to just reset the speed and the duplex part of the key
2474 * The logic to change the oper / admin keys is:
2475 * (a) A full duplex port can participate in LACP with partner.
2476 * (b) When the speed is changed, LACP need to be reinitiated.
2478 static void ad_update_actor_keys(struct port *port, bool reset)
2481 u16 ospeed = 0, speed = 0;
2482 u16 old_oper_key = port->actor_oper_port_key;
2484 port->actor_admin_port_key &= ~(AD_SPEED_KEY_MASKS|AD_DUPLEX_KEY_MASKS);
2486 speed = __get_link_speed(port);
2487 ospeed = (old_oper_key & AD_SPEED_KEY_MASKS) >> 1;
2488 duplex = __get_duplex(port);
2489 port->actor_admin_port_key |= (speed << 1) | duplex;
2491 port->actor_oper_port_key = port->actor_admin_port_key;
2493 if (old_oper_key != port->actor_oper_port_key) {
2494 /* Only 'duplex' port participates in LACP */
2496 port->sm_vars |= AD_PORT_LACP_ENABLED;
2498 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
2502 slave_err(port->slave->bond->dev,
2504 "speed changed to 0 on port %d\n",
2505 port->actor_port_number);
2506 } else if (duplex && ospeed != speed) {
2507 /* Speed change restarts LACP state-machine */
2508 port->sm_vars |= AD_PORT_BEGIN;
2515 * bond_3ad_adapter_speed_duplex_changed - handle a slave's speed / duplex
2518 * @slave: slave struct to work on
2520 * Handle reselection of aggregator (if needed) for this port.
2522 void bond_3ad_adapter_speed_duplex_changed(struct slave *slave)
2526 port = &(SLAVE_AD_INFO(slave)->port);
2528 /* if slave is null, the whole port is not initialized */
2530 slave_warn(slave->bond->dev, slave->dev,
2531 "speed/duplex changed for uninitialized port\n");
2535 spin_lock_bh(&slave->bond->mode_lock);
2536 ad_update_actor_keys(port, false);
2537 spin_unlock_bh(&slave->bond->mode_lock);
2538 slave_dbg(slave->bond->dev, slave->dev, "Port %d changed speed/duplex\n",
2539 port->actor_port_number);
2543 * bond_3ad_handle_link_change - handle a slave's link status change indication
2544 * @slave: slave struct to work on
2545 * @link: whether the link is now up or down
2547 * Handle reselection of aggregator (if needed) for this port.
2549 void bond_3ad_handle_link_change(struct slave *slave, char link)
2551 struct aggregator *agg;
2555 port = &(SLAVE_AD_INFO(slave)->port);
2557 /* if slave is null, the whole port is not initialized */
2559 slave_warn(slave->bond->dev, slave->dev, "link status changed for uninitialized port\n");
2563 spin_lock_bh(&slave->bond->mode_lock);
2564 /* on link down we are zeroing duplex and speed since
2565 * some of the adaptors(ce1000.lan) report full duplex/speed
2566 * instead of N/A(duplex) / 0(speed).
2568 * on link up we are forcing recheck on the duplex and speed since
2569 * some of he adaptors(ce1000.lan) report.
2571 if (link == BOND_LINK_UP) {
2572 port->is_enabled = true;
2573 ad_update_actor_keys(port, false);
2575 /* link has failed */
2576 port->is_enabled = false;
2577 ad_update_actor_keys(port, true);
2579 agg = __get_first_agg(port);
2580 ad_agg_selection_logic(agg, &dummy);
2582 spin_unlock_bh(&slave->bond->mode_lock);
2584 slave_dbg(slave->bond->dev, slave->dev, "Port %d changed link status to %s\n",
2585 port->actor_port_number,
2586 link == BOND_LINK_UP ? "UP" : "DOWN");
2588 /* RTNL is held and mode_lock is released so it's safe
2589 * to update slave_array here.
2591 bond_update_slave_arr(slave->bond, NULL);
2595 * bond_3ad_set_carrier - set link state for bonding master
2596 * @bond: bonding structure
2598 * if we have an active aggregator, we're up, if not, we're down.
2599 * Presumes that we cannot have an active aggregator if there are
2600 * no slaves with link up.
2602 * This behavior complies with IEEE 802.3 section 43.3.9.
2604 * Called by bond_set_carrier(). Return zero if carrier state does not
2605 * change, nonzero if it does.
2607 int bond_3ad_set_carrier(struct bonding *bond)
2609 struct aggregator *active;
2610 struct slave *first_slave;
2614 first_slave = bond_first_slave_rcu(bond);
2619 active = __get_active_agg(&(SLAVE_AD_INFO(first_slave)->aggregator));
2621 /* are enough slaves available to consider link up? */
2622 if (__agg_active_ports(active) < bond->params.min_links) {
2623 if (netif_carrier_ok(bond->dev)) {
2624 netif_carrier_off(bond->dev);
2627 } else if (!netif_carrier_ok(bond->dev)) {
2628 netif_carrier_on(bond->dev);
2631 } else if (netif_carrier_ok(bond->dev)) {
2632 netif_carrier_off(bond->dev);
2640 * __bond_3ad_get_active_agg_info - get information of the active aggregator
2641 * @bond: bonding struct to work on
2642 * @ad_info: ad_info struct to fill with the bond's info
2644 * Returns: 0 on success
2647 int __bond_3ad_get_active_agg_info(struct bonding *bond,
2648 struct ad_info *ad_info)
2650 struct aggregator *aggregator = NULL;
2651 struct list_head *iter;
2652 struct slave *slave;
2655 bond_for_each_slave_rcu(bond, slave, iter) {
2656 port = &(SLAVE_AD_INFO(slave)->port);
2657 if (port->aggregator && port->aggregator->is_active) {
2658 aggregator = port->aggregator;
2666 ad_info->aggregator_id = aggregator->aggregator_identifier;
2667 ad_info->ports = __agg_active_ports(aggregator);
2668 ad_info->actor_key = aggregator->actor_oper_aggregator_key;
2669 ad_info->partner_key = aggregator->partner_oper_aggregator_key;
2670 ether_addr_copy(ad_info->partner_system,
2671 aggregator->partner_system.mac_addr_value);
/**
 * bond_3ad_get_active_agg_info - get information of the active aggregator
 * @bond: bonding struct to work on
 * @ad_info: ad_info struct to fill with the bond's info
 *
 * Runs __bond_3ad_get_active_agg_info() inside an RCU read-side critical
 * section and hands back its result unchanged.
 */
int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info)
{
	int ret;

	rcu_read_lock();
	ret = __bond_3ad_get_active_agg_info(bond, ad_info);
	rcu_read_unlock();

	return ret;
}
2686 int bond_3ad_lacpdu_recv(const struct sk_buff *skb, struct bonding *bond,
2687 struct slave *slave)
2689 struct lacpdu *lacpdu, _lacpdu;
2691 if (skb->protocol != PKT_TYPE_LACPDU)
2692 return RX_HANDLER_ANOTHER;
2694 if (!MAC_ADDRESS_EQUAL(eth_hdr(skb)->h_dest, lacpdu_mcast_addr))
2695 return RX_HANDLER_ANOTHER;
2697 lacpdu = skb_header_pointer(skb, 0, sizeof(_lacpdu), &_lacpdu);
2699 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_illegal_rx);
2700 atomic64_inc(&BOND_AD_INFO(bond).stats.lacpdu_illegal_rx);
2701 return RX_HANDLER_ANOTHER;
2704 return bond_3ad_rx_indication(lacpdu, slave);
2708 * bond_3ad_update_lacp_rate - change the lacp rate
2709 * @bond: bonding struct
2711 * When modify lacp_rate parameter via sysfs,
2712 * update actor_oper_port_state of each port.
2714 * Hold bond->mode_lock,
2715 * so we can modify port->actor_oper_port_state,
2716 * no matter bond is up or down.
2718 void bond_3ad_update_lacp_rate(struct bonding *bond)
2720 struct port *port = NULL;
2721 struct list_head *iter;
2722 struct slave *slave;
2725 lacp_fast = bond->params.lacp_fast;
2726 spin_lock_bh(&bond->mode_lock);
2727 bond_for_each_slave(bond, slave, iter) {
2728 port = &(SLAVE_AD_INFO(slave)->port);
2730 port->actor_oper_port_state |= LACP_STATE_LACP_TIMEOUT;
2732 port->actor_oper_port_state &= ~LACP_STATE_LACP_TIMEOUT;
2734 spin_unlock_bh(&bond->mode_lock);
2737 size_t bond_3ad_stats_size(void)
2739 return nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_RX */
2740 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_TX */
2741 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_UNKNOWN_RX */
2742 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_ILLEGAL_RX */
2743 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RX */
2744 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_TX */
2745 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RESP_RX */
2746 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RESP_TX */
2747 nla_total_size_64bit(sizeof(u64)); /* BOND_3AD_STAT_MARKER_UNKNOWN_RX */
2750 int bond_3ad_stats_fill(struct sk_buff *skb, struct bond_3ad_stats *stats)
2754 val = atomic64_read(&stats->lacpdu_rx);
2755 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_RX, val,
2758 val = atomic64_read(&stats->lacpdu_tx);
2759 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_TX, val,
2762 val = atomic64_read(&stats->lacpdu_unknown_rx);
2763 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_UNKNOWN_RX, val,
2766 val = atomic64_read(&stats->lacpdu_illegal_rx);
2767 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_ILLEGAL_RX, val,
2771 val = atomic64_read(&stats->marker_rx);
2772 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RX, val,
2775 val = atomic64_read(&stats->marker_tx);
2776 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_TX, val,
2779 val = atomic64_read(&stats->marker_resp_rx);
2780 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RESP_RX, val,
2783 val = atomic64_read(&stats->marker_resp_tx);
2784 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RESP_TX, val,
2787 val = atomic64_read(&stats->marker_unknown_rx);
2788 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_UNKNOWN_RX, val,