1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
6 #include <linux/skbuff.h>
7 #include <linux/if_ether.h>
8 #include <linux/netdevice.h>
9 #include <linux/spinlock.h>
10 #include <linux/ethtool.h>
11 #include <linux/etherdevice.h>
12 #include <linux/if_bonding.h>
13 #include <linux/pkt_sched.h>
14 #include <net/net_namespace.h>
15 #include <net/bonding.h>
16 #include <net/bond_3ad.h>
17 #include <net/netlink.h>
19 /* General definitions */
/* Protocol constants used by the helpers and state machines in this file.
 * The AD_*_TIMEOUT_TIME, AD_CHURN_DETECTION_TIME and AD_AGGREGATE_WAIT_TIME
 * values are multiplied by ad_ticks_per_sec in __ad_timer_to_ticks(), so
 * they are expressed in seconds.  AD_STATE_* are single-bit masks applied
 * to the actor/partner port state fields, and AD_PORT_* are single-bit
 * masks applied to port->sm_vars.
 */
20 #define AD_SHORT_TIMEOUT 1
21 #define AD_LONG_TIMEOUT 0
22 #define AD_STANDBY 0x2
23 #define AD_MAX_TX_IN_SECOND 3
24 #define AD_COLLECTOR_MAX_DELAY 0
26 /* Timer definitions (43.4.4 in the 802.3ad standard) */
27 #define AD_FAST_PERIODIC_TIME 1
28 #define AD_SLOW_PERIODIC_TIME 30
29 #define AD_SHORT_TIMEOUT_TIME (3*AD_FAST_PERIODIC_TIME)
30 #define AD_LONG_TIMEOUT_TIME (3*AD_SLOW_PERIODIC_TIME)
31 #define AD_CHURN_DETECTION_TIME 60
32 #define AD_AGGREGATE_WAIT_TIME 2
34 /* Port state definitions (43.4.2.2 in the 802.3ad standard) */
35 #define AD_STATE_LACP_ACTIVITY 0x1
36 #define AD_STATE_LACP_TIMEOUT 0x2
37 #define AD_STATE_AGGREGATION 0x4
38 #define AD_STATE_SYNCHRONIZATION 0x8
39 #define AD_STATE_COLLECTING 0x10
40 #define AD_STATE_DISTRIBUTING 0x20
41 #define AD_STATE_DEFAULTED 0x40
42 #define AD_STATE_EXPIRED 0x80
44 /* Port Variables definitions used by the State Machines (43.4.7 in the
47 #define AD_PORT_BEGIN 0x1
48 #define AD_PORT_LACP_ENABLED 0x2
49 #define AD_PORT_ACTOR_CHURN 0x4
50 #define AD_PORT_PARTNER_CHURN 0x8
51 #define AD_PORT_READY 0x10
52 #define AD_PORT_READY_N 0x20
53 #define AD_PORT_MATCHED 0x40
54 #define AD_PORT_STANDBY 0x80
55 #define AD_PORT_SELECTED 0x100
56 #define AD_PORT_MOVED 0x200
57 #define AD_PORT_CHURNED (AD_PORT_ACTOR_CHURN | AD_PORT_PARTNER_CHURN)
59 /* Port Key definitions
60 * key is determined according to the link speed, duplex and
61 * user key (which is not yet supported)
62 * --------------------------------------------------------------
63 * Port key | User key (10 bits) | Speed (5 bits) | Duplex|
64 * --------------------------------------------------------------
67 #define AD_DUPLEX_KEY_MASKS 0x1
68 #define AD_SPEED_KEY_MASKS 0x3E
69 #define AD_USER_KEY_MASKS 0xFFC0
/* Link-speed codes produced by __get_link_speed() and switched on by
 * __get_agg_bandwidth().  Numbering starts at 1 and the enumerators are
 * listed in order of increasing speed.
 * NOTE(review): AD_LINK_SPEED_10MBPS is used by both of those functions
 * but its enumerator line is not present in this listing -- confirm it
 * sits between the 1MBPS and 100MBPS entries.
 */
71 enum ad_link_speed_type {
72 AD_LINK_SPEED_1MBPS = 1,
74 AD_LINK_SPEED_100MBPS,
75 AD_LINK_SPEED_1000MBPS,
76 AD_LINK_SPEED_2500MBPS,
77 AD_LINK_SPEED_5000MBPS,
78 AD_LINK_SPEED_10000MBPS,
79 AD_LINK_SPEED_14000MBPS,
80 AD_LINK_SPEED_20000MBPS,
81 AD_LINK_SPEED_25000MBPS,
82 AD_LINK_SPEED_40000MBPS,
83 AD_LINK_SPEED_50000MBPS,
84 AD_LINK_SPEED_56000MBPS,
85 AD_LINK_SPEED_100000MBPS,
/* Compare two MAC addresses.
 *
 * Both arguments are cast to const u8 * and handed to
 * ether_addr_equal_64bits(); the macro evaluates to that call's result.
 * Each argument is parenthesised before the cast so that an expression
 * such as "p + 1" is cast as a whole instead of the cast binding to "p"
 * alone.
 * NOTE(review): the address buffers declared in this file are
 * ETH_ALEN + 2 bytes long, presumably because the 64-bit compare reads
 * past the six address bytes -- confirm against ether_addr_equal_64bits().
 */
#define MAC_ADDRESS_EQUAL(A, B)	\
	ether_addr_equal_64bits((const u8 *)(A), (const u8 *)(B))
/* File-scope data shared by the helpers below.
 * ad_ticks_per_sec is the multiplier __ad_timer_to_ticks() applies to
 * second-based timer values; lacpdu_mcast_addr is the destination address
 * written into every frame built by ad_lacpdu_send() and ad_marker_send().
 * NOTE(review): the initializer of null_mac_addr is not part of this
 * listing (presumably all zeroes), and ad_delta_in_ticks presumably
 * treats AD_TIMER_INTERVAL as milliseconds -- confirm both.
 */
92 static const u8 null_mac_addr[ETH_ALEN + 2] __long_aligned = {
95 static u16 ad_ticks_per_sec;
96 static const int ad_delta_in_ticks = (AD_TIMER_INTERVAL * HZ) / 1000;
98 static const u8 lacpdu_mcast_addr[ETH_ALEN + 2] __long_aligned =
99 MULTICAST_LACPDU_ADDR;
101 /* ================= main 802.3ad protocol functions ================== */
/* Forward declarations of the file-local protocol functions, so they can
 * be referenced before their definitions.
 * NOTE(review): the ad_marker_info_received() and
 * ad_marker_response_received() prototypes end on a comma in this
 * listing; their trailing parameter lines are absent.
 */
102 static int ad_lacpdu_send(struct port *port);
103 static int ad_marker_send(struct port *port, struct bond_marker *marker);
104 static void ad_mux_machine(struct port *port, bool *update_slave_arr);
105 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port);
106 static void ad_tx_machine(struct port *port);
107 static void ad_periodic_machine(struct port *port);
108 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr);
109 static void ad_agg_selection_logic(struct aggregator *aggregator,
110 bool *update_slave_arr);
111 static void ad_clear_agg(struct aggregator *aggregator);
112 static void ad_initialize_agg(struct aggregator *aggregator);
113 static void ad_initialize_port(struct port *port, int lacp_fast);
114 static void ad_enable_collecting_distributing(struct port *port,
115 bool *update_slave_arr);
116 static void ad_disable_collecting_distributing(struct port *port,
117 bool *update_slave_arr);
118 static void ad_marker_info_received(struct bond_marker *marker_info,
120 static void ad_marker_response_received(struct bond_marker *marker,
122 static void ad_update_actor_keys(struct port *port, bool reset);
125 /* ================= api to bonding and kernel code ================== */
128 * __get_bond_by_port - get the port's bonding struct
129 * @port: the port we're looking at
131 * Return @port's bonding struct, or %NULL if it can't be found.
/* Resolves the bond through bond_get_bond_by_slave(port->slave).  The
 * port->slave == NULL test guards that call.
 * NOTE(review): the statement controlled by the NULL test is not part of
 * this listing; the function's kernel-doc documents a %NULL return.
 */
133 static inline struct bonding *__get_bond_by_port(struct port *port)
135 if (port->slave == NULL)
138 return bond_get_bond_by_slave(port->slave);
142 * __get_first_agg - get the first aggregator in the bond
143 * @port: the port we're looking at
145 * Return the aggregator of the first slave in @port's bond, or %NULL if it can't be
147 * The caller must hold RCU or RTNL lock.
/* Starts from @port: the bond is looked up with __get_bond_by_port(), its
 * first slave is read with bond_first_slave_rcu(), and agg is set to that
 * slave's embedded aggregator, or to NULL when there is no first slave.
 * NOTE(review): the early-exit test described by the inline comment and
 * the final return are not part of this listing.
 */
149 static inline struct aggregator *__get_first_agg(struct port *port)
151 struct bonding *bond = __get_bond_by_port(port);
152 struct slave *first_slave;
153 struct aggregator *agg;
155 /* If there's no bond for this port, or bond has no slaves */
160 first_slave = bond_first_slave_rcu(bond);
161 agg = first_slave ? &(SLAVE_AD_INFO(first_slave)->aggregator) : NULL;
168 * __agg_has_partner - see if we have a partner
169 * @agg: the aggregator we're looking at
171 * Return nonzero if aggregator has a partner (denoted by a non-zero ether
172 * address for the partner). Return 0 if not.
/* Evaluates to the negation of is_zero_ether_addr() on the partner system
 * MAC stored in @agg, i.e. non-zero when that address is not all zeroes.
 */
174 static inline int __agg_has_partner(struct aggregator *agg)
176 return !is_zero_ether_addr(agg->partner_system.mac_addr_value);
180 * __disable_port - disable the port's slave
181 * @port: the port we're looking at
/* Calls bond_set_slave_inactive_flags() on port->slave with
 * BOND_SLAVE_NOTIFY_LATER.
 */
183 static inline void __disable_port(struct port *port)
185 bond_set_slave_inactive_flags(port->slave, BOND_SLAVE_NOTIFY_LATER);
189 * __enable_port - enable the port's slave, if it's up
190 * @port: the port we're looking at
/* Calls bond_set_slave_active_flags() with BOND_SLAVE_NOTIFY_LATER, but
 * only when slave->link is BOND_LINK_UP and bond_slave_is_up() is true.
 */
192 static inline void __enable_port(struct port *port)
194 struct slave *slave = port->slave;
196 if ((slave->link == BOND_LINK_UP) && bond_slave_is_up(slave))
197 bond_set_slave_active_flags(slave, BOND_SLAVE_NOTIFY_LATER);
201 * __port_is_enabled - check if the port's slave is in active state
202 * @port: the port we're looking at
/* Thin wrapper: returns bond_is_active_slave() for port->slave. */
204 static inline int __port_is_enabled(struct port *port)
206 return bond_is_active_slave(port->slave);
210 * __get_agg_selection_mode - get the aggregator selection mode
211 * @port: the port we're looking at
213 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT.
/* Returns bond->params.ad_select for the bond found via
 * __get_bond_by_port(); BOND_AD_STABLE is the alternative return value.
 * NOTE(review): the condition that selects BOND_AD_STABLE is not part of
 * this listing -- presumably the bond lookup yielding NULL.
 */
215 static inline u32 __get_agg_selection_mode(struct port *port)
217 struct bonding *bond = __get_bond_by_port(port);
220 return BOND_AD_STABLE;
222 return bond->params.ad_select;
226 * __check_agg_selection_timer - check if the selection timer has expired
227 * @port: the port we're looking at
/* Returns 1 while BOND_AD_INFO(bond).agg_select_timer is non-zero and 0
 * once it is zero; ad_mux_machine() only leaves AD_MUX_ATTACHED for
 * collecting/distributing when this returns 0.
 * NOTE(review): any handling of a NULL bond is not part of this listing.
 */
229 static inline int __check_agg_selection_timer(struct port *port)
231 struct bonding *bond = __get_bond_by_port(port);
236 return BOND_AD_INFO(bond).agg_select_timer ? 1 : 0;
240 * __get_link_speed - get a port's speed
241 * @port: the port we're looking at
243 * Return @port's speed in 802.3ad enum format. i.e. one of:
245 * %AD_LINK_SPEED_10MBPS,
246 * %AD_LINK_SPEED_100MBPS,
247 * %AD_LINK_SPEED_1000MBPS,
248 * %AD_LINK_SPEED_2500MBPS,
249 * %AD_LINK_SPEED_5000MBPS,
250 * %AD_LINK_SPEED_10000MBPS
251 * %AD_LINK_SPEED_14000MBPS,
252 * %AD_LINK_SPEED_20000MBPS
253 * %AD_LINK_SPEED_25000MBPS
254 * %AD_LINK_SPEED_40000MBPS
255 * %AD_LINK_SPEED_50000MBPS
256 * %AD_LINK_SPEED_56000MBPS
257 * %AD_LINK_SPEED_100000MBPS
/* Translates slave->speed into one of the AD_LINK_SPEED_* codes.  A link
 * that is not BOND_LINK_UP is handled first as the special case described
 * in the inline comment.  A speed that matches no case and is not
 * SPEED_UNKNOWN produces a one-time warning; the chosen code is logged
 * with slave_dbg().
 * NOTE(review): the declaration of speed, the case labels, the break
 * statements and the return are not part of this listing.
 */
259 static u16 __get_link_speed(struct port *port)
261 struct slave *slave = port->slave;
264 /* this if covers only a special case: when the configuration starts
265 * with link down, it sets the speed to 0.
266 * This is done in spite of the fact that the e100 driver reports 0
267 * to be compatible with MVT in the future.
269 if (slave->link != BOND_LINK_UP)
272 switch (slave->speed) {
274 speed = AD_LINK_SPEED_10MBPS;
278 speed = AD_LINK_SPEED_100MBPS;
282 speed = AD_LINK_SPEED_1000MBPS;
286 speed = AD_LINK_SPEED_2500MBPS;
290 speed = AD_LINK_SPEED_5000MBPS;
294 speed = AD_LINK_SPEED_10000MBPS;
298 speed = AD_LINK_SPEED_14000MBPS;
302 speed = AD_LINK_SPEED_20000MBPS;
306 speed = AD_LINK_SPEED_25000MBPS;
310 speed = AD_LINK_SPEED_40000MBPS;
314 speed = AD_LINK_SPEED_50000MBPS;
318 speed = AD_LINK_SPEED_56000MBPS;
322 speed = AD_LINK_SPEED_100000MBPS;
326 /* unknown speed value from ethtool. shouldn't happen */
327 if (slave->speed != SPEED_UNKNOWN)
328 pr_warn_once("%s: (slave %s): unknown ethtool speed (%d) for port %d (set it to 0)\n",
329 slave->bond->dev->name,
330 slave->dev->name, slave->speed,
331 port->actor_port_number);
337 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received link speed %d update from adapter\n",
338 port->actor_port_number, speed);
343 * __get_duplex - get a port's duplex
344 * @port: the port we're looking at
346 * Return @port's duplex in 802.3ad bitmask format. i.e.:
347 * 0x01 if in full duplex
/* Inspects slave->duplex only while slave->link is BOND_LINK_UP and logs
 * whether the adapter reported full duplex or not.
 * NOTE(review): the case labels, the assignments to the return value and
 * the return itself are not part of this listing.
 */
350 static u8 __get_duplex(struct port *port)
352 struct slave *slave = port->slave;
355 /* handling a special case: when the configuration starts with
356 * link down, it sets the duplex to 0.
358 if (slave->link == BOND_LINK_UP) {
359 switch (slave->duplex) {
362 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received status full duplex update from adapter\n",
363 port->actor_port_number);
368 slave_dbg(slave->bond->dev, slave->dev, "Port %d Received status NOT full duplex update from adapter\n",
369 port->actor_port_number);
/* Copies the bond-wide actor identity into @port: actor_system takes
 * BOND_AD_INFO(bond).system.sys_mac_addr and actor_system_priority takes
 * BOND_AD_INFO(bond).system.sys_priority, where bond is the bond that owns
 * port->slave.
 */
376 static void __ad_actor_update_port(struct port *port)
378 const struct bonding *bond = bond_get_bond_by_slave(port->slave);
380 port->actor_system = BOND_AD_INFO(bond).system.sys_mac_addr;
381 port->actor_system_priority = BOND_AD_INFO(bond).system.sys_priority;
387 * __ad_timer_to_ticks - convert a given timer type to AD module ticks
388 * @timer_type: which timer to operate
389 * @par: timer parameter. see below
391 * If @timer_type is %AD_CURRENT_WHILE_TIMER, @par indicates long/short timer.
392 * If @timer_type is %AD_PERIODIC_TIMER, @par is one of %AD_FAST_PERIODIC_TIME,
393 * %AD_SLOW_PERIODIC_TIME.
/* Converts a timer selector into a tick count by multiplying a duration
 * by ad_ticks_per_sec.  AD_CURRENT_WHILE_TIMER yields the short or the
 * long timeout, AD_PERIODIC_TIMER scales @par itself, both churn timers
 * use AD_CHURN_DETECTION_TIME and AD_WAIT_WHILE_TIMER uses
 * AD_AGGREGATE_WAIT_TIME.  The product is stored in a u16, so it is
 * truncated to 16 bits; retval starts out as 0.
 * NOTE(review): the test on @par that picks short vs. long timeout, the
 * break statements and the return are not part of this listing.
 */
395 static u16 __ad_timer_to_ticks(u16 timer_type, u16 par)
397 u16 retval = 0; /* to silence the compiler */
399 switch (timer_type) {
400 case AD_CURRENT_WHILE_TIMER: /* for rx machine usage */
402 retval = (AD_SHORT_TIMEOUT_TIME*ad_ticks_per_sec);
404 retval = (AD_LONG_TIMEOUT_TIME*ad_ticks_per_sec);
406 case AD_ACTOR_CHURN_TIMER: /* for local churn machine */
407 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
409 case AD_PERIODIC_TIMER: /* for periodic machine */
410 retval = (par*ad_ticks_per_sec); /* par is the period itself */
412 case AD_PARTNER_CHURN_TIMER: /* for remote churn machine */
413 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
415 case AD_WAIT_WHILE_TIMER: /* for selection machine */
416 retval = (AD_AGGREGATE_WAIT_TIME*ad_ticks_per_sec);
424 /* ================= ad_rx_machine helper functions ================== */
427 * __choose_matched - update a port's matched variable from a received lacpdu
428 * @lacpdu: the lacpdu we've received
429 * @port: the port we're looking at
431 * Update the value of the matched variable, using parameter values from a
432 * newly received lacpdu. Parameter values for the partner carried in the
433 * received PDU are compared with the corresponding operational parameter
434 * values for the actor. Matched is set to TRUE if all of these parameters
435 * match and the PDU parameter partner_state.aggregation has the same value as
436 * actor_oper_port_state.aggregation and lacp will actively maintain the link
437 * in the aggregation. Matched is also set to TRUE if the value of
438 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates
439 * an individual link and lacp will actively maintain the link. Otherwise,
440 * matched is set to FALSE. LACP is considered to be actively maintaining the
441 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both
442 * the actor's actor_oper_port_state.lacp_activity and the PDU's
443 * partner_state.lacp_activity variables are TRUE.
445 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is
446 * used here to implement the language from 802.3ad 43.4.9 that requires
447 * recordPDU to "match" the LACPDU parameters to the stored values.
/* Sets or clears AD_PORT_MATCHED in port->sm_vars.  The condition holds
 * when every partner_* field of the PDU (port, port priority, system MAC,
 * system priority, key and the AGGREGATION state bit) equals the port's
 * own actor value, or when the PDU's actor_state has AD_STATE_AGGREGATION
 * clear.  16-bit PDU fields are converted with ntohs() before comparing.
 * NOTE(review): the "else" separating the set and clear statements is not
 * part of this listing.
 */
449 static void __choose_matched(struct lacpdu *lacpdu, struct port *port)
451 /* check if all parameters are alike
452 * or this is individual link(aggregation == FALSE)
453 * then update the state machine Matched variable.
455 if (((ntohs(lacpdu->partner_port) == port->actor_port_number) &&
456 (ntohs(lacpdu->partner_port_priority) == port->actor_port_priority) &&
457 MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) &&
458 (ntohs(lacpdu->partner_system_priority) == port->actor_system_priority) &&
459 (ntohs(lacpdu->partner_key) == port->actor_oper_port_key) &&
460 ((lacpdu->partner_state & AD_STATE_AGGREGATION) == (port->actor_oper_port_state & AD_STATE_AGGREGATION))) ||
461 ((lacpdu->actor_state & AD_STATE_AGGREGATION) == 0)
463 port->sm_vars |= AD_PORT_MATCHED;
465 port->sm_vars &= ~AD_PORT_MATCHED;
470 * __record_pdu - record parameters from a received lacpdu
471 * @lacpdu: the lacpdu we've received
472 * @port: the port we're looking at
474 * Record the parameter values for the Actor carried in a received lacpdu as
475 * the current partner operational parameter values and sets
476 * actor_oper_port_state.defaulted to FALSE.
/* Does nothing unless both @lacpdu and @port are non-NULL.  Otherwise, in
 * order: re-evaluates AD_PORT_MATCHED via __choose_matched(), copies the
 * PDU's actor fields into port->partner_oper (ntohs() on the 16-bit
 * fields), clears AD_STATE_DEFAULTED in actor_oper_port_state, then
 * adjusts AD_STATE_SYNCHRONIZATION in the recorded partner state: it is
 * set when the port is matched and the PDU's actor_state carries the sync
 * bit, and the second assignment clears it.
 * NOTE(review): the "else" between the two sync assignments and the
 * slave_dbg() message arguments are not part of this listing.
 */
478 static void __record_pdu(struct lacpdu *lacpdu, struct port *port)
480 if (lacpdu && port) {
481 struct port_params *partner = &port->partner_oper;
483 __choose_matched(lacpdu, port);
484 /* record the new parameter values for the partner
487 partner->port_number = ntohs(lacpdu->actor_port);
488 partner->port_priority = ntohs(lacpdu->actor_port_priority);
489 partner->system = lacpdu->actor_system;
490 partner->system_priority = ntohs(lacpdu->actor_system_priority);
491 partner->key = ntohs(lacpdu->actor_key);
492 partner->port_state = lacpdu->actor_state;
494 /* set actor_oper_port_state.defaulted to FALSE */
495 port->actor_oper_port_state &= ~AD_STATE_DEFAULTED;
497 /* set the partner sync. to on if the partner is sync,
498 * and the port is matched
500 if ((port->sm_vars & AD_PORT_MATCHED) &&
501 (lacpdu->actor_state & AD_STATE_SYNCHRONIZATION)) {
502 partner->port_state |= AD_STATE_SYNCHRONIZATION;
503 slave_dbg(port->slave->bond->dev, port->slave->dev,
506 partner->port_state &= ~AD_STATE_SYNCHRONIZATION;
507 slave_dbg(port->slave->bond->dev, port->slave->dev,
514 * __record_default - record default parameters
515 * @port: the port we're looking at
517 * This function records the default parameter values for the partner carried
518 * in the Partner Admin parameters as the current partner operational parameter
519 * values and sets actor_oper_port_state.defaulted to TRUE.
/* Overwrites port->partner_oper with a byte copy of port->partner_admin
 * (sizeof(struct port_params) bytes) and then sets AD_STATE_DEFAULTED in
 * port->actor_oper_port_state.
 */
521 static void __record_default(struct port *port)
524 /* record the partner admin parameters */
525 memcpy(&port->partner_oper, &port->partner_admin,
526 sizeof(struct port_params));
528 /* set actor_oper_port_state.defaulted to true */
529 port->actor_oper_port_state |= AD_STATE_DEFAULTED;
534 * __update_selected - update a port's Selected variable from a received lacpdu
535 * @lacpdu: the lacpdu we've received
536 * @port: the port we're looking at
538 * Update the value of the selected variable, using parameter values from a
539 * newly received lacpdu. The parameter values for the Actor carried in the
540 * received PDU are compared with the corresponding operational parameter
541 * values for the ports partner. If one or more of the comparisons shows that
542 * the value(s) received in the PDU differ from the current operational values,
543 * then selected is set to FALSE and actor_oper_port_state.synchronization is
544 * set to out_of_sync. Otherwise, selected remains unchanged.
/* Does nothing unless both @lacpdu and @port are non-NULL.  Clears
 * AD_PORT_SELECTED in port->sm_vars when any actor field of the PDU (port,
 * port priority, system MAC, system priority, key, AGGREGATION state bit)
 * differs from the value recorded in port->partner_oper.  The visible
 * code changes nothing else.
 */
546 static void __update_selected(struct lacpdu *lacpdu, struct port *port)
548 if (lacpdu && port) {
549 const struct port_params *partner = &port->partner_oper;
551 /* check if any parameter is different then
552 * update the state machine selected variable.
554 if (ntohs(lacpdu->actor_port) != partner->port_number ||
555 ntohs(lacpdu->actor_port_priority) != partner->port_priority ||
556 !MAC_ADDRESS_EQUAL(&lacpdu->actor_system, &partner->system) ||
557 ntohs(lacpdu->actor_system_priority) != partner->system_priority ||
558 ntohs(lacpdu->actor_key) != partner->key ||
559 (lacpdu->actor_state & AD_STATE_AGGREGATION) != (partner->port_state & AD_STATE_AGGREGATION)) {
560 port->sm_vars &= ~AD_PORT_SELECTED;
566 * __update_default_selected - update a port's Selected variable from Partner
567 * @port: the port we're looking at
569 * This function updates the value of the selected variable, using the partner
570 * administrative parameter values. The administrative values are compared with
571 * the corresponding operational parameter values for the partner. If one or
572 * more of the comparisons shows that the administrative value(s) differ from
573 * the current operational values, then Selected is set to FALSE and
574 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise,
575 * Selected remains unchanged.
/* Clears AD_PORT_SELECTED in port->sm_vars when port->partner_admin and
 * port->partner_oper disagree on any of: port number, port priority,
 * system MAC, system priority, key, or the AGGREGATION state bit.  The
 * visible code changes nothing else.
 */
577 static void __update_default_selected(struct port *port)
580 const struct port_params *admin = &port->partner_admin;
581 const struct port_params *oper = &port->partner_oper;
583 /* check if any parameter is different then
584 * update the state machine selected variable.
586 if (admin->port_number != oper->port_number ||
587 admin->port_priority != oper->port_priority ||
588 !MAC_ADDRESS_EQUAL(&admin->system, &oper->system) ||
589 admin->system_priority != oper->system_priority ||
590 admin->key != oper->key ||
591 (admin->port_state & AD_STATE_AGGREGATION)
592 != (oper->port_state & AD_STATE_AGGREGATION)) {
593 port->sm_vars &= ~AD_PORT_SELECTED;
599 * __update_ntt - update a port's ntt variable from a received lacpdu
600 * @lacpdu: the lacpdu we've received
601 * @port: the port we're looking at
603 * Updates the value of the ntt variable, using parameter values from a newly
604 * received lacpdu. The parameter values for the partner carried in the
605 * received PDU are compared with the corresponding operational parameter
606 * values for the Actor. If one or more of the comparisons shows that the
607 * value(s) received in the PDU differ from the current operational values,
608 * then ntt is set to TRUE. Otherwise, ntt remains unchanged.
/* Does nothing unless both @lacpdu and @port are non-NULL.  The condition
 * is true when the PDU's view of us (its partner_* fields) differs from
 * the port's actor values in any of: port, port priority, system MAC,
 * system priority, key, or the LACP_ACTIVITY, LACP_TIMEOUT,
 * SYNCHRONIZATION and AGGREGATION state bits.
 * NOTE(review): the statement executed on a mismatch is not part of this
 * listing; per the inline comment it updates port->ntt.
 */
610 static void __update_ntt(struct lacpdu *lacpdu, struct port *port)
612 /* validate lacpdu and port */
613 if (lacpdu && port) {
614 /* check if any parameter is different then
615 * update the port->ntt.
617 if ((ntohs(lacpdu->partner_port) != port->actor_port_number) ||
618 (ntohs(lacpdu->partner_port_priority) != port->actor_port_priority) ||
619 !MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) ||
620 (ntohs(lacpdu->partner_system_priority) != port->actor_system_priority) ||
621 (ntohs(lacpdu->partner_key) != port->actor_oper_port_key) ||
622 ((lacpdu->partner_state & AD_STATE_LACP_ACTIVITY) != (port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY)) ||
623 ((lacpdu->partner_state & AD_STATE_LACP_TIMEOUT) != (port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT)) ||
624 ((lacpdu->partner_state & AD_STATE_SYNCHRONIZATION) != (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) ||
625 ((lacpdu->partner_state & AD_STATE_AGGREGATION) != (port->actor_oper_port_state & AD_STATE_AGGREGATION))
633 * __agg_ports_are_ready - check if all ports in an aggregator are ready
634 * @aggregator: the aggregator we're looking at
/* Walks aggregator->lag_ports through next_port_in_aggregator and tests
 * AD_PORT_READY_N in each port's sm_vars.
 * NOTE(review): the loop condition, the action taken for a port without
 * READY_N and the return value are not part of this listing.
 */
637 static int __agg_ports_are_ready(struct aggregator *aggregator)
643 /* scan all ports in this aggregator to verify if they are
646 for (port = aggregator->lag_ports;
648 port = port->next_port_in_aggregator) {
649 if (!(port->sm_vars & AD_PORT_READY_N)) {
660 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator
661 * @aggregator: the aggregator we're looking at
662 * @val: Should the ports' ready bit be set on or off
/* Walks every port on aggregator->lag_ports and either sets or clears
 * AD_PORT_READY in its sm_vars.
 * NOTE(review): the test that picks between setting and clearing is not
 * part of this listing; per the kernel-doc it depends on @val.
 */
665 static void __set_agg_ports_ready(struct aggregator *aggregator, int val)
669 for (port = aggregator->lag_ports; port;
670 port = port->next_port_in_aggregator) {
672 port->sm_vars |= AD_PORT_READY;
674 port->sm_vars &= ~AD_PORT_READY;
/* Walks agg->lag_ports and tests port->is_enabled on each port; the result
 * is used by __get_agg_bandwidth() as its port count.
 * NOTE(review): the counter and the return are not part of this listing
 * -- presumably the number of enabled ports is returned.
 */
678 static int __agg_active_ports(struct aggregator *agg)
683 for (port = agg->lag_ports; port;
684 port = port->next_port_in_aggregator) {
685 if (port->is_enabled)
693 * __get_agg_bandwidth - get the total bandwidth of an aggregator
694 * @aggregator: the aggregator we're looking at
/* Computes bandwidth as nports (from __agg_active_ports()) multiplied by
 * the per-port rate implied by the link-speed code.  Only the speed of
 * the first port on aggregator->lag_ports is consulted, via
 * __get_link_speed(); an unmatched code gives 0.
 * NOTE(review): the declaration of bandwidth, the body of the 1MBPS case,
 * the break statements, the default label and the return are not part of
 * this listing.  __get_link_speed() dereferences its argument, so confirm
 * that lag_ports cannot be NULL when the switch is reached.
 */
697 static u32 __get_agg_bandwidth(struct aggregator *aggregator)
699 int nports = __agg_active_ports(aggregator);
703 switch (__get_link_speed(aggregator->lag_ports)) {
704 case AD_LINK_SPEED_1MBPS:
707 case AD_LINK_SPEED_10MBPS:
708 bandwidth = nports * 10;
710 case AD_LINK_SPEED_100MBPS:
711 bandwidth = nports * 100;
713 case AD_LINK_SPEED_1000MBPS:
714 bandwidth = nports * 1000;
716 case AD_LINK_SPEED_2500MBPS:
717 bandwidth = nports * 2500;
719 case AD_LINK_SPEED_5000MBPS:
720 bandwidth = nports * 5000;
722 case AD_LINK_SPEED_10000MBPS:
723 bandwidth = nports * 10000;
725 case AD_LINK_SPEED_14000MBPS:
726 bandwidth = nports * 14000;
728 case AD_LINK_SPEED_20000MBPS:
729 bandwidth = nports * 20000;
731 case AD_LINK_SPEED_25000MBPS:
732 bandwidth = nports * 25000;
734 case AD_LINK_SPEED_40000MBPS:
735 bandwidth = nports * 40000;
737 case AD_LINK_SPEED_50000MBPS:
738 bandwidth = nports * 50000;
740 case AD_LINK_SPEED_56000MBPS:
741 bandwidth = nports * 56000;
743 case AD_LINK_SPEED_100000MBPS:
744 bandwidth = nports * 100000;
747 bandwidth = 0; /* to silence the compiler */
754 * __get_active_agg - get the current active aggregator
755 * @aggregator: the aggregator we're looking at
757 * Caller must hold RCU lock.
/* Iterates the slaves of aggregator->slave->bond with
 * bond_for_each_slave_rcu() and returns the embedded aggregator of the
 * first slave whose aggregator.is_active is set.
 * NOTE(review): the declaration of slave and the return used when no
 * aggregator is active are not part of this listing (presumably NULL).
 */
759 static struct aggregator *__get_active_agg(struct aggregator *aggregator)
761 struct bonding *bond = aggregator->slave->bond;
762 struct list_head *iter;
765 bond_for_each_slave_rcu(bond, slave, iter)
766 if (SLAVE_AD_INFO(slave)->aggregator.is_active)
767 return &(SLAVE_AD_INFO(slave)->aggregator);
773 * __update_lacpdu_from_port - update a port's lacpdu fields
774 * @port: the port we're looking at
/* Refreshes the variable fields of port->lacpdu.  The actor fields come
 * from the port's own actor values and the partner fields from
 * port->partner_oper; 16-bit values are stored with htons().  The fields
 * that the inline comments list as "initialized" are not written here.
 * The actor port state is also logged with slave_dbg().
 */
776 static inline void __update_lacpdu_from_port(struct port *port)
778 struct lacpdu *lacpdu = &port->lacpdu;
779 const struct port_params *partner = &port->partner_oper;
781 /* update current actual Actor parameters
782 * lacpdu->subtype initialized
783 * lacpdu->version_number initialized
784 * lacpdu->tlv_type_actor_info initialized
785 * lacpdu->actor_information_length initialized
788 lacpdu->actor_system_priority = htons(port->actor_system_priority);
789 lacpdu->actor_system = port->actor_system;
790 lacpdu->actor_key = htons(port->actor_oper_port_key);
791 lacpdu->actor_port_priority = htons(port->actor_port_priority);
792 lacpdu->actor_port = htons(port->actor_port_number);
793 lacpdu->actor_state = port->actor_oper_port_state;
794 slave_dbg(port->slave->bond->dev, port->slave->dev,
795 "update lacpdu: actor port state %x\n",
796 port->actor_oper_port_state);
798 /* lacpdu->reserved_3_1 initialized
799 * lacpdu->tlv_type_partner_info initialized
800 * lacpdu->partner_information_length initialized
803 lacpdu->partner_system_priority = htons(partner->system_priority);
804 lacpdu->partner_system = partner->system;
805 lacpdu->partner_key = htons(partner->key);
806 lacpdu->partner_port_priority = htons(partner->port_priority);
807 lacpdu->partner_port = htons(partner->port_number);
808 lacpdu->partner_state = partner->port_state;
810 /* lacpdu->reserved_3_2 initialized
811 * lacpdu->tlv_type_collector_info initialized
812 * lacpdu->collector_information_length initialized
813 * collector_max_delay initialized
814 * reserved_12[12] initialized
815 * tlv_type_terminator initialized
816 * terminator_length initialized
817 * reserved_50[50] initialized
821 /* ================= main 802.3ad protocol code ========================= */
824 * ad_lacpdu_send - send out a lacpdu packet on a given port
825 * @port: the port we're looking at
827 * Returns: 0 on success
/* Builds one LACPDU frame for @port.  An skb of
 * sizeof(struct lacpdu_header) bytes is allocated, the per-slave and
 * per-bond lacpdu_tx counters are incremented, and the skb is tagged with
 * the slave's device, PKT_TYPE_LACPDU and TC_PRIO_CONTROL priority.  The
 * Ethernet header gets lacpdu_mcast_addr as destination and the slave's
 * permanent address as source; the payload is a copy of port->lacpdu.
 * NOTE(review): the declaration of skb, the allocation-failure check, the
 * transmit call and the return are not part of this listing.
 */
830 static int ad_lacpdu_send(struct port *port)
832 struct slave *slave = port->slave;
834 struct lacpdu_header *lacpdu_header;
835 int length = sizeof(struct lacpdu_header);
837 skb = dev_alloc_skb(length);
841 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_tx);
842 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.lacpdu_tx);
844 skb->dev = slave->dev;
845 skb_reset_mac_header(skb);
846 skb->network_header = skb->mac_header + ETH_HLEN;
847 skb->protocol = PKT_TYPE_LACPDU;
848 skb->priority = TC_PRIO_CONTROL;
850 lacpdu_header = skb_put(skb, length);
852 ether_addr_copy(lacpdu_header->hdr.h_dest, lacpdu_mcast_addr);
853 /* Note: source address is set to be the member's PERMANENT address,
854 * because we use it to identify loopback lacpdus in receive.
856 ether_addr_copy(lacpdu_header->hdr.h_source, slave->perm_hwaddr);
857 lacpdu_header->hdr.h_proto = PKT_TYPE_LACPDU;
859 lacpdu_header->lacpdu = port->lacpdu;
867 * ad_marker_send - send marker information/response on a given port
868 * @port: the port we're looking at
869 * @marker: marker data to send
871 * Returns: 0 on success
/* Builds one marker frame for @port from @marker.  The skb is allocated
 * with 16 extra bytes, which are then reserved as headroom.  Depending on
 * marker->tlv_type, either the marker_tx or the marker_resp_tx counters
 * (per slave and per bond) are incremented.  The Ethernet header gets
 * lacpdu_mcast_addr as destination, the slave's permanent address as
 * source and PKT_TYPE_LACPDU as protocol; the payload is a copy of
 * *@marker.
 * NOTE(review): unlike ad_lacpdu_send(), the visible lines do not set
 * skb->priority.  The declaration of skb, the allocation-failure check,
 * the break statements, the transmit call and the return are not part of
 * this listing.
 */
874 static int ad_marker_send(struct port *port, struct bond_marker *marker)
876 struct slave *slave = port->slave;
878 struct bond_marker_header *marker_header;
879 int length = sizeof(struct bond_marker_header);
881 skb = dev_alloc_skb(length + 16);
885 switch (marker->tlv_type) {
886 case AD_MARKER_INFORMATION_SUBTYPE:
887 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.marker_tx);
888 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.marker_tx);
890 case AD_MARKER_RESPONSE_SUBTYPE:
891 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.marker_resp_tx);
892 atomic64_inc(&BOND_AD_INFO(slave->bond).stats.marker_resp_tx);
896 skb_reserve(skb, 16);
898 skb->dev = slave->dev;
899 skb_reset_mac_header(skb);
900 skb->network_header = skb->mac_header + ETH_HLEN;
901 skb->protocol = PKT_TYPE_LACPDU;
903 marker_header = skb_put(skb, length);
905 ether_addr_copy(marker_header->hdr.h_dest, lacpdu_mcast_addr);
906 /* Note: source address is set to be the member's PERMANENT address,
907 * because we use it to identify loopback MARKERs in receive.
909 ether_addr_copy(marker_header->hdr.h_source, slave->perm_hwaddr);
910 marker_header->hdr.h_proto = PKT_TYPE_LACPDU;
912 marker_header->marker = *marker;
920 * ad_mux_machine - handle a port's mux state machine
921 * @port: the port we're looking at
922 * @update_slave_arr: Does slave array need update?
/* Runs one step of the mux state machine for @port, in two phases.
 *
 * Phase 1 picks the next state.  The current state is saved in
 * last_state.  AD_PORT_BEGIN forces AD_MUX_DETACHED; otherwise the switch
 * on port->sm_mux_state decides from the SELECTED/STANDBY/READY bits in
 * sm_vars, the wait-while counter sm_mux_timer_counter, the partner and
 * actor SYNCHRONIZATION bits, __check_agg_selection_timer() and whether
 * the port's aggregator is active.  Whenever READY_N changes, READY is
 * recomputed for the whole aggregator through __agg_ports_are_ready() and
 * __set_agg_ports_ready().
 *
 * Phase 2 runs only when the state changed.  It logs the transition and
 * applies the new state's entry actions: adjusting the SYNCHRONIZATION,
 * COLLECTING and DISTRIBUTING bits of actor_oper_port_state, arming the
 * wait-while timer on entry to AD_MUX_WAITING, and calling
 * ad_disable_collecting_distributing() or
 * ad_enable_collecting_distributing().
 *
 * NOTE(review): this listing omits lines of the function (at least one
 * case label of the first switch, the break and else statements, several
 * call arguments and the closing braces); consult the complete source
 * before changing the control flow.
 */
924 static void ad_mux_machine(struct port *port, bool *update_slave_arr)
926 mux_states_t last_state;
928 /* keep current State Machine state to compare later if it was
931 last_state = port->sm_mux_state;
933 if (port->sm_vars & AD_PORT_BEGIN) {
934 port->sm_mux_state = AD_MUX_DETACHED;
936 switch (port->sm_mux_state) {
937 case AD_MUX_DETACHED:
938 if ((port->sm_vars & AD_PORT_SELECTED)
939 || (port->sm_vars & AD_PORT_STANDBY))
940 /* if SELECTED or STANDBY */
941 port->sm_mux_state = AD_MUX_WAITING;
944 /* if SELECTED == FALSE return to DETACH state */
945 if (!(port->sm_vars & AD_PORT_SELECTED)) {
946 port->sm_vars &= ~AD_PORT_READY_N;
947 /* in order to withhold the Selection Logic to
948 * check all ports READY_N value every callback
949 * cycle to update ready variable, we check
950 * READY_N and update READY here
952 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
953 port->sm_mux_state = AD_MUX_DETACHED;
957 /* check if the wait_while_timer expired */
958 if (port->sm_mux_timer_counter
959 && !(--port->sm_mux_timer_counter))
960 port->sm_vars |= AD_PORT_READY_N;
962 /* in order to withhold the selection logic to check
963 * all ports READY_N value every callback cycle to
964 * update ready variable, we check READY_N and update
967 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
969 /* if the wait_while_timer expired, and the port is
970 * in READY state, move to ATTACHED state
972 if ((port->sm_vars & AD_PORT_READY)
973 && !port->sm_mux_timer_counter)
974 port->sm_mux_state = AD_MUX_ATTACHED;
976 case AD_MUX_ATTACHED:
977 /* check also if agg_select_timer expired (so the
978 * port is enabled only after this timer)
980 if ((port->sm_vars & AD_PORT_SELECTED) &&
981 (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) &&
982 !__check_agg_selection_timer(port)) {
983 if (port->aggregator->is_active)
985 AD_MUX_COLLECTING_DISTRIBUTING;
986 } else if (!(port->sm_vars & AD_PORT_SELECTED) ||
987 (port->sm_vars & AD_PORT_STANDBY)) {
988 /* if UNSELECTED or STANDBY */
989 port->sm_vars &= ~AD_PORT_READY_N;
990 /* in order to withhold the selection logic to
991 * check all ports READY_N value every callback
992 * cycle to update ready variable, we check
993 * READY_N and update READY here
995 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
996 port->sm_mux_state = AD_MUX_DETACHED;
997 } else if (port->aggregator->is_active) {
998 port->actor_oper_port_state |=
999 AD_STATE_SYNCHRONIZATION;
1002 case AD_MUX_COLLECTING_DISTRIBUTING:
1003 if (!(port->sm_vars & AD_PORT_SELECTED) ||
1004 (port->sm_vars & AD_PORT_STANDBY) ||
1005 !(port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) ||
1006 !(port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) {
1007 port->sm_mux_state = AD_MUX_ATTACHED;
1009 /* if port state hasn't changed make
1010 * sure that a collecting distributing
1011 * port in an active aggregator is enabled
1013 if (port->aggregator &&
1014 port->aggregator->is_active &&
1015 !__port_is_enabled(port)) {
1017 __enable_port(port);
1026 /* check if the state machine was changed */
1027 if (port->sm_mux_state != last_state) {
1028 slave_dbg(port->slave->bond->dev, port->slave->dev,
1029 "Mux Machine: Port=%d, Last State=%d, Curr State=%d\n",
1030 port->actor_port_number,
1032 port->sm_mux_state);
1033 switch (port->sm_mux_state) {
1034 case AD_MUX_DETACHED:
1035 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
1036 ad_disable_collecting_distributing(port,
1038 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
1039 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
1042 case AD_MUX_WAITING:
1043 port->sm_mux_timer_counter = __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER, 0);
1045 case AD_MUX_ATTACHED:
1046 if (port->aggregator->is_active)
1047 port->actor_oper_port_state |=
1048 AD_STATE_SYNCHRONIZATION;
1050 port->actor_oper_port_state &=
1051 ~AD_STATE_SYNCHRONIZATION;
1052 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
1053 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
1054 ad_disable_collecting_distributing(port,
1058 case AD_MUX_COLLECTING_DISTRIBUTING:
1059 port->actor_oper_port_state |= AD_STATE_COLLECTING;
1060 port->actor_oper_port_state |= AD_STATE_DISTRIBUTING;
1061 port->actor_oper_port_state |= AD_STATE_SYNCHRONIZATION;
1062 ad_enable_collecting_distributing(port,
1073 * ad_rx_machine - handle a port's rx State Machine
1074 * @lacpdu: the lacpdu we've received
1075 * @port: the port we're looking at
1077 * If lacpdu arrived, stop previous timer (if exists) and set the next state as
1078 * CURRENT. If timer expired set the state machine in the proper state.
1079 * In other cases, this function checks if we need to switch to other state.
/* Receive state machine step for @port; @lacpdu is the frame that was just
 * received and is tested for NULL below when nothing arrived.
 *
 * The current sm_rx_state is saved, then the next state is chosen in this
 * order: AD_PORT_BEGIN set -> AD_RX_INITIALIZE; port not enabled ->
 * AD_RX_PORT_DISABLED; a LACPDU arriving while in EXPIRED/DEFAULTED/CURRENT
 * -> AD_RX_CURRENT (with the rx timer cleared); otherwise the rx timer is
 * counted down and, failing that, the PORT_DISABLED state is re-evaluated.
 * The per-state actions run only when the state changed or a LACPDU arrived.
 *
 * NOTE(review): this listing omits brace-only, else, case-label and break
 * lines; the two atomic64_inc() calls are presumably guarded by a check on
 * @lacpdu - confirm against the full file.
 */
1081 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port)
1083 rx_states_t last_state;
1085 /* keep current State Machine state to compare later if it was
1088 last_state = port->sm_rx_state;
1091 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.lacpdu_rx);
1092 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.lacpdu_rx);
1094 /* check if state machine should change state */
1096 /* first, check if port was reinitialized */
1097 if (port->sm_vars & AD_PORT_BEGIN) {
1098 port->sm_rx_state = AD_RX_INITIALIZE;
1099 port->sm_vars |= AD_PORT_CHURNED;
1100 /* check if port is not enabled */
1101 } else if (!(port->sm_vars & AD_PORT_BEGIN) && !port->is_enabled)
1102 port->sm_rx_state = AD_RX_PORT_DISABLED;
1103 /* check if new lacpdu arrived */
1104 else if (lacpdu && ((port->sm_rx_state == AD_RX_EXPIRED) ||
1105 (port->sm_rx_state == AD_RX_DEFAULTED) ||
1106 (port->sm_rx_state == AD_RX_CURRENT))) {
1107 if (port->sm_rx_state != AD_RX_CURRENT)
1108 port->sm_vars |= AD_PORT_CHURNED;
1109 port->sm_rx_timer_counter = 0;
1110 port->sm_rx_state = AD_RX_CURRENT;
1112 /* if timer is on, and if it is expired */
1113 if (port->sm_rx_timer_counter &&
1114 !(--port->sm_rx_timer_counter)) {
1115 switch (port->sm_rx_state) {
1117 port->sm_rx_state = AD_RX_DEFAULTED;
1120 port->sm_rx_state = AD_RX_EXPIRED;
1126 /* if no lacpdu arrived and no timer is on */
1127 switch (port->sm_rx_state) {
1128 case AD_RX_PORT_DISABLED:
1129 if (port->is_enabled &&
1130 (port->sm_vars & AD_PORT_LACP_ENABLED))
1131 port->sm_rx_state = AD_RX_EXPIRED;
1132 else if (port->is_enabled
1134 & AD_PORT_LACP_ENABLED) == 0))
1135 port->sm_rx_state = AD_RX_LACP_DISABLED;
1144 /* check if the State machine was changed or new lacpdu arrived */
1145 if ((port->sm_rx_state != last_state) || (lacpdu)) {
1146 slave_dbg(port->slave->bond->dev, port->slave->dev,
1147 "Rx Machine: Port=%d, Last State=%d, Curr State=%d\n",
1148 port->actor_port_number,
1151 switch (port->sm_rx_state) {
1152 case AD_RX_INITIALIZE:
1153 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS))
1154 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1156 port->sm_vars |= AD_PORT_LACP_ENABLED;
1157 port->sm_vars &= ~AD_PORT_SELECTED;
1158 __record_default(port);
1159 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1160 port->sm_rx_state = AD_RX_PORT_DISABLED;
1163 case AD_RX_PORT_DISABLED:
1164 port->sm_vars &= ~AD_PORT_MATCHED;
1166 case AD_RX_LACP_DISABLED:
1167 port->sm_vars &= ~AD_PORT_SELECTED;
1168 __record_default(port);
1169 port->partner_oper.port_state &= ~AD_STATE_AGGREGATION;
1170 port->sm_vars |= AD_PORT_MATCHED;
1171 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1174 /* Reset of the Synchronization flag (Standard 43.4.12)
1175 * This reset cause to disable this port in the
1176 * COLLECTING_DISTRIBUTING state of the mux machine in
1177 * case of EXPIRED even if LINK_DOWN didn't arrive for
1180 port->partner_oper.port_state &= ~AD_STATE_SYNCHRONIZATION;
1181 port->sm_vars &= ~AD_PORT_MATCHED;
1182 port->partner_oper.port_state |= AD_STATE_LACP_TIMEOUT;
1183 port->partner_oper.port_state |= AD_STATE_LACP_ACTIVITY;
1184 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT));
1185 port->actor_oper_port_state |= AD_STATE_EXPIRED;
1186 port->sm_vars |= AD_PORT_CHURNED;
1188 case AD_RX_DEFAULTED:
1189 __update_default_selected(port);
1190 __record_default(port);
1191 port->sm_vars |= AD_PORT_MATCHED;
1192 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1195 /* detect loopback situation */
1196 if (MAC_ADDRESS_EQUAL(&(lacpdu->actor_system),
1197 &(port->actor_system))) {
1198 slave_err(port->slave->bond->dev, port->slave->dev, "An illegal loopback occurred on slave\n"
1199 "Check the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n");
1202 __update_selected(lacpdu, port);
1203 __update_ntt(lacpdu, port);
1204 __record_pdu(lacpdu, port);
1205 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT));
1206 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1215 * ad_churn_machine - handle port churn's state machine
1216 * @port: the port we're looking at
/* Churn detection step for @port.
 *
 * If any AD_PORT_CHURNED bit is set in sm_vars it is cleared, both the actor
 * and partner churn states are put into AD_CHURN_MONITOR and both churn
 * timers are reloaded. Each timer is then counted down (only while it is
 * non-zero); on the tick where it reaches zero with its side still in
 * AD_CHURN_MONITOR, the matching SYNCHRONIZATION bit (actor_oper_port_state
 * for the actor, partner_oper.port_state for the partner) selects
 * AD_NO_CHURN, while the alternative path increments the churn counter and
 * sets AD_CHURN.
 *
 * NOTE(review): the else lines separating the two outcomes are not visible
 * in this listing.
 */
1219 static void ad_churn_machine(struct port *port)
1221 if (port->sm_vars & AD_PORT_CHURNED) {
1222 port->sm_vars &= ~AD_PORT_CHURNED;
1223 port->sm_churn_actor_state = AD_CHURN_MONITOR;
1224 port->sm_churn_partner_state = AD_CHURN_MONITOR;
1225 port->sm_churn_actor_timer_counter =
1226 __ad_timer_to_ticks(AD_ACTOR_CHURN_TIMER, 0);
1227 port->sm_churn_partner_timer_counter =
1228 __ad_timer_to_ticks(AD_PARTNER_CHURN_TIMER, 0);
1231 if (port->sm_churn_actor_timer_counter &&
1232 !(--port->sm_churn_actor_timer_counter) &&
1233 port->sm_churn_actor_state == AD_CHURN_MONITOR) {
1234 if (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION) {
1235 port->sm_churn_actor_state = AD_NO_CHURN;
1237 port->churn_actor_count++;
1238 port->sm_churn_actor_state = AD_CHURN;
1241 if (port->sm_churn_partner_timer_counter &&
1242 !(--port->sm_churn_partner_timer_counter) &&
1243 port->sm_churn_partner_state == AD_CHURN_MONITOR) {
1244 if (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) {
1245 port->sm_churn_partner_state = AD_NO_CHURN;
1247 port->churn_partner_count++;
1248 port->sm_churn_partner_state = AD_CHURN;
1254 * ad_tx_machine - handle a port's tx state machine
1255 * @port: the port we're looking at
/* Transmit step for @port.
 *
 * Work happens only on the tick where a non-zero sm_tx_timer_counter is
 * decremented to zero. At that point, if port->ntt is set and
 * AD_PORT_LACP_ENABLED is on, the LACPDU is refreshed from the port and sent
 * with ad_lacpdu_send(); a non-negative return is treated as success. The
 * timer is then reloaded with ad_ticks_per_sec / AD_MAX_TX_IN_SECOND.
 *
 * NOTE(review): the statement that clears ntt after a successful send is
 * described by the comment below but is not visible in this listing.
 */
1257 static void ad_tx_machine(struct port *port)
1259 /* check if tx timer expired, to verify that we do not send more than
1260 * 3 packets per second
1262 if (port->sm_tx_timer_counter && !(--port->sm_tx_timer_counter)) {
1263 /* check if there is something to send */
1264 if (port->ntt && (port->sm_vars & AD_PORT_LACP_ENABLED)) {
1265 __update_lacpdu_from_port(port);
1267 if (ad_lacpdu_send(port) >= 0) {
1268 slave_dbg(port->slave->bond->dev,
1270 "Sent LACPDU on port %d\n",
1271 port->actor_port_number);
1273 /* mark ntt as false, so it will not be sent
1274 * again until demanded
1279 /* restart tx timer(to verify that we will not exceed
1280 * AD_MAX_TX_IN_SECOND
1282 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1287 * ad_periodic_machine - handle a port's periodic state machine
1288 * @port: the port we're looking at
1290 * Turn ntt flag on periodically to perform periodic transmission of LACPDUs.
/* Periodic-transmission step for @port.
 *
 * The current sm_periodic_state is saved first. The state is forced to
 * AD_NO_PERIODIC when AD_PORT_BEGIN is set, AD_PORT_LACP_ENABLED is clear,
 * the port is not enabled, or neither the actor nor the partner has
 * AD_STATE_LACP_ACTIVITY set. Otherwise a running periodic timer is counted
 * down: expiry moves to AD_PERIODIC_TX, and while it is still running the
 * partner's AD_STATE_LACP_TIMEOUT bit can switch FAST -> SLOW or cut a SLOW
 * period short (timer zeroed, state AD_PERIODIC_TX). With no timer running,
 * NO_PERIODIC advances to FAST and PERIODIC_TX picks SLOW or FAST from the
 * partner's timeout bit. When the state changed, the timer is reloaded for
 * the new state (zero for NO_PERIODIC, period minus one tick for FAST/SLOW).
 *
 * NOTE(review): else/break lines and the AD_PERIODIC_TX action are not
 * visible in this listing.
 */
1292 static void ad_periodic_machine(struct port *port)
1294 periodic_states_t last_state;
1296 /* keep current state machine state to compare later if it was changed */
1297 last_state = port->sm_periodic_state;
1299 /* check if port was reinitialized */
1300 if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) ||
1301 (!(port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & AD_STATE_LACP_ACTIVITY))
1303 port->sm_periodic_state = AD_NO_PERIODIC;
1305 /* check if state machine should change state */
1306 else if (port->sm_periodic_timer_counter) {
1307 /* check if periodic state machine expired */
1308 if (!(--port->sm_periodic_timer_counter)) {
1309 /* if expired then do tx */
1310 port->sm_periodic_state = AD_PERIODIC_TX;
1312 /* If not expired, check if there is some new timeout
1313 * parameter from the partner state
1315 switch (port->sm_periodic_state) {
1316 case AD_FAST_PERIODIC:
1317 if (!(port->partner_oper.port_state
1318 & AD_STATE_LACP_TIMEOUT))
1319 port->sm_periodic_state = AD_SLOW_PERIODIC;
1321 case AD_SLOW_PERIODIC:
1322 if ((port->partner_oper.port_state & AD_STATE_LACP_TIMEOUT)) {
1323 port->sm_periodic_timer_counter = 0;
1324 port->sm_periodic_state = AD_PERIODIC_TX;
1332 switch (port->sm_periodic_state) {
1333 case AD_NO_PERIODIC:
1334 port->sm_periodic_state = AD_FAST_PERIODIC;
1336 case AD_PERIODIC_TX:
1337 if (!(port->partner_oper.port_state &
1338 AD_STATE_LACP_TIMEOUT))
1339 port->sm_periodic_state = AD_SLOW_PERIODIC;
1341 port->sm_periodic_state = AD_FAST_PERIODIC;
1348 /* check if the state machine was changed */
1349 if (port->sm_periodic_state != last_state) {
1350 slave_dbg(port->slave->bond->dev, port->slave->dev,
1351 "Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n",
1352 port->actor_port_number, last_state,
1353 port->sm_periodic_state);
1354 switch (port->sm_periodic_state) {
1355 case AD_NO_PERIODIC:
1356 port->sm_periodic_timer_counter = 0;
1358 case AD_FAST_PERIODIC:
1359 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1360 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_FAST_PERIODIC_TIME))-1;
1362 case AD_SLOW_PERIODIC:
1363 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1364 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_SLOW_PERIODIC_TIME))-1;
1366 case AD_PERIODIC_TX:
1376 * ad_port_selection_logic - select aggregation groups
1377 * @port: the port we're looking at
1378 * @update_slave_arr: Does slave array need update?
1380 * Select aggregation groups, and assign each port to its aggregator. The
1381 * selection logic is called during initialization (after all the handshakes),
1382 * and after every LACPDU is received (if selected is off).
/* Attach @port to an aggregator.
 *
 * Nothing is done when AD_PORT_SELECTED is already set. Otherwise:
 *  1. If the port currently has an aggregator, it is unlinked from that
 *     aggregator's lag_ports list (num_of_ports decremented, back-references
 *     cleared); an aggregator left with no ports is reset via
 *     ad_clear_agg(). A rate-limited warning is printed when the port was
 *     not found on the list.
 *  2. Every slave's aggregator is scanned: the first empty one is remembered
 *     as a fallback, and a non-empty one whose keys and partner identity
 *     match the port gets the port pushed at the head of its lag_ports.
 *  3. If no match was found, the remembered empty aggregator (if any) is
 *     populated from the port's own parameters and becomes a new LAG;
 *     otherwise an error is logged.
 *  4. The READY flags of the aggregator's ports are recomputed and
 *     ad_agg_selection_logic() is run, with @update_slave_arr passed
 *     through; SYNCHRONIZATION is cleared if the port's aggregator is not
 *     active.
 *
 * NOTE(review): return/break/else/continue lines and part of the matching
 * condition are not visible in this listing - confirm the exact control
 * flow against the full file.
 */
1384 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr)
1386 struct aggregator *aggregator, *free_aggregator = NULL, *temp_aggregator;
1387 struct port *last_port = NULL, *curr_port;
1388 struct list_head *iter;
1389 struct bonding *bond;
1390 struct slave *slave;
1393 /* if the port is already Selected, do nothing */
1394 if (port->sm_vars & AD_PORT_SELECTED)
1397 bond = __get_bond_by_port(port);
1399 /* if the port is connected to other aggregator, detach it */
1400 if (port->aggregator) {
1401 /* detach the port from its former aggregator */
1402 temp_aggregator = port->aggregator;
1403 for (curr_port = temp_aggregator->lag_ports; curr_port;
1404 last_port = curr_port,
1405 curr_port = curr_port->next_port_in_aggregator) {
1406 if (curr_port == port) {
1407 temp_aggregator->num_of_ports--;
1408 /* if it is the first port attached to the
1412 temp_aggregator->lag_ports =
1413 port->next_port_in_aggregator;
1415 /* not the first port attached to the
1418 last_port->next_port_in_aggregator =
1419 port->next_port_in_aggregator;
1422 /* clear the port's relations to this
1425 port->aggregator = NULL;
1426 port->next_port_in_aggregator = NULL;
1427 port->actor_port_aggregator_identifier = 0;
1429 slave_dbg(bond->dev, port->slave->dev, "Port %d left LAG %d\n",
1430 port->actor_port_number,
1431 temp_aggregator->aggregator_identifier);
1432 /* if the aggregator is empty, clear its
1433 * parameters, and set it ready to be attached
1435 if (!temp_aggregator->lag_ports)
1436 ad_clear_agg(temp_aggregator);
1441 /* meaning: the port was related to an aggregator
1442 * but was not on the aggregator port list
1444 net_warn_ratelimited("%s: (slave %s): Warning: Port %d was related to aggregator %d but was not on its port list\n",
1445 port->slave->bond->dev->name,
1446 port->slave->dev->name,
1447 port->actor_port_number,
1448 port->aggregator->aggregator_identifier);
1451 /* search on all aggregators for a suitable aggregator for this port */
1452 bond_for_each_slave(bond, slave, iter) {
1453 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
1455 /* keep a free aggregator for later use(if needed) */
1456 if (!aggregator->lag_ports) {
1457 if (!free_aggregator)
1458 free_aggregator = aggregator;
1461 /* check if current aggregator suits us */
1462 if (((aggregator->actor_oper_aggregator_key == port->actor_oper_port_key) && /* if all parameters match AND */
1463 MAC_ADDRESS_EQUAL(&(aggregator->partner_system), &(port->partner_oper.system)) &&
1464 (aggregator->partner_system_priority == port->partner_oper.system_priority) &&
1465 (aggregator->partner_oper_aggregator_key == port->partner_oper.key)
1467 ((!MAC_ADDRESS_EQUAL(&(port->partner_oper.system), &(null_mac_addr)) && /* partner answers */
1468 !aggregator->is_individual) /* but is not individual OR */
1471 /* attach to the found aggregator */
1472 port->aggregator = aggregator;
1473 port->actor_port_aggregator_identifier =
1474 port->aggregator->aggregator_identifier;
1475 port->next_port_in_aggregator = aggregator->lag_ports;
1476 port->aggregator->num_of_ports++;
1477 aggregator->lag_ports = port;
1478 slave_dbg(bond->dev, slave->dev, "Port %d joined LAG %d (existing LAG)\n",
1479 port->actor_port_number,
1480 port->aggregator->aggregator_identifier);
1482 /* mark this port as selected */
1483 port->sm_vars |= AD_PORT_SELECTED;
1489 /* the port couldn't find an aggregator - attach it to a new
1493 if (free_aggregator) {
1494 /* assign port a new aggregator */
1495 port->aggregator = free_aggregator;
1496 port->actor_port_aggregator_identifier =
1497 port->aggregator->aggregator_identifier;
1499 /* update the new aggregator's parameters
1500 * if port was responsed from the end-user
1502 if (port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS)
1503 /* if port is full duplex */
1504 port->aggregator->is_individual = false;
1506 port->aggregator->is_individual = true;
1508 port->aggregator->actor_admin_aggregator_key =
1509 port->actor_admin_port_key;
1510 port->aggregator->actor_oper_aggregator_key =
1511 port->actor_oper_port_key;
1512 port->aggregator->partner_system =
1513 port->partner_oper.system;
1514 port->aggregator->partner_system_priority =
1515 port->partner_oper.system_priority;
1516 port->aggregator->partner_oper_aggregator_key = port->partner_oper.key;
1517 port->aggregator->receive_state = 1;
1518 port->aggregator->transmit_state = 1;
1519 port->aggregator->lag_ports = port;
1520 port->aggregator->num_of_ports++;
1522 /* mark this port as selected */
1523 port->sm_vars |= AD_PORT_SELECTED;
1525 slave_dbg(bond->dev, port->slave->dev, "Port %d joined LAG %d (new LAG)\n",
1526 port->actor_port_number,
1527 port->aggregator->aggregator_identifier);
1529 slave_err(bond->dev, port->slave->dev,
1530 "Port %d did not find a suitable aggregator\n",
1531 port->actor_port_number);
1534 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE
1535 * in all aggregator's ports, else set ready=FALSE in all
1536 * aggregator's ports
1538 __set_agg_ports_ready(port->aggregator,
1539 __agg_ports_are_ready(port->aggregator));
1541 aggregator = __get_first_agg(port);
1542 ad_agg_selection_logic(aggregator, update_slave_arr);
1544 if (!port->aggregator->is_active)
1545 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
1548 /* Decide if "curr" is a better choice for the new active aggregator than
1549 * the current "best", according to the ad_select policy.
/* Compare two candidate aggregators and hand back the preferred one.
 *
 * The visible tests run in this order: individual vs. non-individual,
 * partner present vs. absent (__agg_has_partner()), then the selection mode
 * read from curr->lag_ports: active-port count first for the count policy,
 * bandwidth for BOND_AD_STABLE/BOND_AD_BANDWIDTH. An unknown mode triggers a
 * rate-limited warning.
 *
 * NOTE(review): the return statements, the "no best" check and some case
 * labels are not visible in this listing; which pointer each test returns is
 * described only by the numbered rules in the comment below.
 */
1551 static struct aggregator *ad_agg_selection_test(struct aggregator *best,
1552 struct aggregator *curr)
1554 /* 0. If no best, select current.
1556 * 1. If the current agg is not individual, and the best is
1557 * individual, select current.
1559 * 2. If current agg is individual and the best is not, keep best.
1561 * 3. Therefore, current and best are both individual or both not
1564 * 3a. If current agg partner replied, and best agg partner did not,
1567 * 3b. If current agg partner did not reply and best agg partner
1568 * did reply, keep best.
1570 * 4. Therefore, current and best both have partner replies or
1571 * both do not, so perform selection policy:
1573 * BOND_AD_COUNT: Select by count of ports. If count is equal,
1574 * select by bandwidth.
1576 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth.
1581 if (!curr->is_individual && best->is_individual)
1584 if (curr->is_individual && !best->is_individual)
1587 if (__agg_has_partner(curr) && !__agg_has_partner(best))
1590 if (!__agg_has_partner(curr) && __agg_has_partner(best))
1593 switch (__get_agg_selection_mode(curr->lag_ports)) {
1595 if (__agg_active_ports(curr) > __agg_active_ports(best))
1598 if (__agg_active_ports(curr) < __agg_active_ports(best))
1602 case BOND_AD_STABLE:
1603 case BOND_AD_BANDWIDTH:
1604 if (__get_agg_bandwidth(curr) > __get_agg_bandwidth(best))
1610 net_warn_ratelimited("%s: (slave %s): Impossible agg select mode %d\n",
1611 curr->slave->bond->dev->name,
1612 curr->slave->dev->name,
1613 __get_agg_selection_mode(curr->lag_ports));
/* Walk @agg's lag_ports list looking for a port whose slave device passes
 * both netif_running() and netif_carrier_ok().
 *
 * NOTE(review): the return statements are not visible in this listing;
 * presumably the result is non-zero when such a port exists and zero
 * otherwise - confirm against the full file.
 */
1620 static int agg_device_up(const struct aggregator *agg)
1622 struct port *port = agg->lag_ports;
1627 for (port = agg->lag_ports; port;
1628 port = port->next_port_in_aggregator) {
1629 if (netif_running(port->slave->dev) &&
1630 netif_carrier_ok(port->slave->dev))
1638 * ad_agg_selection_logic - select an aggregation group for a team
1639 * @aggregator: the aggregator we're looking at
1640 * @update_slave_arr: Does slave array need update?
1642 * It is assumed that only one aggregator may be selected for a team.
1644 * The logic of this function is to select the aggregator according to
1645 * the ad_select policy:
1647 * BOND_AD_STABLE: select the aggregator with the most ports attached to
1648 * it, and to reselect the active aggregator only if the previous
1649 * aggregator has no more ports related to it.
1651 * BOND_AD_BANDWIDTH: select the aggregator with the highest total
1652 * bandwidth, and reselect whenever a link state change takes place or the
1653 * set of slaves in the bond changes.
1655 * BOND_AD_COUNT: select the aggregator with largest number of ports
1656 * (slaves), and reselect whenever a link state change takes place or the
1657 * set of slaves in the bond changes.
1659 * FIXME: this function MUST be called with the first agg in the bond, or
1660 * __get_active_agg() won't work correctly. This function should be better
1661 * called with the bond itself, and retrieve the first agg from it.
/* Choose the bond's active aggregator and update port enablement.
 *
 * Steps visible below:
 *  - look up the currently active aggregator; it seeds "best" only when
 *    agg_device_up() holds for it;
 *  - feed every slave's aggregator that has active ports and is up through
 *    ad_agg_selection_test();
 *  - under BOND_AD_STABLE, keep the old active aggregator in the cases
 *    spelled out in the inline comment;
 *  - when a new best is chosen: log the candidates, warn if the winner is
 *    individual, mark it active, call __disable_port() on each port of the
 *    former active aggregator and set *update_slave_arr;
 *  - if the resulting active aggregator has no partner, __enable_port() is
 *    called on each of its ports;
 *  - finally bond_3ad_set_carrier() is called for the bond.
 *
 * NOTE(review): several conditions, assignments to "origin"/"port" and the
 * RCU locking (if any) are not visible in this listing.
 */
1663 static void ad_agg_selection_logic(struct aggregator *agg,
1664 bool *update_slave_arr)
1666 struct aggregator *best, *active, *origin;
1667 struct bonding *bond = agg->slave->bond;
1668 struct list_head *iter;
1669 struct slave *slave;
1674 active = __get_active_agg(agg);
1675 best = (active && agg_device_up(active)) ? active : NULL;
1677 bond_for_each_slave_rcu(bond, slave, iter) {
1678 agg = &(SLAVE_AD_INFO(slave)->aggregator);
1682 if (__agg_active_ports(agg) && agg_device_up(agg))
1683 best = ad_agg_selection_test(best, agg);
1687 __get_agg_selection_mode(best->lag_ports) == BOND_AD_STABLE) {
1688 /* For the STABLE policy, don't replace the old active
1689 * aggregator if it's still active (it has an answering
1690 * partner) or if both the best and active don't have an
1691 * answering partner.
1693 if (active && active->lag_ports &&
1694 __agg_active_ports(active) &&
1695 (__agg_has_partner(active) ||
1696 (!__agg_has_partner(active) &&
1697 !__agg_has_partner(best)))) {
1698 if (!(!active->actor_oper_aggregator_key &&
1699 best->actor_oper_aggregator_key)) {
1701 active->is_active = 1;
1706 if (best && (best == active)) {
1708 active->is_active = 1;
1711 /* if there is new best aggregator, activate it */
1713 netdev_dbg(bond->dev, "(slave %s): best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1714 best->slave ? best->slave->dev->name : "NULL",
1715 best->aggregator_identifier, best->num_of_ports,
1716 best->actor_oper_aggregator_key,
1717 best->partner_oper_aggregator_key,
1718 best->is_individual, best->is_active);
1719 netdev_dbg(bond->dev, "(slave %s): best ports %p slave %p\n",
1720 best->slave ? best->slave->dev->name : "NULL",
1721 best->lag_ports, best->slave);
1723 bond_for_each_slave_rcu(bond, slave, iter) {
1724 agg = &(SLAVE_AD_INFO(slave)->aggregator);
1726 slave_dbg(bond->dev, slave->dev, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1727 agg->aggregator_identifier, agg->num_of_ports,
1728 agg->actor_oper_aggregator_key,
1729 agg->partner_oper_aggregator_key,
1730 agg->is_individual, agg->is_active);
1733 /* check if any partner replies */
1734 if (best->is_individual)
1735 net_warn_ratelimited("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n",
1738 best->is_active = 1;
1739 netdev_dbg(bond->dev, "(slave %s): LAG %d chosen as the active LAG\n",
1740 best->slave ? best->slave->dev->name : "NULL",
1741 best->aggregator_identifier);
1742 netdev_dbg(bond->dev, "(slave %s): Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1743 best->slave ? best->slave->dev->name : "NULL",
1744 best->aggregator_identifier, best->num_of_ports,
1745 best->actor_oper_aggregator_key,
1746 best->partner_oper_aggregator_key,
1747 best->is_individual, best->is_active);
1749 /* disable the ports that were related to the former
1753 for (port = active->lag_ports; port;
1754 port = port->next_port_in_aggregator) {
1755 __disable_port(port);
1758 /* Slave array needs update. */
1759 *update_slave_arr = true;
1762 /* if the selected aggregator is of join individuals
1763 * (partner_system is NULL), enable their ports
1765 active = __get_active_agg(origin);
1768 if (!__agg_has_partner(active)) {
1769 for (port = active->lag_ports; port;
1770 port = port->next_port_in_aggregator) {
1771 __enable_port(port);
1778 bond_3ad_set_carrier(bond);
1782 * ad_clear_agg - clear a given aggregator's parameters
1783 * @aggregator: the aggregator we're looking at
/* Reset @aggregator's negotiated state so it can be reused: the individual
 * flag, admin/oper keys, partner system MAC, partner priority and key,
 * receive/transmit state, port list, active flag and port count are all
 * cleared. aggregator_identifier and slave are not modified here; they are
 * only read for the debug message.
 *
 * NOTE(review): any NULL guard on @aggregator is not visible in this
 * listing.
 */
1785 static void ad_clear_agg(struct aggregator *aggregator)
1788 aggregator->is_individual = false;
1789 aggregator->actor_admin_aggregator_key = 0;
1790 aggregator->actor_oper_aggregator_key = 0;
1791 eth_zero_addr(aggregator->partner_system.mac_addr_value);
1792 aggregator->partner_system_priority = 0;
1793 aggregator->partner_oper_aggregator_key = 0;
1794 aggregator->receive_state = 0;
1795 aggregator->transmit_state = 0;
1796 aggregator->lag_ports = NULL;
1797 aggregator->is_active = 0;
1798 aggregator->num_of_ports = 0;
1799 pr_debug("%s: LAG %d was cleared\n",
1801 aggregator->slave->dev->name : "NULL",
1802 aggregator->aggregator_identifier);
1807 * ad_initialize_agg - initialize a given aggregator's parameters
1808 * @aggregator: the aggregator we're looking at
/* Full reset of @aggregator: everything ad_clear_agg() clears, plus the
 * aggregator MAC address (zeroed), the aggregator identifier (0) and the
 * slave back-pointer (NULL).
 *
 * NOTE(review): any NULL guard on @aggregator is not visible in this
 * listing.
 */
1810 static void ad_initialize_agg(struct aggregator *aggregator)
1813 ad_clear_agg(aggregator);
1815 eth_zero_addr(aggregator->aggregator_mac_address.mac_addr_value);
1816 aggregator->aggregator_identifier = 0;
1817 aggregator->slave = NULL;
1822 * ad_initialize_port - initialize a given port's parameters
1823 * @port: the port we're looking at
1824 * @lacp_fast: boolean. whether fast periodic should be used
/* Put @port into its initial 802.3ad state.
 *
 * Actor priority is 0xff with no aggregator assigned; actor admin and oper
 * state both start as AGGREGATION | LACP_ACTIVITY. The static "tmpl" partner
 * defaults are copied into both partner_admin and partner_oper. The port is
 * marked enabled, sm_vars starts as BEGIN | LACP_ENABLED, every state
 * machine state, timer and churn counter is zeroed, and the static LACPDU
 * template is copied into port->lacpdu.
 *
 * NOTE(review): the statement that sets AD_STATE_LACP_TIMEOUT is presumably
 * conditional on @lacp_fast; the condition, some template fields and any
 * NULL guard on @port are not visible in this listing.
 */
1826 static void ad_initialize_port(struct port *port, int lacp_fast)
1828 static const struct port_params tmpl = {
1829 .system_priority = 0xffff,
1832 .port_priority = 0xff,
1835 static const struct lacpdu lacpdu = {
1837 .version_number = 0x01,
1838 .tlv_type_actor_info = 0x01,
1839 .actor_information_length = 0x14,
1840 .tlv_type_partner_info = 0x02,
1841 .partner_information_length = 0x14,
1842 .tlv_type_collector_info = 0x03,
1843 .collector_information_length = 0x10,
1844 .collector_max_delay = htons(AD_COLLECTOR_MAX_DELAY),
1848 port->actor_port_priority = 0xff;
1849 port->actor_port_aggregator_identifier = 0;
1851 port->actor_admin_port_state = AD_STATE_AGGREGATION |
1852 AD_STATE_LACP_ACTIVITY;
1853 port->actor_oper_port_state = AD_STATE_AGGREGATION |
1854 AD_STATE_LACP_ACTIVITY;
1857 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
1859 memcpy(&port->partner_admin, &tmpl, sizeof(tmpl));
1860 memcpy(&port->partner_oper, &tmpl, sizeof(tmpl));
1862 port->is_enabled = true;
1863 /* private parameters */
1864 port->sm_vars = AD_PORT_BEGIN | AD_PORT_LACP_ENABLED;
1865 port->sm_rx_state = 0;
1866 port->sm_rx_timer_counter = 0;
1867 port->sm_periodic_state = 0;
1868 port->sm_periodic_timer_counter = 0;
1869 port->sm_mux_state = 0;
1870 port->sm_mux_timer_counter = 0;
1871 port->sm_tx_state = 0;
1872 port->aggregator = NULL;
1873 port->next_port_in_aggregator = NULL;
1874 port->transaction_id = 0;
1876 port->sm_churn_actor_timer_counter = 0;
1877 port->sm_churn_actor_state = 0;
1878 port->churn_actor_count = 0;
1879 port->sm_churn_partner_timer_counter = 0;
1880 port->sm_churn_partner_state = 0;
1881 port->churn_partner_count = 0;
1883 memcpy(&port->lacpdu, &lacpdu, sizeof(lacpdu));
1888 * ad_enable_collecting_distributing - enable a port's transmit/receive
1889 * @port: the port we're looking at
1890 * @update_slave_arr: Does slave array need update?
1892 * Enable @port if it's in an active aggregator
/* Enable @port with __enable_port() and set *update_slave_arr, but only when
 * the port's aggregator is the active one.
 *
 * NOTE(review): port->aggregator is dereferenced here without a NULL check,
 * unlike ad_disable_collecting_distributing(); callers presumably guarantee
 * the port is attached - confirm.
 */
1894 static void ad_enable_collecting_distributing(struct port *port,
1895 bool *update_slave_arr)
1897 if (port->aggregator->is_active) {
1898 slave_dbg(port->slave->bond->dev, port->slave->dev,
1899 "Enabling port %d (LAG %d)\n",
1900 port->actor_port_number,
1901 port->aggregator->aggregator_identifier);
1902 __enable_port(port);
1903 /* Slave array needs update */
1904 *update_slave_arr = true;
1909 * ad_disable_collecting_distributing - disable a port's transmit/receive
1910 * @port: the port we're looking at
1911 * @update_slave_arr: Does slave array need update?
/* Disable @port with __disable_port() and set *update_slave_arr. This only
 * happens when the port has an aggregator and that aggregator's
 * partner_system is not the null MAC address; otherwise the call is a no-op.
 */
1913 static void ad_disable_collecting_distributing(struct port *port,
1914 bool *update_slave_arr)
1916 if (port->aggregator &&
1917 !MAC_ADDRESS_EQUAL(&(port->aggregator->partner_system),
1918 &(null_mac_addr))) {
1919 slave_dbg(port->slave->bond->dev, port->slave->dev,
1920 "Disabling port %d (LAG %d)\n",
1921 port->actor_port_number,
1922 port->aggregator->aggregator_identifier);
1923 __disable_port(port);
1924 /* Slave array needs an update */
1925 *update_slave_arr = true;
1930 * ad_marker_info_received - handle receive of a Marker information frame
1931 * @marker_info: Marker info received
1932 * @port: the port we're looking at
/* Answer a received Marker Information frame.
 *
 * The marker_rx counters of the slave and of the bond are incremented, the
 * received frame is copied into a local response, its tlv_type is rewritten
 * to AD_MARKER_RESPONSE_SUBTYPE and the response is sent with
 * ad_marker_send(); a non-negative return is logged as success.
 *
 * NOTE(review): the second line of the parameter list (the port argument)
 * is not visible in this listing.
 */
1934 static void ad_marker_info_received(struct bond_marker *marker_info,
1937 struct bond_marker marker;
1939 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.marker_rx);
1940 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.marker_rx);
1942 /* copy the received marker data to the response marker */
1943 memcpy(&marker, marker_info, sizeof(struct bond_marker));
1944 /* change the marker subtype to marker response */
1945 marker.tlv_type = AD_MARKER_RESPONSE_SUBTYPE;
1947 /* send the marker response */
1948 if (ad_marker_send(port, &marker) >= 0)
1949 slave_dbg(port->slave->bond->dev, port->slave->dev,
1950 "Sent Marker Response on port %d\n",
1951 port->actor_port_number);
1955 * ad_marker_response_received - handle receive of a marker response frame
1956 * @marker: marker PDU received
1957 * @port: the port we're looking at
1959 * This function does nothing since we decided not to implement send and handle
1960 * response for marker PDU's, in this stage, but only to respond to marker
/* Account for a received Marker Response: only the marker_resp_rx counters
 * of the slave and of the bond are incremented; the frame contents in
 * @marker are not examined.
 */
1963 static void ad_marker_response_received(struct bond_marker *marker,
1966 atomic64_inc(&SLAVE_AD_INFO(port->slave)->stats.marker_resp_rx);
1967 atomic64_inc(&BOND_AD_INFO(port->slave->bond).stats.marker_resp_rx);
1969 /* DO NOTHING, SINCE WE DECIDED NOT TO IMPLEMENT THIS FEATURE FOR NOW */
1972 /* ========= AD exported functions to the main bonding code ========= */
1974 /* Check aggregator status in the team every T seconds; bond_3ad_initialize() multiplies this value to arm the aggregator selection timer. */
1975 #define AD_AGGREGATOR_SELECTION_TIMER 8
1978 * bond_3ad_initiate_agg_selection - initiate aggregator selection
1979 * @bond: bonding struct
1981 * Set the aggregation selection timer, to initiate an agg selection in
1982 * the very near future. Called during first initialization, and during
1983 * any down to up transitions of the bond.
/* Store @timeout in the bond's agg_select_timer field. */
1985 void bond_3ad_initiate_agg_selection(struct bonding *bond, int timeout)
1987 BOND_AD_INFO(bond).agg_select_timer = timeout;
1991 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures
1992 * @bond: bonding struct to work on
1993 * @tick_resolution: number of state-machine ticks per second (stored in ad_ticks_per_sec)
1995 * Can be called only after the mac address of the bond is set.
/* Set up the bond-wide 802.3ad system parameters.
 *
 * The body runs only when the stored system MAC differs from the bond
 * device's dev_addr. It resets the aggregator identifier counter, takes the
 * system priority from params.ad_actor_sys_prio, and uses the bond device
 * address as system MAC when params.ad_actor_system is all zero, with
 * params.ad_actor_system as the alternative. @tick_resolution is stored in
 * ad_ticks_per_sec, and aggregator selection is armed through
 * bond_3ad_initiate_agg_selection().
 *
 * NOTE(review): the else line and the second factor of the selection timeout
 * are not visible in this listing.
 */
1997 void bond_3ad_initialize(struct bonding *bond, u16 tick_resolution)
1999 /* check that the bond is not initialized yet */
2000 if (!MAC_ADDRESS_EQUAL(&(BOND_AD_INFO(bond).system.sys_mac_addr),
2001 bond->dev->dev_addr)) {
2003 BOND_AD_INFO(bond).aggregator_identifier = 0;
2005 BOND_AD_INFO(bond).system.sys_priority =
2006 bond->params.ad_actor_sys_prio;
2007 if (is_zero_ether_addr(bond->params.ad_actor_system))
2008 BOND_AD_INFO(bond).system.sys_mac_addr =
2009 *((struct mac_addr *)bond->dev->dev_addr);
2011 BOND_AD_INFO(bond).system.sys_mac_addr =
2012 *((struct mac_addr *)bond->params.ad_actor_system);
2014 /* initialize how many times this module is called in one
2015 * second (should be about every 100ms)
2017 ad_ticks_per_sec = tick_resolution;
2019 bond_3ad_initiate_agg_selection(bond,
2020 AD_AGGREGATOR_SELECTION_TIMER *
2026 * bond_3ad_bind_slave - initialize a slave's port
2027 * @slave: slave struct to work on
2029 * This function does not return a value.
/* Initialize the port and aggregator embedded in @slave's AD info.
 *
 * Nothing is done when port.slave already points at @slave. Otherwise the
 * port is reset with ad_initialize_port() using the bond's lacp_fast
 * setting, bound to the slave, given the slave's AD id as its port number
 * and an admin key derived from params.ad_user_port_key (shifted left by 6),
 * has its keys and actor system refreshed, gets its tx timer loaded, and is
 * disabled. The slave's aggregator is then reset with ad_initialize_agg(),
 * assigned the bond device MAC and the next value of the bond-wide
 * aggregator_identifier counter (pre-incremented), and bound to the slave.
 *
 * NOTE(review): the declaration of "port" is not visible in this listing.
 */
2032 void bond_3ad_bind_slave(struct slave *slave)
2034 struct bonding *bond = bond_get_bond_by_slave(slave);
2036 struct aggregator *aggregator;
2038 /* check that the slave has not been initialized yet. */
2039 if (SLAVE_AD_INFO(slave)->port.slave != slave) {
2041 /* port initialization */
2042 port = &(SLAVE_AD_INFO(slave)->port);
2044 ad_initialize_port(port, bond->params.lacp_fast);
2046 port->slave = slave;
2047 port->actor_port_number = SLAVE_AD_INFO(slave)->id;
2048 /* key is determined according to the link speed, duplex and
2051 port->actor_admin_port_key = bond->params.ad_user_port_key << 6;
2052 ad_update_actor_keys(port, false);
2053 /* actor system is the bond's system */
2054 __ad_actor_update_port(port);
2055 /* tx timer(to verify that no more than MAX_TX_IN_SECOND
2056 * lacpdu's are sent in one second)
2058 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
2060 __disable_port(port);
2062 /* aggregator initialization */
2063 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
2065 ad_initialize_agg(aggregator);
2067 aggregator->aggregator_mac_address = *((struct mac_addr *)bond->dev->dev_addr);
2068 aggregator->aggregator_identifier = ++BOND_AD_INFO(bond).aggregator_identifier;
2069 aggregator->slave = slave;
2070 aggregator->is_active = 0;
2071 aggregator->num_of_ports = 0;
2076 * bond_3ad_unbind_slave - deinitialize a slave's port
2077 * @slave: slave struct to work on
2079 * Search for the aggregator that is related to this port, remove the
2080 * aggregator and assign another aggregator for other port related to it
2081 * (if any), and remove the port.
2083 void bond_3ad_unbind_slave(struct slave *slave)
2085 struct port *port, *prev_port, *temp_port;
2086 struct aggregator *aggregator, *new_aggregator, *temp_aggregator;
2087 int select_new_active_agg = 0;
2088 struct bonding *bond = slave->bond;
2089 struct slave *slave_iter;
2090 struct list_head *iter;
2091 bool dummy_slave_update; /* Ignore this value as caller updates array */
2093 /* Sync against bond_3ad_state_machine_handler() */
2094 spin_lock_bh(&bond->mode_lock);
2095 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
2096 port = &(SLAVE_AD_INFO(slave)->port);
2098 /* if slave is null, the whole port is not initialized */
2100 slave_warn(bond->dev, slave->dev, "Trying to unbind an uninitialized port\n");
2104 slave_dbg(bond->dev, slave->dev, "Unbinding Link Aggregation Group %d\n",
2105 aggregator->aggregator_identifier);
2107 /* Tell the partner that this port is not suitable for aggregation */
2108 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
2109 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
2110 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
2111 port->actor_oper_port_state &= ~AD_STATE_AGGREGATION;
2112 __update_lacpdu_from_port(port);
2113 ad_lacpdu_send(port);
2115 /* check if this aggregator is occupied */
2116 if (aggregator->lag_ports) {
2117 /* check if there are other ports related to this aggregator
2118 * except the port related to this slave(thats ensure us that
2119 * there is a reason to search for new aggregator, and that we
2122 if ((aggregator->lag_ports != port) ||
2123 (aggregator->lag_ports->next_port_in_aggregator)) {
2124 /* find new aggregator for the related port(s) */
2125 bond_for_each_slave(bond, slave_iter, iter) {
2126 new_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
2127 /* if the new aggregator is empty, or it is
2128 * connected to our port only
2130 if (!new_aggregator->lag_ports ||
2131 ((new_aggregator->lag_ports == port) &&
2132 !new_aggregator->lag_ports->next_port_in_aggregator))
2136 new_aggregator = NULL;
2138 /* if new aggregator found, copy the aggregator's
2139 * parameters and connect the related lag_ports to the
2142 if ((new_aggregator) && ((!new_aggregator->lag_ports) || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator))) {
2143 slave_dbg(bond->dev, slave->dev, "Some port(s) related to LAG %d - replacing with LAG %d\n",
2144 aggregator->aggregator_identifier,
2145 new_aggregator->aggregator_identifier);
2147 if ((new_aggregator->lag_ports == port) &&
2148 new_aggregator->is_active) {
2149 slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
2150 select_new_active_agg = 1;
2153 new_aggregator->is_individual = aggregator->is_individual;
2154 new_aggregator->actor_admin_aggregator_key = aggregator->actor_admin_aggregator_key;
2155 new_aggregator->actor_oper_aggregator_key = aggregator->actor_oper_aggregator_key;
2156 new_aggregator->partner_system = aggregator->partner_system;
2157 new_aggregator->partner_system_priority = aggregator->partner_system_priority;
2158 new_aggregator->partner_oper_aggregator_key = aggregator->partner_oper_aggregator_key;
2159 new_aggregator->receive_state = aggregator->receive_state;
2160 new_aggregator->transmit_state = aggregator->transmit_state;
2161 new_aggregator->lag_ports = aggregator->lag_ports;
2162 new_aggregator->is_active = aggregator->is_active;
2163 new_aggregator->num_of_ports = aggregator->num_of_ports;
2165 /* update the information that is written on
2166 * the ports about the aggregator
2168 for (temp_port = aggregator->lag_ports; temp_port;
2169 temp_port = temp_port->next_port_in_aggregator) {
2170 temp_port->aggregator = new_aggregator;
2171 temp_port->actor_port_aggregator_identifier = new_aggregator->aggregator_identifier;
2174 ad_clear_agg(aggregator);
2176 if (select_new_active_agg)
2177 ad_agg_selection_logic(__get_first_agg(port),
2178 &dummy_slave_update);
2180 slave_warn(bond->dev, slave->dev, "unbinding aggregator, and could not find a new aggregator for its ports\n");
2183 /* in case that the only port related to this
2184 * aggregator is the one we want to remove
2186 select_new_active_agg = aggregator->is_active;
2187 ad_clear_agg(aggregator);
2188 if (select_new_active_agg) {
2189 slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
2190 /* select new active aggregator */
2191 temp_aggregator = __get_first_agg(port);
2192 if (temp_aggregator)
2193 ad_agg_selection_logic(temp_aggregator,
2194 &dummy_slave_update);
2199 slave_dbg(bond->dev, slave->dev, "Unbinding port %d\n", port->actor_port_number);
2201 /* find the aggregator that this port is connected to */
2202 bond_for_each_slave(bond, slave_iter, iter) {
2203 temp_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
2205 /* search the port in the aggregator's related ports */
2206 for (temp_port = temp_aggregator->lag_ports; temp_port;
2207 prev_port = temp_port,
2208 temp_port = temp_port->next_port_in_aggregator) {
2209 if (temp_port == port) {
2210 /* the aggregator found - detach the port from
2214 prev_port->next_port_in_aggregator = temp_port->next_port_in_aggregator;
2216 temp_aggregator->lag_ports = temp_port->next_port_in_aggregator;
2217 temp_aggregator->num_of_ports--;
2218 if (__agg_active_ports(temp_aggregator) == 0) {
2219 select_new_active_agg = temp_aggregator->is_active;
2220 ad_clear_agg(temp_aggregator);
2221 if (select_new_active_agg) {
2222 slave_info(bond->dev, slave->dev, "Removing an active aggregator\n");
2223 /* select new active aggregator */
2224 ad_agg_selection_logic(__get_first_agg(port),
2225 &dummy_slave_update);
2235 spin_unlock_bh(&bond->mode_lock);
2239 * bond_3ad_update_ad_actor_settings - reflect change of actor settings to ports
2240 * @bond: bonding struct to work on
2242 * If an ad_actor setting gets changed we need to update the individual port
2243 * settings so the bond device will use the new values when it gets upped.
2245 void bond_3ad_update_ad_actor_settings(struct bonding *bond)
2247 struct list_head *iter;
2248 struct slave *slave;
2252 BOND_AD_INFO(bond).system.sys_priority = bond->params.ad_actor_sys_prio;
2253 if (is_zero_ether_addr(bond->params.ad_actor_system))
2254 BOND_AD_INFO(bond).system.sys_mac_addr =
2255 *((struct mac_addr *)bond->dev->dev_addr);
2257 BOND_AD_INFO(bond).system.sys_mac_addr =
2258 *((struct mac_addr *)bond->params.ad_actor_system);
2260 spin_lock_bh(&bond->mode_lock);
2261 bond_for_each_slave(bond, slave, iter) {
2262 struct port *port = &(SLAVE_AD_INFO(slave))->port;
2264 __ad_actor_update_port(port);
2267 spin_unlock_bh(&bond->mode_lock);
2271 * bond_3ad_state_machine_handler - handle state machines timeout
2272 * @bond: bonding struct to work on
2274 * The state machine handling concept in this module is to check every tick
2275 * which state machine should operate any function. The execution order is
2276 * round robin, so when we have an interaction between state machines, the
2277 * reply of one to each other might be delayed until next tick.
2279 * This function also complete the initialization when the agg_select_timer
2280 * times out, and it selects an aggregator for the ports that are yet not
2281 * related to any aggregator, and selects the active aggregator for a bond.
2283 void bond_3ad_state_machine_handler(struct work_struct *work)
2285 struct bonding *bond = container_of(work, struct bonding,
2287 struct aggregator *aggregator;
2288 struct list_head *iter;
2289 struct slave *slave;
2291 bool should_notify_rtnl = BOND_SLAVE_NOTIFY_LATER;
2292 bool update_slave_arr = false;
2294 /* Lock to protect data accessed by all (e.g., port->sm_vars) and
2295 * against running with bond_3ad_unbind_slave. ad_rx_machine may run
2296 * concurrently due to incoming LACPDU as well.
2298 spin_lock_bh(&bond->mode_lock);
2301 /* check if there are any slaves */
2302 if (!bond_has_slaves(bond))
2305 /* check if agg_select_timer timer after initialize is timed out */
2306 if (BOND_AD_INFO(bond).agg_select_timer &&
2307 !(--BOND_AD_INFO(bond).agg_select_timer)) {
2308 slave = bond_first_slave_rcu(bond);
2309 port = slave ? &(SLAVE_AD_INFO(slave)->port) : NULL;
2311 /* select the active aggregator for the bond */
2314 net_warn_ratelimited("%s: Warning: bond's first port is uninitialized\n",
2319 aggregator = __get_first_agg(port);
2320 ad_agg_selection_logic(aggregator, &update_slave_arr);
2322 bond_3ad_set_carrier(bond);
2325 /* for each port run the state machines */
2326 bond_for_each_slave_rcu(bond, slave, iter) {
2327 port = &(SLAVE_AD_INFO(slave)->port);
2329 net_warn_ratelimited("%s: Warning: Found an uninitialized port\n",
2334 ad_rx_machine(NULL, port);
2335 ad_periodic_machine(port);
2336 ad_port_selection_logic(port, &update_slave_arr);
2337 ad_mux_machine(port, &update_slave_arr);
2338 ad_tx_machine(port);
2339 ad_churn_machine(port);
2341 /* turn off the BEGIN bit, since we already handled it */
2342 if (port->sm_vars & AD_PORT_BEGIN)
2343 port->sm_vars &= ~AD_PORT_BEGIN;
2347 bond_for_each_slave_rcu(bond, slave, iter) {
2348 if (slave->should_notify) {
2349 should_notify_rtnl = BOND_SLAVE_NOTIFY_NOW;
2354 spin_unlock_bh(&bond->mode_lock);
2356 if (update_slave_arr)
2357 bond_slave_arr_work_rearm(bond, 0);
2359 if (should_notify_rtnl && rtnl_trylock()) {
2360 bond_slave_state_notify(bond);
2363 queue_delayed_work(bond->wq, &bond->ad_work, ad_delta_in_ticks);
2367 * bond_3ad_rx_indication - handle a received frame
2368 * @lacpdu: received lacpdu
2369 * @slave: slave struct to work on
2371 * It is assumed that frames that were sent on this NIC don't returned as new
2372 * received frames (loopback). Since only the payload is given to this
2373 * function, it check for loopback.
2375 static int bond_3ad_rx_indication(struct lacpdu *lacpdu, struct slave *slave)
2377 struct bonding *bond = slave->bond;
2378 int ret = RX_HANDLER_ANOTHER;
2379 struct bond_marker *marker;
2383 port = &(SLAVE_AD_INFO(slave)->port);
2385 net_warn_ratelimited("%s: Warning: port of slave %s is uninitialized\n",
2386 slave->dev->name, slave->bond->dev->name);
2390 switch (lacpdu->subtype) {
2391 case AD_TYPE_LACPDU:
2392 ret = RX_HANDLER_CONSUMED;
2393 slave_dbg(slave->bond->dev, slave->dev,
2394 "Received LACPDU on port %d\n",
2395 port->actor_port_number);
2396 /* Protect against concurrent state machines */
2397 spin_lock(&slave->bond->mode_lock);
2398 ad_rx_machine(lacpdu, port);
2399 spin_unlock(&slave->bond->mode_lock);
2401 case AD_TYPE_MARKER:
2402 ret = RX_HANDLER_CONSUMED;
2403 /* No need to convert fields to Little Endian since we
2404 * don't use the marker's fields.
2406 marker = (struct bond_marker *)lacpdu;
2407 switch (marker->tlv_type) {
2408 case AD_MARKER_INFORMATION_SUBTYPE:
2409 slave_dbg(slave->bond->dev, slave->dev, "Received Marker Information on port %d\n",
2410 port->actor_port_number);
2411 ad_marker_info_received(marker, port);
2413 case AD_MARKER_RESPONSE_SUBTYPE:
2414 slave_dbg(slave->bond->dev, slave->dev, "Received Marker Response on port %d\n",
2415 port->actor_port_number);
2416 ad_marker_response_received(marker, port);
2419 slave_dbg(slave->bond->dev, slave->dev, "Received an unknown Marker subtype on port %d\n",
2420 port->actor_port_number);
2421 stat = &SLAVE_AD_INFO(slave)->stats.marker_unknown_rx;
2423 stat = &BOND_AD_INFO(bond).stats.marker_unknown_rx;
2428 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_unknown_rx);
2429 atomic64_inc(&BOND_AD_INFO(bond).stats.lacpdu_unknown_rx);
2436 * ad_update_actor_keys - Update the oper / admin keys for a port based on
2437 * its current speed and duplex settings.
2439 * @port: the port we'are looking at
2440 * @reset: Boolean to just reset the speed and the duplex part of the key
2442 * The logic to change the oper / admin keys is:
2443 * (a) A full duplex port can participate in LACP with partner.
2444 * (b) When the speed is changed, LACP need to be reinitiated.
2446 static void ad_update_actor_keys(struct port *port, bool reset)
2449 u16 ospeed = 0, speed = 0;
2450 u16 old_oper_key = port->actor_oper_port_key;
2452 port->actor_admin_port_key &= ~(AD_SPEED_KEY_MASKS|AD_DUPLEX_KEY_MASKS);
2454 speed = __get_link_speed(port);
2455 ospeed = (old_oper_key & AD_SPEED_KEY_MASKS) >> 1;
2456 duplex = __get_duplex(port);
2457 port->actor_admin_port_key |= (speed << 1) | duplex;
2459 port->actor_oper_port_key = port->actor_admin_port_key;
2461 if (old_oper_key != port->actor_oper_port_key) {
2462 /* Only 'duplex' port participates in LACP */
2464 port->sm_vars |= AD_PORT_LACP_ENABLED;
2466 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
2470 slave_err(port->slave->bond->dev,
2472 "speed changed to 0 on port %d\n",
2473 port->actor_port_number);
2474 } else if (duplex && ospeed != speed) {
2475 /* Speed change restarts LACP state-machine */
2476 port->sm_vars |= AD_PORT_BEGIN;
2483 * bond_3ad_adapter_speed_duplex_changed - handle a slave's speed / duplex
2486 * @slave: slave struct to work on
2488 * Handle reselection of aggregator (if needed) for this port.
2490 void bond_3ad_adapter_speed_duplex_changed(struct slave *slave)
2494 port = &(SLAVE_AD_INFO(slave)->port);
2496 /* if slave is null, the whole port is not initialized */
2498 slave_warn(slave->bond->dev, slave->dev,
2499 "speed/duplex changed for uninitialized port\n");
2503 spin_lock_bh(&slave->bond->mode_lock);
2504 ad_update_actor_keys(port, false);
2505 spin_unlock_bh(&slave->bond->mode_lock);
2506 slave_dbg(slave->bond->dev, slave->dev, "Port %d changed speed/duplex\n",
2507 port->actor_port_number);
2511 * bond_3ad_handle_link_change - handle a slave's link status change indication
2512 * @slave: slave struct to work on
2513 * @status: whether the link is now up or down
2515 * Handle reselection of aggregator (if needed) for this port.
2517 void bond_3ad_handle_link_change(struct slave *slave, char link)
2519 struct aggregator *agg;
2523 port = &(SLAVE_AD_INFO(slave)->port);
2525 /* if slave is null, the whole port is not initialized */
2527 slave_warn(slave->bond->dev, slave->dev, "link status changed for uninitialized port\n");
2531 spin_lock_bh(&slave->bond->mode_lock);
2532 /* on link down we are zeroing duplex and speed since
2533 * some of the adaptors(ce1000.lan) report full duplex/speed
2534 * instead of N/A(duplex) / 0(speed).
2536 * on link up we are forcing recheck on the duplex and speed since
2537 * some of he adaptors(ce1000.lan) report.
2539 if (link == BOND_LINK_UP) {
2540 port->is_enabled = true;
2541 ad_update_actor_keys(port, false);
2543 /* link has failed */
2544 port->is_enabled = false;
2545 ad_update_actor_keys(port, true);
2547 agg = __get_first_agg(port);
2548 ad_agg_selection_logic(agg, &dummy);
2550 spin_unlock_bh(&slave->bond->mode_lock);
2552 slave_dbg(slave->bond->dev, slave->dev, "Port %d changed link status to %s\n",
2553 port->actor_port_number,
2554 link == BOND_LINK_UP ? "UP" : "DOWN");
2556 /* RTNL is held and mode_lock is released so it's safe
2557 * to update slave_array here.
2559 bond_update_slave_arr(slave->bond, NULL);
2563 * bond_3ad_set_carrier - set link state for bonding master
2564 * @bond - bonding structure
2566 * if we have an active aggregator, we're up, if not, we're down.
2567 * Presumes that we cannot have an active aggregator if there are
2568 * no slaves with link up.
2570 * This behavior complies with IEEE 802.3 section 43.3.9.
2572 * Called by bond_set_carrier(). Return zero if carrier state does not
2573 * change, nonzero if it does.
2575 int bond_3ad_set_carrier(struct bonding *bond)
2577 struct aggregator *active;
2578 struct slave *first_slave;
2582 first_slave = bond_first_slave_rcu(bond);
2587 active = __get_active_agg(&(SLAVE_AD_INFO(first_slave)->aggregator));
2589 /* are enough slaves available to consider link up? */
2590 if (__agg_active_ports(active) < bond->params.min_links) {
2591 if (netif_carrier_ok(bond->dev)) {
2592 netif_carrier_off(bond->dev);
2595 } else if (!netif_carrier_ok(bond->dev)) {
2596 netif_carrier_on(bond->dev);
2599 } else if (netif_carrier_ok(bond->dev)) {
2600 netif_carrier_off(bond->dev);
2608 * __bond_3ad_get_active_agg_info - get information of the active aggregator
2609 * @bond: bonding struct to work on
2610 * @ad_info: ad_info struct to fill with the bond's info
2612 * Returns: 0 on success
2615 int __bond_3ad_get_active_agg_info(struct bonding *bond,
2616 struct ad_info *ad_info)
2618 struct aggregator *aggregator = NULL;
2619 struct list_head *iter;
2620 struct slave *slave;
2623 bond_for_each_slave_rcu(bond, slave, iter) {
2624 port = &(SLAVE_AD_INFO(slave)->port);
2625 if (port->aggregator && port->aggregator->is_active) {
2626 aggregator = port->aggregator;
2634 ad_info->aggregator_id = aggregator->aggregator_identifier;
2635 ad_info->ports = __agg_active_ports(aggregator);
2636 ad_info->actor_key = aggregator->actor_oper_aggregator_key;
2637 ad_info->partner_key = aggregator->partner_oper_aggregator_key;
2638 ether_addr_copy(ad_info->partner_system,
2639 aggregator->partner_system.mac_addr_value);
/**
 * bond_3ad_get_active_agg_info - get information of the active aggregator
 * @bond: bonding struct to work on
 * @ad_info: ad_info struct to fill with the bond's info
 *
 * Wrapper around __bond_3ad_get_active_agg_info() that supplies the RCU
 * read-side section the slave walk needs.
 *
 * Return: whatever __bond_3ad_get_active_agg_info() returns.
 */
int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info)
{
	int ret;

	/* NOTE(review): RCU lock/unlock pair restored from gaps in the damaged
	 * source - confirm against the reference tree.
	 */
	rcu_read_lock();
	ret = __bond_3ad_get_active_agg_info(bond, ad_info);
	rcu_read_unlock();

	return ret;
}
2654 int bond_3ad_lacpdu_recv(const struct sk_buff *skb, struct bonding *bond,
2655 struct slave *slave)
2657 struct lacpdu *lacpdu, _lacpdu;
2659 if (skb->protocol != PKT_TYPE_LACPDU)
2660 return RX_HANDLER_ANOTHER;
2662 if (!MAC_ADDRESS_EQUAL(eth_hdr(skb)->h_dest, lacpdu_mcast_addr))
2663 return RX_HANDLER_ANOTHER;
2665 lacpdu = skb_header_pointer(skb, 0, sizeof(_lacpdu), &_lacpdu);
2667 atomic64_inc(&SLAVE_AD_INFO(slave)->stats.lacpdu_illegal_rx);
2668 atomic64_inc(&BOND_AD_INFO(bond).stats.lacpdu_illegal_rx);
2669 return RX_HANDLER_ANOTHER;
2672 return bond_3ad_rx_indication(lacpdu, slave);
2676 * bond_3ad_update_lacp_rate - change the lacp rate
2677 * @bond - bonding struct
2679 * When modify lacp_rate parameter via sysfs,
2680 * update actor_oper_port_state of each port.
2682 * Hold bond->mode_lock,
2683 * so we can modify port->actor_oper_port_state,
2684 * no matter bond is up or down.
2686 void bond_3ad_update_lacp_rate(struct bonding *bond)
2688 struct port *port = NULL;
2689 struct list_head *iter;
2690 struct slave *slave;
2693 lacp_fast = bond->params.lacp_fast;
2694 spin_lock_bh(&bond->mode_lock);
2695 bond_for_each_slave(bond, slave, iter) {
2696 port = &(SLAVE_AD_INFO(slave)->port);
2698 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
2700 port->actor_oper_port_state &= ~AD_STATE_LACP_TIMEOUT;
2702 spin_unlock_bh(&bond->mode_lock);
2705 size_t bond_3ad_stats_size(void)
2707 return nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_RX */
2708 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_TX */
2709 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_UNKNOWN_RX */
2710 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_ILLEGAL_RX */
2711 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RX */
2712 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_TX */
2713 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RESP_RX */
2714 nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_MARKER_RESP_TX */
2715 nla_total_size_64bit(sizeof(u64)); /* BOND_3AD_STAT_MARKER_UNKNOWN_RX */
2718 int bond_3ad_stats_fill(struct sk_buff *skb, struct bond_3ad_stats *stats)
2722 val = atomic64_read(&stats->lacpdu_rx);
2723 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_RX, val,
2726 val = atomic64_read(&stats->lacpdu_tx);
2727 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_TX, val,
2730 val = atomic64_read(&stats->lacpdu_unknown_rx);
2731 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_UNKNOWN_RX, val,
2734 val = atomic64_read(&stats->lacpdu_illegal_rx);
2735 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_LACPDU_ILLEGAL_RX, val,
2739 val = atomic64_read(&stats->marker_rx);
2740 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RX, val,
2743 val = atomic64_read(&stats->marker_tx);
2744 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_TX, val,
2747 val = atomic64_read(&stats->marker_resp_rx);
2748 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RESP_RX, val,
2751 val = atomic64_read(&stats->marker_resp_tx);
2752 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_RESP_TX, val,
2755 val = atomic64_read(&stats->marker_unknown_rx);
2756 if (nla_put_u64_64bit(skb, BOND_3AD_STAT_MARKER_UNKNOWN_RX, val,