2 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms of the GNU General Public License as published by the Free
6 * Software Foundation; either version 2 of the License, or (at your option)
9 * This program is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
14 * You should have received a copy of the GNU General Public License along with
15 * this program; if not, write to the Free Software Foundation, Inc., 59
16 * Temple Place - Suite 330, Boston, MA 02111-1307, USA.
18 * The full GNU General Public License is included in this distribution in the
19 * file called LICENSE.
23 #include <linux/skbuff.h>
24 #include <linux/if_ether.h>
25 #include <linux/netdevice.h>
26 #include <linux/spinlock.h>
27 #include <linux/ethtool.h>
28 #include <linux/etherdevice.h>
29 #include <linux/if_bonding.h>
30 #include <linux/pkt_sched.h>
31 #include <net/net_namespace.h>
32 #include <net/bonding.h>
33 #include <net/bond_3ad.h>
35 /* General definitions */
36 #define AD_SHORT_TIMEOUT 1
37 #define AD_LONG_TIMEOUT 0
38 #define AD_STANDBY 0x2
39 #define AD_MAX_TX_IN_SECOND 3
40 #define AD_COLLECTOR_MAX_DELAY 0
42 /* Timer definitions (43.4.4 in the 802.3ad standard) */
43 #define AD_FAST_PERIODIC_TIME 1
44 #define AD_SLOW_PERIODIC_TIME 30
45 #define AD_SHORT_TIMEOUT_TIME (3*AD_FAST_PERIODIC_TIME)
46 #define AD_LONG_TIMEOUT_TIME (3*AD_SLOW_PERIODIC_TIME)
47 #define AD_CHURN_DETECTION_TIME 60
48 #define AD_AGGREGATE_WAIT_TIME 2
50 /* Port state definitions (43.4.2.2 in the 802.3ad standard) */
51 #define AD_STATE_LACP_ACTIVITY 0x1
52 #define AD_STATE_LACP_TIMEOUT 0x2
53 #define AD_STATE_AGGREGATION 0x4
54 #define AD_STATE_SYNCHRONIZATION 0x8
55 #define AD_STATE_COLLECTING 0x10
56 #define AD_STATE_DISTRIBUTING 0x20
57 #define AD_STATE_DEFAULTED 0x40
58 #define AD_STATE_EXPIRED 0x80
60 /* Port Variables definitions used by the State Machines (43.4.7 in the
63 #define AD_PORT_BEGIN 0x1
64 #define AD_PORT_LACP_ENABLED 0x2
65 #define AD_PORT_ACTOR_CHURN 0x4
66 #define AD_PORT_PARTNER_CHURN 0x8
67 #define AD_PORT_READY 0x10
68 #define AD_PORT_READY_N 0x20
69 #define AD_PORT_MATCHED 0x40
70 #define AD_PORT_STANDBY 0x80
71 #define AD_PORT_SELECTED 0x100
72 #define AD_PORT_MOVED 0x200
73 #define AD_PORT_CHURNED (AD_PORT_ACTOR_CHURN | AD_PORT_PARTNER_CHURN)
75 /* Port Key definitions
76 * key is determined according to the link speed, duplex and
77 * user key (which is not yet supported)
78 * --------------------------------------------------------------
79 * Port key : | User key | Speed | Duplex |
80 * --------------------------------------------------------------
83 #define AD_DUPLEX_KEY_MASKS 0x1
84 #define AD_SPEED_KEY_MASKS 0x3E
85 #define AD_USER_KEY_MASKS 0xFFC0
87 enum ad_link_speed_type
{
88 AD_LINK_SPEED_1MBPS
= 1,
90 AD_LINK_SPEED_100MBPS
,
91 AD_LINK_SPEED_1000MBPS
,
92 AD_LINK_SPEED_2500MBPS
,
93 AD_LINK_SPEED_10000MBPS
,
94 AD_LINK_SPEED_20000MBPS
,
95 AD_LINK_SPEED_40000MBPS
,
96 AD_LINK_SPEED_56000MBPS
/* Compare two MAC addresses for equality.
 *
 * Both arguments are converted to (const u8 *) and handed to
 * ether_addr_equal_64bits(). Each argument is parenthesized before the
 * cast so that an expression argument (for example "ptr + 1") is converted
 * as a whole, instead of the cast binding to its first operand only.
 *
 * NOTE(review): ether_addr_equal_64bits() is documented as reading 8 bytes
 * from each address - confirm every operand passed here has two bytes of
 * readable padding after the 6-byte address.
 */
#define MAC_ADDRESS_EQUAL(A, B)	\
	ether_addr_equal_64bits((const u8 *)(A), (const u8 *)(B))
103 static struct mac_addr null_mac_addr
= { { 0, 0, 0, 0, 0, 0 } };
104 static u16 ad_ticks_per_sec
;
105 static const int ad_delta_in_ticks
= (AD_TIMER_INTERVAL
* HZ
) / 1000;
107 static const u8 lacpdu_mcast_addr
[ETH_ALEN
] = MULTICAST_LACPDU_ADDR
;
109 /* ================= main 802.3ad protocol functions ================== */
110 static int ad_lacpdu_send(struct port
*port
);
111 static int ad_marker_send(struct port
*port
, struct bond_marker
*marker
);
112 static void ad_mux_machine(struct port
*port
, bool *update_slave_arr
);
113 static void ad_rx_machine(struct lacpdu
*lacpdu
, struct port
*port
);
114 static void ad_tx_machine(struct port
*port
);
115 static void ad_periodic_machine(struct port
*port
);
116 static void ad_port_selection_logic(struct port
*port
, bool *update_slave_arr
);
117 static void ad_agg_selection_logic(struct aggregator
*aggregator
,
118 bool *update_slave_arr
);
119 static void ad_clear_agg(struct aggregator
*aggregator
);
120 static void ad_initialize_agg(struct aggregator
*aggregator
);
121 static void ad_initialize_port(struct port
*port
, int lacp_fast
);
122 static void ad_enable_collecting_distributing(struct port
*port
,
123 bool *update_slave_arr
);
124 static void ad_disable_collecting_distributing(struct port
*port
,
125 bool *update_slave_arr
);
126 static void ad_marker_info_received(struct bond_marker
*marker_info
,
128 static void ad_marker_response_received(struct bond_marker
*marker
,
132 /* ================= api to bonding and kernel code ================== */
135 * __get_bond_by_port - get the port's bonding struct
136 * @port: the port we're looking at
138 * Return @port's bonding struct, or %NULL if it can't be found.
140 static inline struct bonding
*__get_bond_by_port(struct port
*port
)
142 if (port
->slave
== NULL
)
145 return bond_get_bond_by_slave(port
->slave
);
149 * __get_first_agg - get the first aggregator in the bond
150 * @bond: the bond we're looking at
152 * Return the aggregator of the first slave in @bond, or %NULL if it can't be
154 * The caller must hold RCU or RTNL lock.
156 static inline struct aggregator
*__get_first_agg(struct port
*port
)
158 struct bonding
*bond
= __get_bond_by_port(port
);
159 struct slave
*first_slave
;
160 struct aggregator
*agg
;
162 /* If there's no bond for this port, or bond has no slaves */
167 first_slave
= bond_first_slave_rcu(bond
);
168 agg
= first_slave
? &(SLAVE_AD_INFO(first_slave
)->aggregator
) : NULL
;
175 * __agg_has_partner - see if we have a partner
176 * @agg: the agregator we're looking at
178 * Return nonzero if aggregator has a partner (denoted by a non-zero ether
179 * address for the partner). Return 0 if not.
181 static inline int __agg_has_partner(struct aggregator
*agg
)
183 return !is_zero_ether_addr(agg
->partner_system
.mac_addr_value
);
187 * __disable_port - disable the port's slave
188 * @port: the port we're looking at
190 static inline void __disable_port(struct port
*port
)
192 bond_set_slave_inactive_flags(port
->slave
, BOND_SLAVE_NOTIFY_LATER
);
196 * __enable_port - enable the port's slave, if it's up
197 * @port: the port we're looking at
199 static inline void __enable_port(struct port
*port
)
201 struct slave
*slave
= port
->slave
;
203 if ((slave
->link
== BOND_LINK_UP
) && bond_slave_is_up(slave
))
204 bond_set_slave_active_flags(slave
, BOND_SLAVE_NOTIFY_LATER
);
208 * __port_is_enabled - check if the port's slave is in active state
209 * @port: the port we're looking at
211 static inline int __port_is_enabled(struct port
*port
)
213 return bond_is_active_slave(port
->slave
);
217 * __get_agg_selection_mode - get the aggregator selection mode
218 * @port: the port we're looking at
220 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT.
222 static inline u32
__get_agg_selection_mode(struct port
*port
)
224 struct bonding
*bond
= __get_bond_by_port(port
);
227 return BOND_AD_STABLE
;
229 return bond
->params
.ad_select
;
233 * __check_agg_selection_timer - check if the selection timer has expired
234 * @port: the port we're looking at
236 static inline int __check_agg_selection_timer(struct port
*port
)
238 struct bonding
*bond
= __get_bond_by_port(port
);
243 return BOND_AD_INFO(bond
).agg_select_timer
? 1 : 0;
247 * __get_link_speed - get a port's speed
248 * @port: the port we're looking at
250 * Return @port's speed in 802.3ad enum format. i.e. one of:
252 * %AD_LINK_SPEED_10MBPS,
253 * %AD_LINK_SPEED_100MBPS,
254 * %AD_LINK_SPEED_1000MBPS,
255 * %AD_LINK_SPEED_2500MBPS,
256 * %AD_LINK_SPEED_10000MBPS
257 * %AD_LINK_SPEED_20000MBPS
258 * %AD_LINK_SPEED_40000MBPS
259 * %AD_LINK_SPEED_56000MBPS
261 static u16
__get_link_speed(struct port
*port
)
263 struct slave
*slave
= port
->slave
;
266 /* this if covers only a special case: when the configuration starts
267 * with link down, it sets the speed to 0.
268 * This is done in spite of the fact that the e100 driver reports 0
269 * to be compatible with MVT in the future.
271 if (slave
->link
!= BOND_LINK_UP
)
274 switch (slave
->speed
) {
276 speed
= AD_LINK_SPEED_10MBPS
;
280 speed
= AD_LINK_SPEED_100MBPS
;
284 speed
= AD_LINK_SPEED_1000MBPS
;
288 speed
= AD_LINK_SPEED_2500MBPS
;
292 speed
= AD_LINK_SPEED_10000MBPS
;
296 speed
= AD_LINK_SPEED_20000MBPS
;
300 speed
= AD_LINK_SPEED_40000MBPS
;
304 speed
= AD_LINK_SPEED_56000MBPS
;
308 /* unknown speed value from ethtool. shouldn't happen */
314 netdev_dbg(slave
->bond
->dev
, "Port %d Received link speed %d update from adapter\n",
315 port
->actor_port_number
, speed
);
320 * __get_duplex - get a port's duplex
321 * @port: the port we're looking at
323 * Return @port's duplex in 802.3ad bitmask format. i.e.:
324 * 0x01 if in full duplex
327 static u8
__get_duplex(struct port
*port
)
329 struct slave
*slave
= port
->slave
;
332 /* handling a special case: when the configuration starts with
333 * link down, it sets the duplex to 0.
335 if (slave
->link
!= BOND_LINK_UP
) {
338 switch (slave
->duplex
) {
341 netdev_dbg(slave
->bond
->dev
, "Port %d Received status full duplex update from adapter\n",
342 port
->actor_port_number
);
347 netdev_dbg(slave
->bond
->dev
, "Port %d Received status NOT full duplex update from adapter\n",
348 port
->actor_port_number
);
358 * __ad_timer_to_ticks - convert a given timer type to AD module ticks
359 * @timer_type: which timer to operate
360 * @par: timer parameter. see below
362 * If @timer_type is %current_while_timer, @par indicates long/short timer.
363 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME,
364 * %SLOW_PERIODIC_TIME.
366 static u16
__ad_timer_to_ticks(u16 timer_type
, u16 par
)
368 u16 retval
= 0; /* to silence the compiler */
370 switch (timer_type
) {
371 case AD_CURRENT_WHILE_TIMER
: /* for rx machine usage */
373 retval
= (AD_SHORT_TIMEOUT_TIME
*ad_ticks_per_sec
);
375 retval
= (AD_LONG_TIMEOUT_TIME
*ad_ticks_per_sec
);
377 case AD_ACTOR_CHURN_TIMER
: /* for local churn machine */
378 retval
= (AD_CHURN_DETECTION_TIME
*ad_ticks_per_sec
);
380 case AD_PERIODIC_TIMER
: /* for periodic machine */
381 retval
= (par
*ad_ticks_per_sec
); /* long timeout */
383 case AD_PARTNER_CHURN_TIMER
: /* for remote churn machine */
384 retval
= (AD_CHURN_DETECTION_TIME
*ad_ticks_per_sec
);
386 case AD_WAIT_WHILE_TIMER
: /* for selection machine */
387 retval
= (AD_AGGREGATE_WAIT_TIME
*ad_ticks_per_sec
);
395 /* ================= ad_rx_machine helper functions ================== */
398 * __choose_matched - update a port's matched variable from a received lacpdu
399 * @lacpdu: the lacpdu we've received
400 * @port: the port we're looking at
402 * Update the value of the matched variable, using parameter values from a
403 * newly received lacpdu. Parameter values for the partner carried in the
404 * received PDU are compared with the corresponding operational parameter
405 * values for the actor. Matched is set to TRUE if all of these parameters
406 * match and the PDU parameter partner_state.aggregation has the same value as
407 * actor_oper_port_state.aggregation and lacp will actively maintain the link
408 * in the aggregation. Matched is also set to TRUE if the value of
409 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates
410 * an individual link and lacp will actively maintain the link. Otherwise,
411 * matched is set to FALSE. LACP is considered to be actively maintaining the
412 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both
413 * the actor's actor_oper_port_state.lacp_activity and the PDU's
414 * partner_state.lacp_activity variables are TRUE.
416 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is
417 * used here to implement the language from 802.3ad 43.4.9 that requires
418 * recordPDU to "match" the LACPDU parameters to the stored values.
420 static void __choose_matched(struct lacpdu
*lacpdu
, struct port
*port
)
422 /* check if all parameters are alike
423 * or this is individual link(aggregation == FALSE)
424 * then update the state machine Matched variable.
426 if (((ntohs(lacpdu
->partner_port
) == port
->actor_port_number
) &&
427 (ntohs(lacpdu
->partner_port_priority
) == port
->actor_port_priority
) &&
428 MAC_ADDRESS_EQUAL(&(lacpdu
->partner_system
), &(port
->actor_system
)) &&
429 (ntohs(lacpdu
->partner_system_priority
) == port
->actor_system_priority
) &&
430 (ntohs(lacpdu
->partner_key
) == port
->actor_oper_port_key
) &&
431 ((lacpdu
->partner_state
& AD_STATE_AGGREGATION
) == (port
->actor_oper_port_state
& AD_STATE_AGGREGATION
))) ||
432 ((lacpdu
->actor_state
& AD_STATE_AGGREGATION
) == 0)
434 port
->sm_vars
|= AD_PORT_MATCHED
;
436 port
->sm_vars
&= ~AD_PORT_MATCHED
;
441 * __record_pdu - record parameters from a received lacpdu
442 * @lacpdu: the lacpdu we've received
443 * @port: the port we're looking at
445 * Record the parameter values for the Actor carried in a received lacpdu as
446 * the current partner operational parameter values and sets
447 * actor_oper_port_state.defaulted to FALSE.
449 static void __record_pdu(struct lacpdu
*lacpdu
, struct port
*port
)
451 if (lacpdu
&& port
) {
452 struct port_params
*partner
= &port
->partner_oper
;
454 __choose_matched(lacpdu
, port
);
455 /* record the new parameter values for the partner
458 partner
->port_number
= ntohs(lacpdu
->actor_port
);
459 partner
->port_priority
= ntohs(lacpdu
->actor_port_priority
);
460 partner
->system
= lacpdu
->actor_system
;
461 partner
->system_priority
= ntohs(lacpdu
->actor_system_priority
);
462 partner
->key
= ntohs(lacpdu
->actor_key
);
463 partner
->port_state
= lacpdu
->actor_state
;
465 /* set actor_oper_port_state.defaulted to FALSE */
466 port
->actor_oper_port_state
&= ~AD_STATE_DEFAULTED
;
468 /* set the partner sync. to on if the partner is sync,
469 * and the port is matched
471 if ((port
->sm_vars
& AD_PORT_MATCHED
) &&
472 (lacpdu
->actor_state
& AD_STATE_SYNCHRONIZATION
)) {
473 partner
->port_state
|= AD_STATE_SYNCHRONIZATION
;
474 pr_debug("%s partner sync=1\n", port
->slave
->dev
->name
);
476 partner
->port_state
&= ~AD_STATE_SYNCHRONIZATION
;
477 pr_debug("%s partner sync=0\n", port
->slave
->dev
->name
);
483 * __record_default - record default parameters
484 * @port: the port we're looking at
486 * This function records the default parameter values for the partner carried
487 * in the Partner Admin parameters as the current partner operational parameter
488 * values and sets actor_oper_port_state.defaulted to TRUE.
490 static void __record_default(struct port
*port
)
493 /* record the partner admin parameters */
494 memcpy(&port
->partner_oper
, &port
->partner_admin
,
495 sizeof(struct port_params
));
497 /* set actor_oper_port_state.defaulted to true */
498 port
->actor_oper_port_state
|= AD_STATE_DEFAULTED
;
503 * __update_selected - update a port's Selected variable from a received lacpdu
504 * @lacpdu: the lacpdu we've received
505 * @port: the port we're looking at
507 * Update the value of the selected variable, using parameter values from a
508 * newly received lacpdu. The parameter values for the Actor carried in the
509 * received PDU are compared with the corresponding operational parameter
510 * values for the ports partner. If one or more of the comparisons shows that
511 * the value(s) received in the PDU differ from the current operational values,
512 * then selected is set to FALSE and actor_oper_port_state.synchronization is
513 * set to out_of_sync. Otherwise, selected remains unchanged.
515 static void __update_selected(struct lacpdu
*lacpdu
, struct port
*port
)
517 if (lacpdu
&& port
) {
518 const struct port_params
*partner
= &port
->partner_oper
;
520 /* check if any parameter is different then
521 * update the state machine selected variable.
523 if (ntohs(lacpdu
->actor_port
) != partner
->port_number
||
524 ntohs(lacpdu
->actor_port_priority
) != partner
->port_priority
||
525 !MAC_ADDRESS_EQUAL(&lacpdu
->actor_system
, &partner
->system
) ||
526 ntohs(lacpdu
->actor_system_priority
) != partner
->system_priority
||
527 ntohs(lacpdu
->actor_key
) != partner
->key
||
528 (lacpdu
->actor_state
& AD_STATE_AGGREGATION
) != (partner
->port_state
& AD_STATE_AGGREGATION
)) {
529 port
->sm_vars
&= ~AD_PORT_SELECTED
;
535 * __update_default_selected - update a port's Selected variable from Partner
536 * @port: the port we're looking at
538 * This function updates the value of the selected variable, using the partner
539 * administrative parameter values. The administrative values are compared with
540 * the corresponding operational parameter values for the partner. If one or
541 * more of the comparisons shows that the administrative value(s) differ from
542 * the current operational values, then Selected is set to FALSE and
543 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise,
544 * Selected remains unchanged.
546 static void __update_default_selected(struct port
*port
)
549 const struct port_params
*admin
= &port
->partner_admin
;
550 const struct port_params
*oper
= &port
->partner_oper
;
552 /* check if any parameter is different then
553 * update the state machine selected variable.
555 if (admin
->port_number
!= oper
->port_number
||
556 admin
->port_priority
!= oper
->port_priority
||
557 !MAC_ADDRESS_EQUAL(&admin
->system
, &oper
->system
) ||
558 admin
->system_priority
!= oper
->system_priority
||
559 admin
->key
!= oper
->key
||
560 (admin
->port_state
& AD_STATE_AGGREGATION
)
561 != (oper
->port_state
& AD_STATE_AGGREGATION
)) {
562 port
->sm_vars
&= ~AD_PORT_SELECTED
;
568 * __update_ntt - update a port's ntt variable from a received lacpdu
569 * @lacpdu: the lacpdu we've received
570 * @port: the port we're looking at
572 * Updates the value of the ntt variable, using parameter values from a newly
573 * received lacpdu. The parameter values for the partner carried in the
574 * received PDU are compared with the corresponding operational parameter
575 * values for the Actor. If one or more of the comparisons shows that the
576 * value(s) received in the PDU differ from the current operational values,
577 * then ntt is set to TRUE. Otherwise, ntt remains unchanged.
579 static void __update_ntt(struct lacpdu
*lacpdu
, struct port
*port
)
581 /* validate lacpdu and port */
582 if (lacpdu
&& port
) {
583 /* check if any parameter is different then
584 * update the port->ntt.
586 if ((ntohs(lacpdu
->partner_port
) != port
->actor_port_number
) ||
587 (ntohs(lacpdu
->partner_port_priority
) != port
->actor_port_priority
) ||
588 !MAC_ADDRESS_EQUAL(&(lacpdu
->partner_system
), &(port
->actor_system
)) ||
589 (ntohs(lacpdu
->partner_system_priority
) != port
->actor_system_priority
) ||
590 (ntohs(lacpdu
->partner_key
) != port
->actor_oper_port_key
) ||
591 ((lacpdu
->partner_state
& AD_STATE_LACP_ACTIVITY
) != (port
->actor_oper_port_state
& AD_STATE_LACP_ACTIVITY
)) ||
592 ((lacpdu
->partner_state
& AD_STATE_LACP_TIMEOUT
) != (port
->actor_oper_port_state
& AD_STATE_LACP_TIMEOUT
)) ||
593 ((lacpdu
->partner_state
& AD_STATE_SYNCHRONIZATION
) != (port
->actor_oper_port_state
& AD_STATE_SYNCHRONIZATION
)) ||
594 ((lacpdu
->partner_state
& AD_STATE_AGGREGATION
) != (port
->actor_oper_port_state
& AD_STATE_AGGREGATION
))
602 * __agg_ports_are_ready - check if all ports in an aggregator are ready
603 * @aggregator: the aggregator we're looking at
606 static int __agg_ports_are_ready(struct aggregator
*aggregator
)
612 /* scan all ports in this aggregator to verify if they are
615 for (port
= aggregator
->lag_ports
;
617 port
= port
->next_port_in_aggregator
) {
618 if (!(port
->sm_vars
& AD_PORT_READY_N
)) {
629 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator
630 * @aggregator: the aggregator we're looking at
631 * @val: Should the ports' ready bit be set on or off
634 static void __set_agg_ports_ready(struct aggregator
*aggregator
, int val
)
638 for (port
= aggregator
->lag_ports
; port
;
639 port
= port
->next_port_in_aggregator
) {
641 port
->sm_vars
|= AD_PORT_READY
;
643 port
->sm_vars
&= ~AD_PORT_READY
;
648 * __get_agg_bandwidth - get the total bandwidth of an aggregator
649 * @aggregator: the aggregator we're looking at
652 static u32
__get_agg_bandwidth(struct aggregator
*aggregator
)
656 if (aggregator
->num_of_ports
) {
657 switch (__get_link_speed(aggregator
->lag_ports
)) {
658 case AD_LINK_SPEED_1MBPS
:
659 bandwidth
= aggregator
->num_of_ports
;
661 case AD_LINK_SPEED_10MBPS
:
662 bandwidth
= aggregator
->num_of_ports
* 10;
664 case AD_LINK_SPEED_100MBPS
:
665 bandwidth
= aggregator
->num_of_ports
* 100;
667 case AD_LINK_SPEED_1000MBPS
:
668 bandwidth
= aggregator
->num_of_ports
* 1000;
670 case AD_LINK_SPEED_2500MBPS
:
671 bandwidth
= aggregator
->num_of_ports
* 2500;
673 case AD_LINK_SPEED_10000MBPS
:
674 bandwidth
= aggregator
->num_of_ports
* 10000;
676 case AD_LINK_SPEED_20000MBPS
:
677 bandwidth
= aggregator
->num_of_ports
* 20000;
679 case AD_LINK_SPEED_40000MBPS
:
680 bandwidth
= aggregator
->num_of_ports
* 40000;
682 case AD_LINK_SPEED_56000MBPS
:
683 bandwidth
= aggregator
->num_of_ports
* 56000;
686 bandwidth
= 0; /* to silence the compiler */
693 * __get_active_agg - get the current active aggregator
694 * @aggregator: the aggregator we're looking at
696 * Caller must hold RCU lock.
698 static struct aggregator
*__get_active_agg(struct aggregator
*aggregator
)
700 struct bonding
*bond
= aggregator
->slave
->bond
;
701 struct list_head
*iter
;
704 bond_for_each_slave_rcu(bond
, slave
, iter
)
705 if (SLAVE_AD_INFO(slave
)->aggregator
.is_active
)
706 return &(SLAVE_AD_INFO(slave
)->aggregator
);
712 * __update_lacpdu_from_port - update a port's lacpdu fields
713 * @port: the port we're looking at
715 static inline void __update_lacpdu_from_port(struct port
*port
)
717 struct lacpdu
*lacpdu
= &port
->lacpdu
;
718 const struct port_params
*partner
= &port
->partner_oper
;
720 /* update current actual Actor parameters
721 * lacpdu->subtype initialized
722 * lacpdu->version_number initialized
723 * lacpdu->tlv_type_actor_info initialized
724 * lacpdu->actor_information_length initialized
727 lacpdu
->actor_system_priority
= htons(port
->actor_system_priority
);
728 lacpdu
->actor_system
= port
->actor_system
;
729 lacpdu
->actor_key
= htons(port
->actor_oper_port_key
);
730 lacpdu
->actor_port_priority
= htons(port
->actor_port_priority
);
731 lacpdu
->actor_port
= htons(port
->actor_port_number
);
732 lacpdu
->actor_state
= port
->actor_oper_port_state
;
733 pr_debug("update lacpdu: %s, actor port state %x\n",
734 port
->slave
->dev
->name
, port
->actor_oper_port_state
);
736 /* lacpdu->reserved_3_1 initialized
737 * lacpdu->tlv_type_partner_info initialized
738 * lacpdu->partner_information_length initialized
741 lacpdu
->partner_system_priority
= htons(partner
->system_priority
);
742 lacpdu
->partner_system
= partner
->system
;
743 lacpdu
->partner_key
= htons(partner
->key
);
744 lacpdu
->partner_port_priority
= htons(partner
->port_priority
);
745 lacpdu
->partner_port
= htons(partner
->port_number
);
746 lacpdu
->partner_state
= partner
->port_state
;
748 /* lacpdu->reserved_3_2 initialized
749 * lacpdu->tlv_type_collector_info initialized
750 * lacpdu->collector_information_length initialized
751 * collector_max_delay initialized
752 * reserved_12[12] initialized
753 * tlv_type_terminator initialized
754 * terminator_length initialized
755 * reserved_50[50] initialized
759 /* ================= main 802.3ad protocol code ========================= */
762 * ad_lacpdu_send - send out a lacpdu packet on a given port
763 * @port: the port we're looking at
765 * Returns: 0 on success
768 static int ad_lacpdu_send(struct port
*port
)
770 struct slave
*slave
= port
->slave
;
772 struct lacpdu_header
*lacpdu_header
;
773 int length
= sizeof(struct lacpdu_header
);
775 skb
= dev_alloc_skb(length
);
779 skb
->dev
= slave
->dev
;
780 skb_reset_mac_header(skb
);
781 skb
->network_header
= skb
->mac_header
+ ETH_HLEN
;
782 skb
->protocol
= PKT_TYPE_LACPDU
;
783 skb
->priority
= TC_PRIO_CONTROL
;
785 lacpdu_header
= (struct lacpdu_header
*)skb_put(skb
, length
);
787 ether_addr_copy(lacpdu_header
->hdr
.h_dest
, lacpdu_mcast_addr
);
788 /* Note: source address is set to be the member's PERMANENT address,
789 * because we use it to identify loopback lacpdus in receive.
791 ether_addr_copy(lacpdu_header
->hdr
.h_source
, slave
->perm_hwaddr
);
792 lacpdu_header
->hdr
.h_proto
= PKT_TYPE_LACPDU
;
794 lacpdu_header
->lacpdu
= port
->lacpdu
;
802 * ad_marker_send - send marker information/response on a given port
803 * @port: the port we're looking at
804 * @marker: marker data to send
806 * Returns: 0 on success
809 static int ad_marker_send(struct port
*port
, struct bond_marker
*marker
)
811 struct slave
*slave
= port
->slave
;
813 struct bond_marker_header
*marker_header
;
814 int length
= sizeof(struct bond_marker_header
);
816 skb
= dev_alloc_skb(length
+ 16);
820 skb_reserve(skb
, 16);
822 skb
->dev
= slave
->dev
;
823 skb_reset_mac_header(skb
);
824 skb
->network_header
= skb
->mac_header
+ ETH_HLEN
;
825 skb
->protocol
= PKT_TYPE_LACPDU
;
827 marker_header
= (struct bond_marker_header
*)skb_put(skb
, length
);
829 ether_addr_copy(marker_header
->hdr
.h_dest
, lacpdu_mcast_addr
);
830 /* Note: source address is set to be the member's PERMANENT address,
831 * because we use it to identify loopback MARKERs in receive.
833 ether_addr_copy(marker_header
->hdr
.h_source
, slave
->perm_hwaddr
);
834 marker_header
->hdr
.h_proto
= PKT_TYPE_LACPDU
;
836 marker_header
->marker
= *marker
;
844 * ad_mux_machine - handle a port's mux state machine
845 * @port: the port we're looking at
846 * @update_slave_arr: Does slave array need update?
848 static void ad_mux_machine(struct port
*port
, bool *update_slave_arr
)
850 mux_states_t last_state
;
852 /* keep current State Machine state to compare later if it was
855 last_state
= port
->sm_mux_state
;
857 if (port
->sm_vars
& AD_PORT_BEGIN
) {
858 port
->sm_mux_state
= AD_MUX_DETACHED
;
860 switch (port
->sm_mux_state
) {
861 case AD_MUX_DETACHED
:
862 if ((port
->sm_vars
& AD_PORT_SELECTED
)
863 || (port
->sm_vars
& AD_PORT_STANDBY
))
864 /* if SELECTED or STANDBY */
865 port
->sm_mux_state
= AD_MUX_WAITING
;
868 /* if SELECTED == FALSE return to DETACH state */
869 if (!(port
->sm_vars
& AD_PORT_SELECTED
)) {
870 port
->sm_vars
&= ~AD_PORT_READY_N
;
871 /* in order to withhold the Selection Logic to
872 * check all ports READY_N value every callback
873 * cycle to update ready variable, we check
874 * READY_N and update READY here
876 __set_agg_ports_ready(port
->aggregator
, __agg_ports_are_ready(port
->aggregator
));
877 port
->sm_mux_state
= AD_MUX_DETACHED
;
881 /* check if the wait_while_timer expired */
882 if (port
->sm_mux_timer_counter
883 && !(--port
->sm_mux_timer_counter
))
884 port
->sm_vars
|= AD_PORT_READY_N
;
886 /* in order to withhold the selection logic to check
887 * all ports READY_N value every callback cycle to
888 * update ready variable, we check READY_N and update
891 __set_agg_ports_ready(port
->aggregator
, __agg_ports_are_ready(port
->aggregator
));
893 /* if the wait_while_timer expired, and the port is
894 * in READY state, move to ATTACHED state
896 if ((port
->sm_vars
& AD_PORT_READY
)
897 && !port
->sm_mux_timer_counter
)
898 port
->sm_mux_state
= AD_MUX_ATTACHED
;
900 case AD_MUX_ATTACHED
:
901 /* check also if agg_select_timer expired (so the
902 * enabling the port will take place only after this timer)
904 if ((port
->sm_vars
& AD_PORT_SELECTED
) &&
905 (port
->partner_oper
.port_state
& AD_STATE_SYNCHRONIZATION
) &&
906 !__check_agg_selection_timer(port
)) {
907 if (port
->aggregator
->is_active
)
909 AD_MUX_COLLECTING_DISTRIBUTING
;
910 } else if (!(port
->sm_vars
& AD_PORT_SELECTED
) ||
911 (port
->sm_vars
& AD_PORT_STANDBY
)) {
912 /* if UNSELECTED or STANDBY */
913 port
->sm_vars
&= ~AD_PORT_READY_N
;
914 /* in order to withhold the selection logic to
915 * check all ports READY_N value every callback
916 * cycle to update ready variable, we check
917 * READY_N and update READY here
919 __set_agg_ports_ready(port
->aggregator
, __agg_ports_are_ready(port
->aggregator
));
920 port
->sm_mux_state
= AD_MUX_DETACHED
;
921 } else if (port
->aggregator
->is_active
) {
922 port
->actor_oper_port_state
|=
923 AD_STATE_SYNCHRONIZATION
;
926 case AD_MUX_COLLECTING_DISTRIBUTING
:
927 if (!(port
->sm_vars
& AD_PORT_SELECTED
) ||
928 (port
->sm_vars
& AD_PORT_STANDBY
) ||
929 !(port
->partner_oper
.port_state
& AD_STATE_SYNCHRONIZATION
) ||
930 !(port
->actor_oper_port_state
& AD_STATE_SYNCHRONIZATION
)) {
931 port
->sm_mux_state
= AD_MUX_ATTACHED
;
933 /* if port state hasn't changed make
934 * sure that a collecting distributing
935 * port in an active aggregator is enabled
937 if (port
->aggregator
&&
938 port
->aggregator
->is_active
&&
939 !__port_is_enabled(port
)) {
950 /* check if the state machine was changed */
951 if (port
->sm_mux_state
!= last_state
) {
952 pr_debug("Mux Machine: Port=%d (%s), Last State=%d, Curr State=%d\n",
953 port
->actor_port_number
,
954 port
->slave
->dev
->name
,
957 switch (port
->sm_mux_state
) {
958 case AD_MUX_DETACHED
:
959 port
->actor_oper_port_state
&= ~AD_STATE_SYNCHRONIZATION
;
960 ad_disable_collecting_distributing(port
,
962 port
->actor_oper_port_state
&= ~AD_STATE_COLLECTING
;
963 port
->actor_oper_port_state
&= ~AD_STATE_DISTRIBUTING
;
967 port
->sm_mux_timer_counter
= __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER
, 0);
969 case AD_MUX_ATTACHED
:
970 if (port
->aggregator
->is_active
)
971 port
->actor_oper_port_state
|=
972 AD_STATE_SYNCHRONIZATION
;
974 port
->actor_oper_port_state
&=
975 ~AD_STATE_SYNCHRONIZATION
;
976 port
->actor_oper_port_state
&= ~AD_STATE_COLLECTING
;
977 port
->actor_oper_port_state
&= ~AD_STATE_DISTRIBUTING
;
978 ad_disable_collecting_distributing(port
,
982 case AD_MUX_COLLECTING_DISTRIBUTING
:
983 port
->actor_oper_port_state
|= AD_STATE_COLLECTING
;
984 port
->actor_oper_port_state
|= AD_STATE_DISTRIBUTING
;
985 port
->actor_oper_port_state
|= AD_STATE_SYNCHRONIZATION
;
986 ad_enable_collecting_distributing(port
,
997 * ad_rx_machine - handle a port's rx State Machine
998 * @lacpdu: the lacpdu we've received
999 * @port: the port we're looking at
1001 * If lacpdu arrived, stop previous timer (if exists) and set the next state as
1002 * CURRENT. If timer expired set the state machine in the proper state.
1003 * In other cases, this function checks if we need to switch to other state.
1005 static void ad_rx_machine(struct lacpdu
*lacpdu
, struct port
*port
)
1007 rx_states_t last_state
;
1009 /* keep current State Machine state to compare later if it was
1012 last_state
= port
->sm_rx_state
;
1014 /* check if state machine should change state */
1016 /* first, check if port was reinitialized */
1017 if (port
->sm_vars
& AD_PORT_BEGIN
) {
1018 port
->sm_rx_state
= AD_RX_INITIALIZE
;
1019 port
->sm_vars
|= AD_PORT_CHURNED
;
1020 /* check if port is not enabled */
1021 } else if (!(port
->sm_vars
& AD_PORT_BEGIN
)
1022 && !port
->is_enabled
&& !(port
->sm_vars
& AD_PORT_MOVED
))
1023 port
->sm_rx_state
= AD_RX_PORT_DISABLED
;
1024 /* check if new lacpdu arrived */
1025 else if (lacpdu
&& ((port
->sm_rx_state
== AD_RX_EXPIRED
) ||
1026 (port
->sm_rx_state
== AD_RX_DEFAULTED
) ||
1027 (port
->sm_rx_state
== AD_RX_CURRENT
))) {
1028 if (port
->sm_rx_state
!= AD_RX_CURRENT
)
1029 port
->sm_vars
|= AD_PORT_CHURNED
;
1030 port
->sm_rx_timer_counter
= 0;
1031 port
->sm_rx_state
= AD_RX_CURRENT
;
1033 /* if timer is on, and if it is expired */
1034 if (port
->sm_rx_timer_counter
&&
1035 !(--port
->sm_rx_timer_counter
)) {
1036 switch (port
->sm_rx_state
) {
1038 port
->sm_rx_state
= AD_RX_DEFAULTED
;
1041 port
->sm_rx_state
= AD_RX_EXPIRED
;
1047 /* if no lacpdu arrived and no timer is on */
1048 switch (port
->sm_rx_state
) {
1049 case AD_RX_PORT_DISABLED
:
1050 if (port
->sm_vars
& AD_PORT_MOVED
)
1051 port
->sm_rx_state
= AD_RX_INITIALIZE
;
1052 else if (port
->is_enabled
1054 & AD_PORT_LACP_ENABLED
))
1055 port
->sm_rx_state
= AD_RX_EXPIRED
;
1056 else if (port
->is_enabled
1058 & AD_PORT_LACP_ENABLED
) == 0))
1059 port
->sm_rx_state
= AD_RX_LACP_DISABLED
;
1068 /* check if the State machine was changed or new lacpdu arrived */
1069 if ((port
->sm_rx_state
!= last_state
) || (lacpdu
)) {
1070 pr_debug("Rx Machine: Port=%d (%s), Last State=%d, Curr State=%d\n",
1071 port
->actor_port_number
,
1072 port
->slave
->dev
->name
,
1075 switch (port
->sm_rx_state
) {
1076 case AD_RX_INITIALIZE
:
1077 if (!(port
->actor_oper_port_key
& AD_DUPLEX_KEY_MASKS
))
1078 port
->sm_vars
&= ~AD_PORT_LACP_ENABLED
;
1080 port
->sm_vars
|= AD_PORT_LACP_ENABLED
;
1081 port
->sm_vars
&= ~AD_PORT_SELECTED
;
1082 __record_default(port
);
1083 port
->actor_oper_port_state
&= ~AD_STATE_EXPIRED
;
1084 port
->sm_vars
&= ~AD_PORT_MOVED
;
1085 port
->sm_rx_state
= AD_RX_PORT_DISABLED
;
1088 case AD_RX_PORT_DISABLED
:
1089 port
->sm_vars
&= ~AD_PORT_MATCHED
;
1091 case AD_RX_LACP_DISABLED
:
1092 port
->sm_vars
&= ~AD_PORT_SELECTED
;
1093 __record_default(port
);
1094 port
->partner_oper
.port_state
&= ~AD_STATE_AGGREGATION
;
1095 port
->sm_vars
|= AD_PORT_MATCHED
;
1096 port
->actor_oper_port_state
&= ~AD_STATE_EXPIRED
;
1099 /* Reset of the Synchronization flag (Standard 43.4.12)
1100 * This reset cause to disable this port in the
1101 * COLLECTING_DISTRIBUTING state of the mux machine in
1102 * case of EXPIRED even if LINK_DOWN didn't arrive for
1105 port
->partner_oper
.port_state
&= ~AD_STATE_SYNCHRONIZATION
;
1106 port
->sm_vars
&= ~AD_PORT_MATCHED
;
1107 port
->partner_oper
.port_state
|= AD_STATE_LACP_TIMEOUT
;
1108 port
->partner_oper
.port_state
|= AD_STATE_LACP_ACTIVITY
;
1109 port
->sm_rx_timer_counter
= __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER
, (u16
)(AD_SHORT_TIMEOUT
));
1110 port
->actor_oper_port_state
|= AD_STATE_EXPIRED
;
1111 port
->sm_vars
|= AD_PORT_CHURNED
;
1113 case AD_RX_DEFAULTED
:
1114 __update_default_selected(port
);
1115 __record_default(port
);
1116 port
->sm_vars
|= AD_PORT_MATCHED
;
1117 port
->actor_oper_port_state
&= ~AD_STATE_EXPIRED
;
1120 /* detect loopback situation */
1121 if (MAC_ADDRESS_EQUAL(&(lacpdu
->actor_system
),
1122 &(port
->actor_system
))) {
1123 netdev_err(port
->slave
->bond
->dev
, "An illegal loopback occurred on adapter (%s)\n"
1124 "Check the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n",
1125 port
->slave
->dev
->name
);
1128 __update_selected(lacpdu
, port
);
1129 __update_ntt(lacpdu
, port
);
1130 __record_pdu(lacpdu
, port
);
1131 port
->sm_rx_timer_counter
= __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER
, (u16
)(port
->actor_oper_port_state
& AD_STATE_LACP_TIMEOUT
));
1132 port
->actor_oper_port_state
&= ~AD_STATE_EXPIRED
;
1141 * ad_churn_machine - handle port churn's state machine
1142 * @port: the port we're looking at
1145 static void ad_churn_machine(struct port
*port
)
1147 if (port
->sm_vars
& AD_PORT_CHURNED
) {
1148 port
->sm_vars
&= ~AD_PORT_CHURNED
;
1149 port
->sm_churn_actor_state
= AD_CHURN_MONITOR
;
1150 port
->sm_churn_partner_state
= AD_CHURN_MONITOR
;
1151 port
->sm_churn_actor_timer_counter
=
1152 __ad_timer_to_ticks(AD_ACTOR_CHURN_TIMER
, 0);
1153 port
->sm_churn_partner_timer_counter
=
1154 __ad_timer_to_ticks(AD_PARTNER_CHURN_TIMER
, 0);
1157 if (port
->sm_churn_actor_timer_counter
&&
1158 !(--port
->sm_churn_actor_timer_counter
) &&
1159 port
->sm_churn_actor_state
== AD_CHURN_MONITOR
) {
1160 if (port
->actor_oper_port_state
& AD_STATE_SYNCHRONIZATION
) {
1161 port
->sm_churn_actor_state
= AD_NO_CHURN
;
1163 port
->churn_actor_count
++;
1164 port
->sm_churn_actor_state
= AD_CHURN
;
1167 if (port
->sm_churn_partner_timer_counter
&&
1168 !(--port
->sm_churn_partner_timer_counter
) &&
1169 port
->sm_churn_partner_state
== AD_CHURN_MONITOR
) {
1170 if (port
->partner_oper
.port_state
& AD_STATE_SYNCHRONIZATION
) {
1171 port
->sm_churn_partner_state
= AD_NO_CHURN
;
1173 port
->churn_partner_count
++;
1174 port
->sm_churn_partner_state
= AD_CHURN
;
1180 * ad_tx_machine - handle a port's tx state machine
1181 * @port: the port we're looking at
1183 static void ad_tx_machine(struct port
*port
)
1185 /* check if tx timer expired, to verify that we do not send more than
1186 * 3 packets per second
1188 if (port
->sm_tx_timer_counter
&& !(--port
->sm_tx_timer_counter
)) {
1189 /* check if there is something to send */
1190 if (port
->ntt
&& (port
->sm_vars
& AD_PORT_LACP_ENABLED
)) {
1191 __update_lacpdu_from_port(port
);
1193 if (ad_lacpdu_send(port
) >= 0) {
1194 pr_debug("Sent LACPDU on port %d\n",
1195 port
->actor_port_number
);
1197 /* mark ntt as false, so it will not be sent
1198 * again until demanded
1203 /* restart tx timer(to verify that we will not exceed
1204 * AD_MAX_TX_IN_SECOND
1206 port
->sm_tx_timer_counter
= ad_ticks_per_sec
/AD_MAX_TX_IN_SECOND
;
1211 * ad_periodic_machine - handle a port's periodic state machine
1212 * @port: the port we're looking at
1214 * Turn ntt flag on priodically to perform periodic transmission of lacpdu's.
1216 static void ad_periodic_machine(struct port
*port
)
1218 periodic_states_t last_state
;
1220 /* keep current state machine state to compare later if it was changed */
1221 last_state
= port
->sm_periodic_state
;
1223 /* check if port was reinitialized */
1224 if (((port
->sm_vars
& AD_PORT_BEGIN
) || !(port
->sm_vars
& AD_PORT_LACP_ENABLED
) || !port
->is_enabled
) ||
1225 (!(port
->actor_oper_port_state
& AD_STATE_LACP_ACTIVITY
) && !(port
->partner_oper
.port_state
& AD_STATE_LACP_ACTIVITY
))
1227 port
->sm_periodic_state
= AD_NO_PERIODIC
;
1229 /* check if state machine should change state */
1230 else if (port
->sm_periodic_timer_counter
) {
1231 /* check if periodic state machine expired */
1232 if (!(--port
->sm_periodic_timer_counter
)) {
1233 /* if expired then do tx */
1234 port
->sm_periodic_state
= AD_PERIODIC_TX
;
1236 /* If not expired, check if there is some new timeout
1237 * parameter from the partner state
1239 switch (port
->sm_periodic_state
) {
1240 case AD_FAST_PERIODIC
:
1241 if (!(port
->partner_oper
.port_state
1242 & AD_STATE_LACP_TIMEOUT
))
1243 port
->sm_periodic_state
= AD_SLOW_PERIODIC
;
1245 case AD_SLOW_PERIODIC
:
1246 if ((port
->partner_oper
.port_state
& AD_STATE_LACP_TIMEOUT
)) {
1247 port
->sm_periodic_timer_counter
= 0;
1248 port
->sm_periodic_state
= AD_PERIODIC_TX
;
1256 switch (port
->sm_periodic_state
) {
1257 case AD_NO_PERIODIC
:
1258 port
->sm_periodic_state
= AD_FAST_PERIODIC
;
1260 case AD_PERIODIC_TX
:
1261 if (!(port
->partner_oper
.port_state
&
1262 AD_STATE_LACP_TIMEOUT
))
1263 port
->sm_periodic_state
= AD_SLOW_PERIODIC
;
1265 port
->sm_periodic_state
= AD_FAST_PERIODIC
;
1272 /* check if the state machine was changed */
1273 if (port
->sm_periodic_state
!= last_state
) {
1274 pr_debug("Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n",
1275 port
->actor_port_number
, last_state
,
1276 port
->sm_periodic_state
);
1277 switch (port
->sm_periodic_state
) {
1278 case AD_NO_PERIODIC
:
1279 port
->sm_periodic_timer_counter
= 0;
1281 case AD_FAST_PERIODIC
:
1282 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1283 port
->sm_periodic_timer_counter
= __ad_timer_to_ticks(AD_PERIODIC_TIMER
, (u16
)(AD_FAST_PERIODIC_TIME
))-1;
1285 case AD_SLOW_PERIODIC
:
1286 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1287 port
->sm_periodic_timer_counter
= __ad_timer_to_ticks(AD_PERIODIC_TIMER
, (u16
)(AD_SLOW_PERIODIC_TIME
))-1;
1289 case AD_PERIODIC_TX
:
1299 * ad_port_selection_logic - select aggregation groups
1300 * @port: the port we're looking at
1301 * @update_slave_arr: Does slave array need update?
1303 * Select aggregation groups, and assign each port for it's aggregetor. The
1304 * selection logic is called in the inititalization (after all the handshkes),
1305 * and after every lacpdu receive (if selected is off).
1307 static void ad_port_selection_logic(struct port
*port
, bool *update_slave_arr
)
1309 struct aggregator
*aggregator
, *free_aggregator
= NULL
, *temp_aggregator
;
1310 struct port
*last_port
= NULL
, *curr_port
;
1311 struct list_head
*iter
;
1312 struct bonding
*bond
;
1313 struct slave
*slave
;
1316 /* if the port is already Selected, do nothing */
1317 if (port
->sm_vars
& AD_PORT_SELECTED
)
1320 bond
= __get_bond_by_port(port
);
1322 /* if the port is connected to other aggregator, detach it */
1323 if (port
->aggregator
) {
1324 /* detach the port from its former aggregator */
1325 temp_aggregator
= port
->aggregator
;
1326 for (curr_port
= temp_aggregator
->lag_ports
; curr_port
;
1327 last_port
= curr_port
,
1328 curr_port
= curr_port
->next_port_in_aggregator
) {
1329 if (curr_port
== port
) {
1330 temp_aggregator
->num_of_ports
--;
1331 /* if it is the first port attached to the
1335 temp_aggregator
->lag_ports
=
1336 port
->next_port_in_aggregator
;
1338 /* not the first port attached to the
1341 last_port
->next_port_in_aggregator
=
1342 port
->next_port_in_aggregator
;
1345 /* clear the port's relations to this
1348 port
->aggregator
= NULL
;
1349 port
->next_port_in_aggregator
= NULL
;
1350 port
->actor_port_aggregator_identifier
= 0;
1352 netdev_dbg(bond
->dev
, "Port %d left LAG %d\n",
1353 port
->actor_port_number
,
1354 temp_aggregator
->aggregator_identifier
);
1355 /* if the aggregator is empty, clear its
1356 * parameters, and set it ready to be attached
1358 if (!temp_aggregator
->lag_ports
)
1359 ad_clear_agg(temp_aggregator
);
1364 /* meaning: the port was related to an aggregator
1365 * but was not on the aggregator port list
1367 net_warn_ratelimited("%s: Warning: Port %d (on %s) was related to aggregator %d but was not on its port list\n",
1368 port
->slave
->bond
->dev
->name
,
1369 port
->actor_port_number
,
1370 port
->slave
->dev
->name
,
1371 port
->aggregator
->aggregator_identifier
);
1374 /* search on all aggregators for a suitable aggregator for this port */
1375 bond_for_each_slave(bond
, slave
, iter
) {
1376 aggregator
= &(SLAVE_AD_INFO(slave
)->aggregator
);
1378 /* keep a free aggregator for later use(if needed) */
1379 if (!aggregator
->lag_ports
) {
1380 if (!free_aggregator
)
1381 free_aggregator
= aggregator
;
1384 /* check if current aggregator suits us */
1385 if (((aggregator
->actor_oper_aggregator_key
== port
->actor_oper_port_key
) && /* if all parameters match AND */
1386 MAC_ADDRESS_EQUAL(&(aggregator
->partner_system
), &(port
->partner_oper
.system
)) &&
1387 (aggregator
->partner_system_priority
== port
->partner_oper
.system_priority
) &&
1388 (aggregator
->partner_oper_aggregator_key
== port
->partner_oper
.key
)
1390 ((!MAC_ADDRESS_EQUAL(&(port
->partner_oper
.system
), &(null_mac_addr
)) && /* partner answers */
1391 !aggregator
->is_individual
) /* but is not individual OR */
1394 /* attach to the founded aggregator */
1395 port
->aggregator
= aggregator
;
1396 port
->actor_port_aggregator_identifier
=
1397 port
->aggregator
->aggregator_identifier
;
1398 port
->next_port_in_aggregator
= aggregator
->lag_ports
;
1399 port
->aggregator
->num_of_ports
++;
1400 aggregator
->lag_ports
= port
;
1401 netdev_dbg(bond
->dev
, "Port %d joined LAG %d(existing LAG)\n",
1402 port
->actor_port_number
,
1403 port
->aggregator
->aggregator_identifier
);
1405 /* mark this port as selected */
1406 port
->sm_vars
|= AD_PORT_SELECTED
;
1412 /* the port couldn't find an aggregator - attach it to a new
1416 if (free_aggregator
) {
1417 /* assign port a new aggregator */
1418 port
->aggregator
= free_aggregator
;
1419 port
->actor_port_aggregator_identifier
=
1420 port
->aggregator
->aggregator_identifier
;
1422 /* update the new aggregator's parameters
1423 * if port was responsed from the end-user
1425 if (port
->actor_oper_port_key
& AD_DUPLEX_KEY_MASKS
)
1426 /* if port is full duplex */
1427 port
->aggregator
->is_individual
= false;
1429 port
->aggregator
->is_individual
= true;
1431 port
->aggregator
->actor_admin_aggregator_key
= port
->actor_admin_port_key
;
1432 port
->aggregator
->actor_oper_aggregator_key
= port
->actor_oper_port_key
;
1433 port
->aggregator
->partner_system
=
1434 port
->partner_oper
.system
;
1435 port
->aggregator
->partner_system_priority
=
1436 port
->partner_oper
.system_priority
;
1437 port
->aggregator
->partner_oper_aggregator_key
= port
->partner_oper
.key
;
1438 port
->aggregator
->receive_state
= 1;
1439 port
->aggregator
->transmit_state
= 1;
1440 port
->aggregator
->lag_ports
= port
;
1441 port
->aggregator
->num_of_ports
++;
1443 /* mark this port as selected */
1444 port
->sm_vars
|= AD_PORT_SELECTED
;
1446 netdev_dbg(bond
->dev
, "Port %d joined LAG %d(new LAG)\n",
1447 port
->actor_port_number
,
1448 port
->aggregator
->aggregator_identifier
);
1450 netdev_err(bond
->dev
, "Port %d (on %s) did not find a suitable aggregator\n",
1451 port
->actor_port_number
, port
->slave
->dev
->name
);
1454 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE
1455 * in all aggregator's ports, else set ready=FALSE in all
1456 * aggregator's ports
1458 __set_agg_ports_ready(port
->aggregator
,
1459 __agg_ports_are_ready(port
->aggregator
));
1461 aggregator
= __get_first_agg(port
);
1462 ad_agg_selection_logic(aggregator
, update_slave_arr
);
1464 if (!port
->aggregator
->is_active
)
1465 port
->actor_oper_port_state
&= ~AD_STATE_SYNCHRONIZATION
;
1468 /* Decide if "agg" is a better choice for the new active aggregator that
1469 * the current best, according to the ad_select policy.
1471 static struct aggregator
*ad_agg_selection_test(struct aggregator
*best
,
1472 struct aggregator
*curr
)
1474 /* 0. If no best, select current.
1476 * 1. If the current agg is not individual, and the best is
1477 * individual, select current.
1479 * 2. If current agg is individual and the best is not, keep best.
1481 * 3. Therefore, current and best are both individual or both not
1484 * 3a. If current agg partner replied, and best agg partner did not,
1487 * 3b. If current agg partner did not reply and best agg partner
1488 * did reply, keep best.
1490 * 4. Therefore, current and best both have partner replies or
1491 * both do not, so perform selection policy:
1493 * BOND_AD_COUNT: Select by count of ports. If count is equal,
1494 * select by bandwidth.
1496 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth.
1501 if (!curr
->is_individual
&& best
->is_individual
)
1504 if (curr
->is_individual
&& !best
->is_individual
)
1507 if (__agg_has_partner(curr
) && !__agg_has_partner(best
))
1510 if (!__agg_has_partner(curr
) && __agg_has_partner(best
))
1513 switch (__get_agg_selection_mode(curr
->lag_ports
)) {
1515 if (curr
->num_of_ports
> best
->num_of_ports
)
1518 if (curr
->num_of_ports
< best
->num_of_ports
)
1522 case BOND_AD_STABLE
:
1523 case BOND_AD_BANDWIDTH
:
1524 if (__get_agg_bandwidth(curr
) > __get_agg_bandwidth(best
))
1530 net_warn_ratelimited("%s: Impossible agg select mode %d\n",
1531 curr
->slave
->bond
->dev
->name
,
1532 __get_agg_selection_mode(curr
->lag_ports
));
1539 static int agg_device_up(const struct aggregator
*agg
)
1541 struct port
*port
= agg
->lag_ports
;
1546 return netif_running(port
->slave
->dev
) &&
1547 netif_carrier_ok(port
->slave
->dev
);
1551 * ad_agg_selection_logic - select an aggregation group for a team
1552 * @aggregator: the aggregator we're looking at
1553 * @update_slave_arr: Does slave array need update?
1555 * It is assumed that only one aggregator may be selected for a team.
1557 * The logic of this function is to select the aggregator according to
1558 * the ad_select policy:
1560 * BOND_AD_STABLE: select the aggregator with the most ports attached to
1561 * it, and to reselect the active aggregator only if the previous
1562 * aggregator has no more ports related to it.
1564 * BOND_AD_BANDWIDTH: select the aggregator with the highest total
1565 * bandwidth, and reselect whenever a link state change takes place or the
1566 * set of slaves in the bond changes.
1568 * BOND_AD_COUNT: select the aggregator with largest number of ports
1569 * (slaves), and reselect whenever a link state change takes place or the
1570 * set of slaves in the bond changes.
1572 * FIXME: this function MUST be called with the first agg in the bond, or
1573 * __get_active_agg() won't work correctly. This function should be better
1574 * called with the bond itself, and retrieve the first agg from it.
1576 static void ad_agg_selection_logic(struct aggregator
*agg
,
1577 bool *update_slave_arr
)
1579 struct aggregator
*best
, *active
, *origin
;
1580 struct bonding
*bond
= agg
->slave
->bond
;
1581 struct list_head
*iter
;
1582 struct slave
*slave
;
1587 active
= __get_active_agg(agg
);
1588 best
= (active
&& agg_device_up(active
)) ? active
: NULL
;
1590 bond_for_each_slave_rcu(bond
, slave
, iter
) {
1591 agg
= &(SLAVE_AD_INFO(slave
)->aggregator
);
1595 if (agg
->num_of_ports
&& agg_device_up(agg
))
1596 best
= ad_agg_selection_test(best
, agg
);
1600 __get_agg_selection_mode(best
->lag_ports
) == BOND_AD_STABLE
) {
1601 /* For the STABLE policy, don't replace the old active
1602 * aggregator if it's still active (it has an answering
1603 * partner) or if both the best and active don't have an
1604 * answering partner.
1606 if (active
&& active
->lag_ports
&&
1607 active
->lag_ports
->is_enabled
&&
1608 (__agg_has_partner(active
) ||
1609 (!__agg_has_partner(active
) &&
1610 !__agg_has_partner(best
)))) {
1611 if (!(!active
->actor_oper_aggregator_key
&&
1612 best
->actor_oper_aggregator_key
)) {
1614 active
->is_active
= 1;
1619 if (best
&& (best
== active
)) {
1621 active
->is_active
= 1;
1624 /* if there is new best aggregator, activate it */
1626 netdev_dbg(bond
->dev
, "best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1627 best
->aggregator_identifier
, best
->num_of_ports
,
1628 best
->actor_oper_aggregator_key
,
1629 best
->partner_oper_aggregator_key
,
1630 best
->is_individual
, best
->is_active
);
1631 netdev_dbg(bond
->dev
, "best ports %p slave %p %s\n",
1632 best
->lag_ports
, best
->slave
,
1633 best
->slave
? best
->slave
->dev
->name
: "NULL");
1635 bond_for_each_slave_rcu(bond
, slave
, iter
) {
1636 agg
= &(SLAVE_AD_INFO(slave
)->aggregator
);
1638 netdev_dbg(bond
->dev
, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1639 agg
->aggregator_identifier
, agg
->num_of_ports
,
1640 agg
->actor_oper_aggregator_key
,
1641 agg
->partner_oper_aggregator_key
,
1642 agg
->is_individual
, agg
->is_active
);
1645 /* check if any partner replys */
1646 if (best
->is_individual
) {
1647 net_warn_ratelimited("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n",
1649 best
->slave
->bond
->dev
->name
: "NULL");
1652 best
->is_active
= 1;
1653 netdev_dbg(bond
->dev
, "LAG %d chosen as the active LAG\n",
1654 best
->aggregator_identifier
);
1655 netdev_dbg(bond
->dev
, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1656 best
->aggregator_identifier
, best
->num_of_ports
,
1657 best
->actor_oper_aggregator_key
,
1658 best
->partner_oper_aggregator_key
,
1659 best
->is_individual
, best
->is_active
);
1661 /* disable the ports that were related to the former
1665 for (port
= active
->lag_ports
; port
;
1666 port
= port
->next_port_in_aggregator
) {
1667 __disable_port(port
);
1670 /* Slave array needs update. */
1671 *update_slave_arr
= true;
1674 /* if the selected aggregator is of join individuals
1675 * (partner_system is NULL), enable their ports
1677 active
= __get_active_agg(origin
);
1680 if (!__agg_has_partner(active
)) {
1681 for (port
= active
->lag_ports
; port
;
1682 port
= port
->next_port_in_aggregator
) {
1683 __enable_port(port
);
1690 bond_3ad_set_carrier(bond
);
1694 * ad_clear_agg - clear a given aggregator's parameters
1695 * @aggregator: the aggregator we're looking at
1697 static void ad_clear_agg(struct aggregator
*aggregator
)
1700 aggregator
->is_individual
= false;
1701 aggregator
->actor_admin_aggregator_key
= 0;
1702 aggregator
->actor_oper_aggregator_key
= 0;
1703 aggregator
->partner_system
= null_mac_addr
;
1704 aggregator
->partner_system_priority
= 0;
1705 aggregator
->partner_oper_aggregator_key
= 0;
1706 aggregator
->receive_state
= 0;
1707 aggregator
->transmit_state
= 0;
1708 aggregator
->lag_ports
= NULL
;
1709 aggregator
->is_active
= 0;
1710 aggregator
->num_of_ports
= 0;
1711 pr_debug("LAG %d was cleared\n",
1712 aggregator
->aggregator_identifier
);
1717 * ad_initialize_agg - initialize a given aggregator's parameters
1718 * @aggregator: the aggregator we're looking at
1720 static void ad_initialize_agg(struct aggregator
*aggregator
)
1723 ad_clear_agg(aggregator
);
1725 aggregator
->aggregator_mac_address
= null_mac_addr
;
1726 aggregator
->aggregator_identifier
= 0;
1727 aggregator
->slave
= NULL
;
1732 * ad_initialize_port - initialize a given port's parameters
1733 * @aggregator: the aggregator we're looking at
1734 * @lacp_fast: boolean. whether fast periodic should be used
1736 static void ad_initialize_port(struct port
*port
, int lacp_fast
)
1738 static const struct port_params tmpl
= {
1739 .system_priority
= 0xffff,
1742 .port_priority
= 0xff,
1745 static const struct lacpdu lacpdu
= {
1747 .version_number
= 0x01,
1748 .tlv_type_actor_info
= 0x01,
1749 .actor_information_length
= 0x14,
1750 .tlv_type_partner_info
= 0x02,
1751 .partner_information_length
= 0x14,
1752 .tlv_type_collector_info
= 0x03,
1753 .collector_information_length
= 0x10,
1754 .collector_max_delay
= htons(AD_COLLECTOR_MAX_DELAY
),
1758 port
->actor_port_number
= 1;
1759 port
->actor_port_priority
= 0xff;
1760 port
->actor_system
= null_mac_addr
;
1761 port
->actor_system_priority
= 0xffff;
1762 port
->actor_port_aggregator_identifier
= 0;
1764 port
->actor_admin_port_key
= 1;
1765 port
->actor_oper_port_key
= 1;
1766 port
->actor_admin_port_state
= AD_STATE_AGGREGATION
|
1767 AD_STATE_LACP_ACTIVITY
;
1768 port
->actor_oper_port_state
= AD_STATE_AGGREGATION
|
1769 AD_STATE_LACP_ACTIVITY
;
1772 port
->actor_oper_port_state
|= AD_STATE_LACP_TIMEOUT
;
1774 memcpy(&port
->partner_admin
, &tmpl
, sizeof(tmpl
));
1775 memcpy(&port
->partner_oper
, &tmpl
, sizeof(tmpl
));
1777 port
->is_enabled
= true;
1778 /* private parameters */
1779 port
->sm_vars
= AD_PORT_BEGIN
| AD_PORT_LACP_ENABLED
;
1780 port
->sm_rx_state
= 0;
1781 port
->sm_rx_timer_counter
= 0;
1782 port
->sm_periodic_state
= 0;
1783 port
->sm_periodic_timer_counter
= 0;
1784 port
->sm_mux_state
= 0;
1785 port
->sm_mux_timer_counter
= 0;
1786 port
->sm_tx_state
= 0;
1787 port
->sm_tx_timer_counter
= 0;
1789 port
->aggregator
= NULL
;
1790 port
->next_port_in_aggregator
= NULL
;
1791 port
->transaction_id
= 0;
1793 port
->sm_churn_actor_timer_counter
= 0;
1794 port
->sm_churn_actor_state
= 0;
1795 port
->churn_actor_count
= 0;
1796 port
->sm_churn_partner_timer_counter
= 0;
1797 port
->sm_churn_partner_state
= 0;
1798 port
->churn_partner_count
= 0;
1800 memcpy(&port
->lacpdu
, &lacpdu
, sizeof(lacpdu
));
1805 * ad_enable_collecting_distributing - enable a port's transmit/receive
1806 * @port: the port we're looking at
1807 * @update_slave_arr: Does slave array need update?
1809 * Enable @port if it's in an active aggregator
1811 static void ad_enable_collecting_distributing(struct port
*port
,
1812 bool *update_slave_arr
)
1814 if (port
->aggregator
->is_active
) {
1815 pr_debug("Enabling port %d(LAG %d)\n",
1816 port
->actor_port_number
,
1817 port
->aggregator
->aggregator_identifier
);
1818 __enable_port(port
);
1819 /* Slave array needs update */
1820 *update_slave_arr
= true;
1825 * ad_disable_collecting_distributing - disable a port's transmit/receive
1826 * @port: the port we're looking at
1827 * @update_slave_arr: Does slave array need update?
1829 static void ad_disable_collecting_distributing(struct port
*port
,
1830 bool *update_slave_arr
)
1832 if (port
->aggregator
&&
1833 !MAC_ADDRESS_EQUAL(&(port
->aggregator
->partner_system
),
1834 &(null_mac_addr
))) {
1835 pr_debug("Disabling port %d(LAG %d)\n",
1836 port
->actor_port_number
,
1837 port
->aggregator
->aggregator_identifier
);
1838 __disable_port(port
);
1839 /* Slave array needs an update */
1840 *update_slave_arr
= true;
1845 * ad_marker_info_received - handle receive of a Marker information frame
1846 * @marker_info: Marker info received
1847 * @port: the port we're looking at
1849 static void ad_marker_info_received(struct bond_marker
*marker_info
,
1852 struct bond_marker marker
;
1854 /* copy the received marker data to the response marker */
1855 memcpy(&marker
, marker_info
, sizeof(struct bond_marker
));
1856 /* change the marker subtype to marker response */
1857 marker
.tlv_type
= AD_MARKER_RESPONSE_SUBTYPE
;
1859 /* send the marker response */
1860 if (ad_marker_send(port
, &marker
) >= 0) {
1861 pr_debug("Sent Marker Response on port %d\n",
1862 port
->actor_port_number
);
1867 * ad_marker_response_received - handle receive of a marker response frame
1868 * @marker: marker PDU received
1869 * @port: the port we're looking at
1871 * This function does nothing since we decided not to implement send and handle
1872 * response for marker PDU's, in this stage, but only to respond to marker
1875 static void ad_marker_response_received(struct bond_marker
*marker
,
1880 /* DO NOTHING, SINCE WE DECIDED NOT TO IMPLEMENT THIS FEATURE FOR NOW */
1883 /* ========= AD exported functions to the main bonding code ========= */
1885 /* Check aggregators status in team every T seconds */
1886 #define AD_AGGREGATOR_SELECTION_TIMER 8
1889 * bond_3ad_initiate_agg_selection - initate aggregator selection
1890 * @bond: bonding struct
1892 * Set the aggregation selection timer, to initiate an agg selection in
1893 * the very near future. Called during first initialization, and during
1894 * any down to up transitions of the bond.
1896 void bond_3ad_initiate_agg_selection(struct bonding
*bond
, int timeout
)
1898 BOND_AD_INFO(bond
).agg_select_timer
= timeout
;
1902 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures
1903 * @bond: bonding struct to work on
1904 * @tick_resolution: tick duration (millisecond resolution)
1906 * Can be called only after the mac address of the bond is set.
1908 void bond_3ad_initialize(struct bonding
*bond
, u16 tick_resolution
)
1910 /* check that the bond is not initialized yet */
1911 if (!MAC_ADDRESS_EQUAL(&(BOND_AD_INFO(bond
).system
.sys_mac_addr
),
1912 bond
->dev
->dev_addr
)) {
1914 BOND_AD_INFO(bond
).aggregator_identifier
= 0;
1916 BOND_AD_INFO(bond
).system
.sys_priority
= 0xFFFF;
1917 BOND_AD_INFO(bond
).system
.sys_mac_addr
= *((struct mac_addr
*)bond
->dev
->dev_addr
);
1919 /* initialize how many times this module is called in one
1920 * second (should be about every 100ms)
1922 ad_ticks_per_sec
= tick_resolution
;
1924 bond_3ad_initiate_agg_selection(bond
,
1925 AD_AGGREGATOR_SELECTION_TIMER
*
1931 * bond_3ad_bind_slave - initialize a slave's port
1932 * @slave: slave struct to work on
1934 * Returns: 0 on success
1937 void bond_3ad_bind_slave(struct slave
*slave
)
1939 struct bonding
*bond
= bond_get_bond_by_slave(slave
);
1941 struct aggregator
*aggregator
;
1943 /* check that the slave has not been initialized yet. */
1944 if (SLAVE_AD_INFO(slave
)->port
.slave
!= slave
) {
1946 /* port initialization */
1947 port
= &(SLAVE_AD_INFO(slave
)->port
);
1949 ad_initialize_port(port
, bond
->params
.lacp_fast
);
1951 port
->slave
= slave
;
1952 port
->actor_port_number
= SLAVE_AD_INFO(slave
)->id
;
1953 /* key is determined according to the link speed, duplex and user key(which
1954 * is yet not supported)
1956 port
->actor_admin_port_key
= 0;
1957 port
->actor_admin_port_key
|= __get_duplex(port
);
1958 port
->actor_admin_port_key
|= (__get_link_speed(port
) << 1);
1959 port
->actor_oper_port_key
= port
->actor_admin_port_key
;
1960 /* if the port is not full duplex, then the port should be not
1963 if (!(port
->actor_oper_port_key
& AD_DUPLEX_KEY_MASKS
))
1964 port
->sm_vars
&= ~AD_PORT_LACP_ENABLED
;
1965 /* actor system is the bond's system */
1966 port
->actor_system
= BOND_AD_INFO(bond
).system
.sys_mac_addr
;
1967 /* tx timer(to verify that no more than MAX_TX_IN_SECOND
1968 * lacpdu's are sent in one second)
1970 port
->sm_tx_timer_counter
= ad_ticks_per_sec
/AD_MAX_TX_IN_SECOND
;
1971 port
->aggregator
= NULL
;
1972 port
->next_port_in_aggregator
= NULL
;
1974 __disable_port(port
);
1976 /* aggregator initialization */
1977 aggregator
= &(SLAVE_AD_INFO(slave
)->aggregator
);
1979 ad_initialize_agg(aggregator
);
1981 aggregator
->aggregator_mac_address
= *((struct mac_addr
*)bond
->dev
->dev_addr
);
1982 aggregator
->aggregator_identifier
= ++BOND_AD_INFO(bond
).aggregator_identifier
;
1983 aggregator
->slave
= slave
;
1984 aggregator
->is_active
= 0;
1985 aggregator
->num_of_ports
= 0;
1990 * bond_3ad_unbind_slave - deinitialize a slave's port
1991 * @slave: slave struct to work on
1993 * Search for the aggregator that is related to this port, remove the
1994 * aggregator and assign another aggregator for other port related to it
1995 * (if any), and remove the port.
1997 void bond_3ad_unbind_slave(struct slave
*slave
)
1999 struct port
*port
, *prev_port
, *temp_port
;
2000 struct aggregator
*aggregator
, *new_aggregator
, *temp_aggregator
;
2001 int select_new_active_agg
= 0;
2002 struct bonding
*bond
= slave
->bond
;
2003 struct slave
*slave_iter
;
2004 struct list_head
*iter
;
2005 bool dummy_slave_update
; /* Ignore this value as caller updates array */
2007 /* Sync against bond_3ad_state_machine_handler() */
2008 spin_lock_bh(&bond
->mode_lock
);
2009 aggregator
= &(SLAVE_AD_INFO(slave
)->aggregator
);
2010 port
= &(SLAVE_AD_INFO(slave
)->port
);
2012 /* if slave is null, the whole port is not initialized */
2014 netdev_warn(bond
->dev
, "Trying to unbind an uninitialized port on %s\n",
2019 netdev_dbg(bond
->dev
, "Unbinding Link Aggregation Group %d\n",
2020 aggregator
->aggregator_identifier
);
2022 /* Tell the partner that this port is not suitable for aggregation */
2023 port
->actor_oper_port_state
&= ~AD_STATE_AGGREGATION
;
2024 __update_lacpdu_from_port(port
);
2025 ad_lacpdu_send(port
);
2027 /* check if this aggregator is occupied */
2028 if (aggregator
->lag_ports
) {
2029 /* check if there are other ports related to this aggregator
2030 * except the port related to this slave(thats ensure us that
2031 * there is a reason to search for new aggregator, and that we
2034 if ((aggregator
->lag_ports
!= port
) ||
2035 (aggregator
->lag_ports
->next_port_in_aggregator
)) {
2036 /* find new aggregator for the related port(s) */
2037 bond_for_each_slave(bond
, slave_iter
, iter
) {
2038 new_aggregator
= &(SLAVE_AD_INFO(slave_iter
)->aggregator
);
2039 /* if the new aggregator is empty, or it is
2040 * connected to our port only
2042 if (!new_aggregator
->lag_ports
||
2043 ((new_aggregator
->lag_ports
== port
) &&
2044 !new_aggregator
->lag_ports
->next_port_in_aggregator
))
2048 new_aggregator
= NULL
;
2050 /* if new aggregator found, copy the aggregator's
2051 * parameters and connect the related lag_ports to the
2054 if ((new_aggregator
) && ((!new_aggregator
->lag_ports
) || ((new_aggregator
->lag_ports
== port
) && !new_aggregator
->lag_ports
->next_port_in_aggregator
))) {
2055 netdev_dbg(bond
->dev
, "Some port(s) related to LAG %d - replacing with LAG %d\n",
2056 aggregator
->aggregator_identifier
,
2057 new_aggregator
->aggregator_identifier
);
2059 if ((new_aggregator
->lag_ports
== port
) &&
2060 new_aggregator
->is_active
) {
2061 netdev_info(bond
->dev
, "Removing an active aggregator\n");
2062 select_new_active_agg
= 1;
2065 new_aggregator
->is_individual
= aggregator
->is_individual
;
2066 new_aggregator
->actor_admin_aggregator_key
= aggregator
->actor_admin_aggregator_key
;
2067 new_aggregator
->actor_oper_aggregator_key
= aggregator
->actor_oper_aggregator_key
;
2068 new_aggregator
->partner_system
= aggregator
->partner_system
;
2069 new_aggregator
->partner_system_priority
= aggregator
->partner_system_priority
;
2070 new_aggregator
->partner_oper_aggregator_key
= aggregator
->partner_oper_aggregator_key
;
2071 new_aggregator
->receive_state
= aggregator
->receive_state
;
2072 new_aggregator
->transmit_state
= aggregator
->transmit_state
;
2073 new_aggregator
->lag_ports
= aggregator
->lag_ports
;
2074 new_aggregator
->is_active
= aggregator
->is_active
;
2075 new_aggregator
->num_of_ports
= aggregator
->num_of_ports
;
2077 /* update the information that is written on
2078 * the ports about the aggregator
2080 for (temp_port
= aggregator
->lag_ports
; temp_port
;
2081 temp_port
= temp_port
->next_port_in_aggregator
) {
2082 temp_port
->aggregator
= new_aggregator
;
2083 temp_port
->actor_port_aggregator_identifier
= new_aggregator
->aggregator_identifier
;
2086 ad_clear_agg(aggregator
);
2088 if (select_new_active_agg
)
2089 ad_agg_selection_logic(__get_first_agg(port
),
2090 &dummy_slave_update
);
2092 netdev_warn(bond
->dev
, "unbinding aggregator, and could not find a new aggregator for its ports\n");
2095 /* in case that the only port related to this
2096 * aggregator is the one we want to remove
2098 select_new_active_agg
= aggregator
->is_active
;
2099 ad_clear_agg(aggregator
);
2100 if (select_new_active_agg
) {
2101 netdev_info(bond
->dev
, "Removing an active aggregator\n");
2102 /* select new active aggregator */
2103 temp_aggregator
= __get_first_agg(port
);
2104 if (temp_aggregator
)
2105 ad_agg_selection_logic(temp_aggregator
,
2106 &dummy_slave_update
);
2111 netdev_dbg(bond
->dev
, "Unbinding port %d\n", port
->actor_port_number
);
2113 /* find the aggregator that this port is connected to */
2114 bond_for_each_slave(bond
, slave_iter
, iter
) {
2115 temp_aggregator
= &(SLAVE_AD_INFO(slave_iter
)->aggregator
);
2117 /* search the port in the aggregator's related ports */
2118 for (temp_port
= temp_aggregator
->lag_ports
; temp_port
;
2119 prev_port
= temp_port
,
2120 temp_port
= temp_port
->next_port_in_aggregator
) {
2121 if (temp_port
== port
) {
2122 /* the aggregator found - detach the port from
2126 prev_port
->next_port_in_aggregator
= temp_port
->next_port_in_aggregator
;
2128 temp_aggregator
->lag_ports
= temp_port
->next_port_in_aggregator
;
2129 temp_aggregator
->num_of_ports
--;
2130 if (temp_aggregator
->num_of_ports
== 0) {
2131 select_new_active_agg
= temp_aggregator
->is_active
;
2132 ad_clear_agg(temp_aggregator
);
2133 if (select_new_active_agg
) {
2134 netdev_info(bond
->dev
, "Removing an active aggregator\n");
2135 /* select new active aggregator */
2136 ad_agg_selection_logic(__get_first_agg(port
),
2137 &dummy_slave_update
);
2147 spin_unlock_bh(&bond
->mode_lock
);
2151 * bond_3ad_state_machine_handler - handle state machines timeout
2152 * @bond: bonding struct to work on
2154 * The state machine handling concept in this module is to check every tick
2155 * which state machine should operate any function. The execution order is
2156 * round robin, so when we have an interaction between state machines, the
2157 * reply of one to each other might be delayed until next tick.
2159 * This function also complete the initialization when the agg_select_timer
2160 * times out, and it selects an aggregator for the ports that are yet not
2161 * related to any aggregator, and selects the active aggregator for a bond.
2163 void bond_3ad_state_machine_handler(struct work_struct
*work
)
2165 struct bonding
*bond
= container_of(work
, struct bonding
,
2167 struct aggregator
*aggregator
;
2168 struct list_head
*iter
;
2169 struct slave
*slave
;
2171 bool should_notify_rtnl
= BOND_SLAVE_NOTIFY_LATER
;
2172 bool update_slave_arr
= false;
2174 /* Lock to protect data accessed by all (e.g., port->sm_vars) and
2175 * against running with bond_3ad_unbind_slave. ad_rx_machine may run
2176 * concurrently due to incoming LACPDU as well.
2178 spin_lock_bh(&bond
->mode_lock
);
2181 /* check if there are any slaves */
2182 if (!bond_has_slaves(bond
))
2185 /* check if agg_select_timer timer after initialize is timed out */
2186 if (BOND_AD_INFO(bond
).agg_select_timer
&&
2187 !(--BOND_AD_INFO(bond
).agg_select_timer
)) {
2188 slave
= bond_first_slave_rcu(bond
);
2189 port
= slave
? &(SLAVE_AD_INFO(slave
)->port
) : NULL
;
2191 /* select the active aggregator for the bond */
2194 net_warn_ratelimited("%s: Warning: bond's first port is uninitialized\n",
2199 aggregator
= __get_first_agg(port
);
2200 ad_agg_selection_logic(aggregator
, &update_slave_arr
);
2202 bond_3ad_set_carrier(bond
);
2205 /* for each port run the state machines */
2206 bond_for_each_slave_rcu(bond
, slave
, iter
) {
2207 port
= &(SLAVE_AD_INFO(slave
)->port
);
2209 net_warn_ratelimited("%s: Warning: Found an uninitialized port\n",
2214 ad_rx_machine(NULL
, port
);
2215 ad_periodic_machine(port
);
2216 ad_port_selection_logic(port
, &update_slave_arr
);
2217 ad_mux_machine(port
, &update_slave_arr
);
2218 ad_tx_machine(port
);
2219 ad_churn_machine(port
);
2221 /* turn off the BEGIN bit, since we already handled it */
2222 if (port
->sm_vars
& AD_PORT_BEGIN
)
2223 port
->sm_vars
&= ~AD_PORT_BEGIN
;
2227 bond_for_each_slave_rcu(bond
, slave
, iter
) {
2228 if (slave
->should_notify
) {
2229 should_notify_rtnl
= BOND_SLAVE_NOTIFY_NOW
;
2234 spin_unlock_bh(&bond
->mode_lock
);
2236 if (update_slave_arr
)
2237 bond_slave_arr_work_rearm(bond
, 0);
2239 if (should_notify_rtnl
&& rtnl_trylock()) {
2240 bond_slave_state_notify(bond
);
2243 queue_delayed_work(bond
->wq
, &bond
->ad_work
, ad_delta_in_ticks
);
2247 * bond_3ad_rx_indication - handle a received frame
2248 * @lacpdu: received lacpdu
2249 * @slave: slave struct to work on
2250 * @length: length of the data received
2252 * It is assumed that frames that were sent on this NIC don't returned as new
2253 * received frames (loopback). Since only the payload is given to this
2254 * function, it check for loopback.
2256 static int bond_3ad_rx_indication(struct lacpdu
*lacpdu
, struct slave
*slave
,
2260 int ret
= RX_HANDLER_ANOTHER
;
2262 if (length
>= sizeof(struct lacpdu
)) {
2264 port
= &(SLAVE_AD_INFO(slave
)->port
);
2267 net_warn_ratelimited("%s: Warning: port of slave %s is uninitialized\n",
2268 slave
->dev
->name
, slave
->bond
->dev
->name
);
2272 switch (lacpdu
->subtype
) {
2273 case AD_TYPE_LACPDU
:
2274 ret
= RX_HANDLER_CONSUMED
;
2275 netdev_dbg(slave
->bond
->dev
,
2276 "Received LACPDU on port %d slave %s\n",
2277 port
->actor_port_number
,
2279 /* Protect against concurrent state machines */
2280 spin_lock(&slave
->bond
->mode_lock
);
2281 ad_rx_machine(lacpdu
, port
);
2282 spin_unlock(&slave
->bond
->mode_lock
);
2285 case AD_TYPE_MARKER
:
2286 ret
= RX_HANDLER_CONSUMED
;
2287 /* No need to convert fields to Little Endian since we
2288 * don't use the marker's fields.
2291 switch (((struct bond_marker
*)lacpdu
)->tlv_type
) {
2292 case AD_MARKER_INFORMATION_SUBTYPE
:
2293 netdev_dbg(slave
->bond
->dev
, "Received Marker Information on port %d\n",
2294 port
->actor_port_number
);
2295 ad_marker_info_received((struct bond_marker
*)lacpdu
, port
);
2298 case AD_MARKER_RESPONSE_SUBTYPE
:
2299 netdev_dbg(slave
->bond
->dev
, "Received Marker Response on port %d\n",
2300 port
->actor_port_number
);
2301 ad_marker_response_received((struct bond_marker
*)lacpdu
, port
);
2305 netdev_dbg(slave
->bond
->dev
, "Received an unknown Marker subtype on slot %d\n",
2306 port
->actor_port_number
);
2314 * bond_3ad_adapter_speed_changed - handle a slave's speed change indication
2315 * @slave: slave struct to work on
2317 * Handle reselection of aggregator (if needed) for this port.
2319 void bond_3ad_adapter_speed_changed(struct slave
*slave
)
2323 port
= &(SLAVE_AD_INFO(slave
)->port
);
2325 /* if slave is null, the whole port is not initialized */
2327 netdev_warn(slave
->bond
->dev
, "speed changed for uninitialized port on %s\n",
2332 spin_lock_bh(&slave
->bond
->mode_lock
);
2334 port
->actor_admin_port_key
&= ~AD_SPEED_KEY_MASKS
;
2335 port
->actor_oper_port_key
= port
->actor_admin_port_key
|=
2336 (__get_link_speed(port
) << 1);
2337 netdev_dbg(slave
->bond
->dev
, "Port %d changed speed\n", port
->actor_port_number
);
2338 /* there is no need to reselect a new aggregator, just signal the
2339 * state machines to reinitialize
2341 port
->sm_vars
|= AD_PORT_BEGIN
;
2343 spin_unlock_bh(&slave
->bond
->mode_lock
);
2347 * bond_3ad_adapter_duplex_changed - handle a slave's duplex change indication
2348 * @slave: slave struct to work on
2350 * Handle reselection of aggregator (if needed) for this port.
2352 void bond_3ad_adapter_duplex_changed(struct slave
*slave
)
2356 port
= &(SLAVE_AD_INFO(slave
)->port
);
2358 /* if slave is null, the whole port is not initialized */
2360 netdev_warn(slave
->bond
->dev
, "duplex changed for uninitialized port on %s\n",
2365 spin_lock_bh(&slave
->bond
->mode_lock
);
2367 port
->actor_admin_port_key
&= ~AD_DUPLEX_KEY_MASKS
;
2368 port
->actor_oper_port_key
= port
->actor_admin_port_key
|=
2370 netdev_dbg(slave
->bond
->dev
, "Port %d slave %s changed duplex\n",
2371 port
->actor_port_number
, slave
->dev
->name
);
2372 if (port
->actor_oper_port_key
& AD_DUPLEX_KEY_MASKS
)
2373 port
->sm_vars
|= AD_PORT_LACP_ENABLED
;
2374 /* there is no need to reselect a new aggregator, just signal the
2375 * state machines to reinitialize
2377 port
->sm_vars
|= AD_PORT_BEGIN
;
2379 spin_unlock_bh(&slave
->bond
->mode_lock
);
2383 * bond_3ad_handle_link_change - handle a slave's link status change indication
2384 * @slave: slave struct to work on
2385 * @status: whether the link is now up or down
2387 * Handle reselection of aggregator (if needed) for this port.
2389 void bond_3ad_handle_link_change(struct slave
*slave
, char link
)
2393 port
= &(SLAVE_AD_INFO(slave
)->port
);
2395 /* if slave is null, the whole port is not initialized */
2397 netdev_warn(slave
->bond
->dev
, "link status changed for uninitialized port on %s\n",
2402 spin_lock_bh(&slave
->bond
->mode_lock
);
2403 /* on link down we are zeroing duplex and speed since
2404 * some of the adaptors(ce1000.lan) report full duplex/speed
2405 * instead of N/A(duplex) / 0(speed).
2407 * on link up we are forcing recheck on the duplex and speed since
2408 * some of he adaptors(ce1000.lan) report.
2410 if (link
== BOND_LINK_UP
) {
2411 port
->is_enabled
= true;
2412 port
->actor_admin_port_key
&= ~AD_DUPLEX_KEY_MASKS
;
2413 port
->actor_oper_port_key
= port
->actor_admin_port_key
|=
2415 port
->actor_admin_port_key
&= ~AD_SPEED_KEY_MASKS
;
2416 port
->actor_oper_port_key
= port
->actor_admin_port_key
|=
2417 (__get_link_speed(port
) << 1);
2418 if (port
->actor_oper_port_key
& AD_DUPLEX_KEY_MASKS
)
2419 port
->sm_vars
|= AD_PORT_LACP_ENABLED
;
2421 /* link has failed */
2422 port
->is_enabled
= false;
2423 port
->actor_admin_port_key
&= ~AD_DUPLEX_KEY_MASKS
;
2424 port
->actor_oper_port_key
= (port
->actor_admin_port_key
&=
2425 ~AD_SPEED_KEY_MASKS
);
2426 port
->sm_vars
&= ~AD_PORT_LACP_ENABLED
;
2428 netdev_dbg(slave
->bond
->dev
, "Port %d changed link status to %s\n",
2429 port
->actor_port_number
,
2430 link
== BOND_LINK_UP
? "UP" : "DOWN");
2431 /* there is no need to reselect a new aggregator, just signal the
2432 * state machines to reinitialize
2434 port
->sm_vars
|= AD_PORT_BEGIN
;
2436 spin_unlock_bh(&slave
->bond
->mode_lock
);
2438 /* RTNL is held and mode_lock is released so it's safe
2439 * to update slave_array here.
2441 bond_update_slave_arr(slave
->bond
, NULL
);
2445 * bond_3ad_set_carrier - set link state for bonding master
2446 * @bond - bonding structure
2448 * if we have an active aggregator, we're up, if not, we're down.
2449 * Presumes that we cannot have an active aggregator if there are
2450 * no slaves with link up.
2452 * This behavior complies with IEEE 802.3 section 43.3.9.
2454 * Called by bond_set_carrier(). Return zero if carrier state does not
2455 * change, nonzero if it does.
2457 int bond_3ad_set_carrier(struct bonding
*bond
)
2459 struct aggregator
*active
;
2460 struct slave
*first_slave
;
2464 first_slave
= bond_first_slave_rcu(bond
);
2469 active
= __get_active_agg(&(SLAVE_AD_INFO(first_slave
)->aggregator
));
2471 /* are enough slaves available to consider link up? */
2472 if (active
->num_of_ports
< bond
->params
.min_links
) {
2473 if (netif_carrier_ok(bond
->dev
)) {
2474 netif_carrier_off(bond
->dev
);
2477 } else if (!netif_carrier_ok(bond
->dev
)) {
2478 netif_carrier_on(bond
->dev
);
2481 } else if (netif_carrier_ok(bond
->dev
)) {
2482 netif_carrier_off(bond
->dev
);
2490 * __bond_3ad_get_active_agg_info - get information of the active aggregator
2491 * @bond: bonding struct to work on
2492 * @ad_info: ad_info struct to fill with the bond's info
2494 * Returns: 0 on success
2497 int __bond_3ad_get_active_agg_info(struct bonding
*bond
,
2498 struct ad_info
*ad_info
)
2500 struct aggregator
*aggregator
= NULL
;
2501 struct list_head
*iter
;
2502 struct slave
*slave
;
2505 bond_for_each_slave_rcu(bond
, slave
, iter
) {
2506 port
= &(SLAVE_AD_INFO(slave
)->port
);
2507 if (port
->aggregator
&& port
->aggregator
->is_active
) {
2508 aggregator
= port
->aggregator
;
2516 ad_info
->aggregator_id
= aggregator
->aggregator_identifier
;
2517 ad_info
->ports
= aggregator
->num_of_ports
;
2518 ad_info
->actor_key
= aggregator
->actor_oper_aggregator_key
;
2519 ad_info
->partner_key
= aggregator
->partner_oper_aggregator_key
;
2520 ether_addr_copy(ad_info
->partner_system
,
2521 aggregator
->partner_system
.mac_addr_value
);
/* RCU-protected wrapper: fills @ad_info from the bond's active aggregator
 * and hands back the result of __bond_3ad_get_active_agg_info() unchanged.
 */
int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info)
{
	int status;

	rcu_read_lock();
	status = __bond_3ad_get_active_agg_info(bond, ad_info);
	rcu_read_unlock();

	return status;
}
2536 int bond_3ad_lacpdu_recv(const struct sk_buff
*skb
, struct bonding
*bond
,
2537 struct slave
*slave
)
2539 struct lacpdu
*lacpdu
, _lacpdu
;
2541 if (skb
->protocol
!= PKT_TYPE_LACPDU
)
2542 return RX_HANDLER_ANOTHER
;
2544 if (!MAC_ADDRESS_EQUAL(eth_hdr(skb
)->h_dest
, lacpdu_mcast_addr
))
2545 return RX_HANDLER_ANOTHER
;
2547 lacpdu
= skb_header_pointer(skb
, 0, sizeof(_lacpdu
), &_lacpdu
);
2549 return RX_HANDLER_ANOTHER
;
2551 return bond_3ad_rx_indication(lacpdu
, slave
, skb
->len
);
2555 * bond_3ad_update_lacp_rate - change the lacp rate
2556 * @bond - bonding struct
2558 * When modify lacp_rate parameter via sysfs,
2559 * update actor_oper_port_state of each port.
2561 * Hold bond->mode_lock,
2562 * so we can modify port->actor_oper_port_state,
2563 * no matter bond is up or down.
2565 void bond_3ad_update_lacp_rate(struct bonding
*bond
)
2567 struct port
*port
= NULL
;
2568 struct list_head
*iter
;
2569 struct slave
*slave
;
2572 lacp_fast
= bond
->params
.lacp_fast
;
2573 spin_lock_bh(&bond
->mode_lock
);
2574 bond_for_each_slave(bond
, slave
, iter
) {
2575 port
= &(SLAVE_AD_INFO(slave
)->port
);
2577 port
->actor_oper_port_state
|= AD_STATE_LACP_TIMEOUT
;
2579 port
->actor_oper_port_state
&= ~AD_STATE_LACP_TIMEOUT
;
2581 spin_unlock_bh(&bond
->mode_lock
);