2 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms of the GNU General Public License as published by the Free
6 * Software Foundation; either version 2 of the License, or (at your option)
9 * This program is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
14 * You should have received a copy of the GNU General Public License along with
15 * this program; if not, write to the Free Software Foundation, Inc., 59
16 * Temple Place - Suite 330, Boston, MA 02111-1307, USA.
18 * The full GNU General Public License is included in this distribution in the
19 * file called LICENSE.
23 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
25 #include <linux/skbuff.h>
26 #include <linux/if_ether.h>
27 #include <linux/netdevice.h>
28 #include <linux/spinlock.h>
29 #include <linux/ethtool.h>
30 #include <linux/etherdevice.h>
31 #include <linux/if_bonding.h>
32 #include <linux/pkt_sched.h>
33 #include <net/net_namespace.h>
/* General definitions */
#define AD_SHORT_TIMEOUT           1
#define AD_LONG_TIMEOUT            0
#define AD_STANDBY                 0x2
#define AD_MAX_TX_IN_SECOND        3
#define AD_COLLECTOR_MAX_DELAY     0

/* Timer definitions (43.4.4 in the 802.3ad standard) */
#define AD_FAST_PERIODIC_TIME      1
#define AD_SLOW_PERIODIC_TIME      30
/* The two timeouts below are three periodic intervals each. */
#define AD_SHORT_TIMEOUT_TIME      (3*AD_FAST_PERIODIC_TIME)
#define AD_LONG_TIMEOUT_TIME       (3*AD_SLOW_PERIODIC_TIME)
#define AD_CHURN_DETECTION_TIME    60
#define AD_AGGREGATE_WAIT_TIME     2

/* Port state definitions (43.4.2.2 in the 802.3ad standard) */
#define AD_STATE_LACP_ACTIVITY   0x1
#define AD_STATE_LACP_TIMEOUT    0x2
#define AD_STATE_AGGREGATION     0x4
#define AD_STATE_SYNCHRONIZATION 0x8
#define AD_STATE_COLLECTING      0x10
#define AD_STATE_DISTRIBUTING    0x20
#define AD_STATE_DEFAULTED       0x40
#define AD_STATE_EXPIRED         0x80

/* Port Variables definitions used by the State Machines (43.4.7 in the
 * 802.3ad standard); these are bit flags kept in port->sm_vars.
 */
#define AD_PORT_BEGIN           0x1
#define AD_PORT_LACP_ENABLED    0x2
#define AD_PORT_ACTOR_CHURN     0x4
#define AD_PORT_PARTNER_CHURN   0x8
#define AD_PORT_READY           0x10
#define AD_PORT_READY_N         0x20
#define AD_PORT_MATCHED         0x40
#define AD_PORT_STANDBY         0x80
#define AD_PORT_SELECTED        0x100
#define AD_PORT_MOVED           0x200

/* Port Key definitions
 * key is determined according to the link speed, duplex and
 * user key (which is not yet supported)
 * --------------------------------------------------------------
 * Port key :	| User key	| Speed		| Duplex	|
 * --------------------------------------------------------------
 * Per the masks below: bit 0 holds duplex, bits 1-5 hold speed and
 * bits 6-15 hold the user key.
 */
#define  AD_DUPLEX_KEY_BITS    0x1
#define  AD_SPEED_KEY_BITS     0x3E
#define  AD_USER_KEY_BITS      0xFFC0

/* Link speed values, one bit per supported speed */
#define     AD_LINK_SPEED_BITMASK_1MBPS       0x1
#define     AD_LINK_SPEED_BITMASK_10MBPS      0x2
#define     AD_LINK_SPEED_BITMASK_100MBPS     0x4
#define     AD_LINK_SPEED_BITMASK_1000MBPS    0x8
#define     AD_LINK_SPEED_BITMASK_10000MBPS   0x10
/* Compare two MAC addresses; evaluates to the result of
 * ether_addr_equal_64bits() on both operands cast to byte pointers.
 *
 * The arguments are parenthesized so that an expression argument such as
 * "ptr + n" is cast as a whole rather than having the cast bind to "ptr".
 *
 * NOTE(review): ether_addr_equal_64bits() is documented as reading 8 bytes
 * from each operand - confirm every caller passes an address followed by at
 * least 2 readable bytes.
 */
#define MAC_ADDRESS_EQUAL(A, B)	\
	ether_addr_equal_64bits((const u8 *)(A), (const u8 *)(B))
98 static struct mac_addr null_mac_addr
= { { 0, 0, 0, 0, 0, 0 } };
99 static u16 ad_ticks_per_sec
;
100 static const int ad_delta_in_ticks
= (AD_TIMER_INTERVAL
* HZ
) / 1000;
102 static const u8 lacpdu_mcast_addr
[ETH_ALEN
] = MULTICAST_LACPDU_ADDR
;
/* ================= main 802.3ad protocol functions ================== */
/* Forward declarations for the file-local protocol routines. */
static int ad_lacpdu_send(struct port *port);
static int ad_marker_send(struct port *port, struct bond_marker *marker);
static void ad_mux_machine(struct port *port);
static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port);
static void ad_tx_machine(struct port *port);
static void ad_periodic_machine(struct port *port);
static void ad_port_selection_logic(struct port *port);
static void ad_agg_selection_logic(struct aggregator *aggregator);
static void ad_clear_agg(struct aggregator *aggregator);
static void ad_initialize_agg(struct aggregator *aggregator);
static void ad_initialize_port(struct port *port, int lacp_fast);
static void ad_enable_collecting_distributing(struct port *port);
static void ad_disable_collecting_distributing(struct port *port);
118 static void ad_marker_info_received(struct bond_marker
*marker_info
,
120 static void ad_marker_response_received(struct bond_marker
*marker
,
124 /* ================= api to bonding and kernel code ================== */
127 * __get_bond_by_port - get the port's bonding struct
128 * @port: the port we're looking at
130 * Return @port's bonding struct, or %NULL if it can't be found.
132 static inline struct bonding
*__get_bond_by_port(struct port
*port
)
134 if (port
->slave
== NULL
)
137 return bond_get_bond_by_slave(port
->slave
);
141 * __get_first_agg - get the first aggregator in the bond
142 * @port: the port whose bond we're looking at
144 * Return the aggregator of the first slave in @bond, or %NULL if it can't be
146 * The caller must hold RCU or RTNL lock.
148 static inline struct aggregator
*__get_first_agg(struct port
*port
)
150 struct bonding
*bond
= __get_bond_by_port(port
);
151 struct slave
*first_slave
;
152 struct aggregator
*agg
;
154 /* If there's no bond for this port, or bond has no slaves */
159 first_slave
= bond_first_slave_rcu(bond
);
160 agg
= first_slave
? &(SLAVE_AD_INFO(first_slave
).aggregator
) : NULL
;
167 * __agg_has_partner - see if we have a partner
168 * @agg: the agregator we're looking at
170 * Return nonzero if aggregator has a partner (denoted by a non-zero ether
171 * address for the partner). Return 0 if not.
173 static inline int __agg_has_partner(struct aggregator
*agg
)
175 return !is_zero_ether_addr(agg
->partner_system
.mac_addr_value
);
179 * __disable_port - disable the port's slave
180 * @port: the port we're looking at
182 static inline void __disable_port(struct port
*port
)
184 bond_set_slave_inactive_flags(port
->slave
);
188 * __enable_port - enable the port's slave, if it's up
189 * @port: the port we're looking at
191 static inline void __enable_port(struct port
*port
)
193 struct slave
*slave
= port
->slave
;
195 if ((slave
->link
== BOND_LINK_UP
) && IS_UP(slave
->dev
))
196 bond_set_slave_active_flags(slave
);
200 * __port_is_enabled - check if the port's slave is in active state
201 * @port: the port we're looking at
203 static inline int __port_is_enabled(struct port
*port
)
205 return bond_is_active_slave(port
->slave
);
209 * __get_agg_selection_mode - get the aggregator selection mode
210 * @port: the port we're looking at
212 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT.
214 static inline u32
__get_agg_selection_mode(struct port
*port
)
216 struct bonding
*bond
= __get_bond_by_port(port
);
219 return BOND_AD_STABLE
;
221 return bond
->params
.ad_select
;
225 * __check_agg_selection_timer - check if the selection timer has expired
226 * @port: the port we're looking at
228 static inline int __check_agg_selection_timer(struct port
*port
)
230 struct bonding
*bond
= __get_bond_by_port(port
);
235 return BOND_AD_INFO(bond
).agg_select_timer
? 1 : 0;
239 * __get_state_machine_lock - lock the port's state machines
240 * @port: the port we're looking at
242 static inline void __get_state_machine_lock(struct port
*port
)
244 spin_lock_bh(&(SLAVE_AD_INFO(port
->slave
).state_machine_lock
));
248 * __release_state_machine_lock - unlock the port's state machines
249 * @port: the port we're looking at
251 static inline void __release_state_machine_lock(struct port
*port
)
253 spin_unlock_bh(&(SLAVE_AD_INFO(port
->slave
).state_machine_lock
));
257 * __get_link_speed - get a port's speed
258 * @port: the port we're looking at
260 * Return @port's speed in 802.3ad bitmask format. i.e. one of:
262 * %AD_LINK_SPEED_BITMASK_10MBPS,
263 * %AD_LINK_SPEED_BITMASK_100MBPS,
264 * %AD_LINK_SPEED_BITMASK_1000MBPS,
265 * %AD_LINK_SPEED_BITMASK_10000MBPS
267 static u16
__get_link_speed(struct port
*port
)
269 struct slave
*slave
= port
->slave
;
272 /* this if covers only a special case: when the configuration starts
273 * with link down, it sets the speed to 0.
274 * This is done in spite of the fact that the e100 driver reports 0
275 * to be compatible with MVT in the future.
277 if (slave
->link
!= BOND_LINK_UP
)
280 switch (slave
->speed
) {
282 speed
= AD_LINK_SPEED_BITMASK_10MBPS
;
286 speed
= AD_LINK_SPEED_BITMASK_100MBPS
;
290 speed
= AD_LINK_SPEED_BITMASK_1000MBPS
;
294 speed
= AD_LINK_SPEED_BITMASK_10000MBPS
;
298 /* unknown speed value from ethtool. shouldn't happen */
304 pr_debug("Port %d Received link speed %d update from adapter\n",
305 port
->actor_port_number
, speed
);
310 * __get_duplex - get a port's duplex
311 * @port: the port we're looking at
313 * Return @port's duplex in 802.3ad bitmask format. i.e.:
314 * 0x01 if in full duplex
317 static u8
__get_duplex(struct port
*port
)
319 struct slave
*slave
= port
->slave
;
323 /* handling a special case: when the configuration starts with
324 * link down, it sets the duplex to 0.
326 if (slave
->link
!= BOND_LINK_UP
)
329 switch (slave
->duplex
) {
332 pr_debug("Port %d Received status full duplex update from adapter\n",
333 port
->actor_port_number
);
338 pr_debug("Port %d Received status NOT full duplex update from adapter\n",
339 port
->actor_port_number
);
347 * __initialize_port_locks - initialize a port's STATE machine spinlock
348 * @port: the slave of the port we're looking at
350 static inline void __initialize_port_locks(struct slave
*slave
)
352 /* make sure it isn't called twice */
353 spin_lock_init(&(SLAVE_AD_INFO(slave
).state_machine_lock
));
359 * __ad_timer_to_ticks - convert a given timer type to AD module ticks
360 * @timer_type: which timer to operate
361 * @par: timer parameter. see below
363 * If @timer_type is %current_while_timer, @par indicates long/short timer.
364 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME,
365 * %SLOW_PERIODIC_TIME.
367 static u16
__ad_timer_to_ticks(u16 timer_type
, u16 par
)
369 u16 retval
= 0; /* to silence the compiler */
371 switch (timer_type
) {
372 case AD_CURRENT_WHILE_TIMER
: /* for rx machine usage */
374 retval
= (AD_SHORT_TIMEOUT_TIME
*ad_ticks_per_sec
);
376 retval
= (AD_LONG_TIMEOUT_TIME
*ad_ticks_per_sec
);
378 case AD_ACTOR_CHURN_TIMER
: /* for local churn machine */
379 retval
= (AD_CHURN_DETECTION_TIME
*ad_ticks_per_sec
);
381 case AD_PERIODIC_TIMER
: /* for periodic machine */
382 retval
= (par
*ad_ticks_per_sec
); /* long timeout */
384 case AD_PARTNER_CHURN_TIMER
: /* for remote churn machine */
385 retval
= (AD_CHURN_DETECTION_TIME
*ad_ticks_per_sec
);
387 case AD_WAIT_WHILE_TIMER
: /* for selection machine */
388 retval
= (AD_AGGREGATE_WAIT_TIME
*ad_ticks_per_sec
);
396 /* ================= ad_rx_machine helper functions ================== */
399 * __choose_matched - update a port's matched variable from a received lacpdu
400 * @lacpdu: the lacpdu we've received
401 * @port: the port we're looking at
403 * Update the value of the matched variable, using parameter values from a
404 * newly received lacpdu. Parameter values for the partner carried in the
405 * received PDU are compared with the corresponding operational parameter
406 * values for the actor. Matched is set to TRUE if all of these parameters
407 * match and the PDU parameter partner_state.aggregation has the same value as
408 * actor_oper_port_state.aggregation and lacp will actively maintain the link
409 * in the aggregation. Matched is also set to TRUE if the value of
410 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates
411 * an individual link and lacp will actively maintain the link. Otherwise,
412 * matched is set to FALSE. LACP is considered to be actively maintaining the
413 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both
414 * the actor's actor_oper_port_state.lacp_activity and the PDU's
415 * partner_state.lacp_activity variables are TRUE.
417 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is
418 * used here to implement the language from 802.3ad 43.4.9 that requires
419 * recordPDU to "match" the LACPDU parameters to the stored values.
421 static void __choose_matched(struct lacpdu
*lacpdu
, struct port
*port
)
423 /* check if all parameters are alike
424 * or this is individual link(aggregation == FALSE)
425 * then update the state machine Matched variable.
427 if (((ntohs(lacpdu
->partner_port
) == port
->actor_port_number
) &&
428 (ntohs(lacpdu
->partner_port_priority
) == port
->actor_port_priority
) &&
429 MAC_ADDRESS_EQUAL(&(lacpdu
->partner_system
), &(port
->actor_system
)) &&
430 (ntohs(lacpdu
->partner_system_priority
) == port
->actor_system_priority
) &&
431 (ntohs(lacpdu
->partner_key
) == port
->actor_oper_port_key
) &&
432 ((lacpdu
->partner_state
& AD_STATE_AGGREGATION
) == (port
->actor_oper_port_state
& AD_STATE_AGGREGATION
))) ||
433 ((lacpdu
->actor_state
& AD_STATE_AGGREGATION
) == 0)
435 port
->sm_vars
|= AD_PORT_MATCHED
;
437 port
->sm_vars
&= ~AD_PORT_MATCHED
;
442 * __record_pdu - record parameters from a received lacpdu
443 * @lacpdu: the lacpdu we've received
444 * @port: the port we're looking at
446 * Record the parameter values for the Actor carried in a received lacpdu as
447 * the current partner operational parameter values and sets
448 * actor_oper_port_state.defaulted to FALSE.
450 static void __record_pdu(struct lacpdu
*lacpdu
, struct port
*port
)
452 if (lacpdu
&& port
) {
453 struct port_params
*partner
= &port
->partner_oper
;
455 __choose_matched(lacpdu
, port
);
456 /* record the new parameter values for the partner
459 partner
->port_number
= ntohs(lacpdu
->actor_port
);
460 partner
->port_priority
= ntohs(lacpdu
->actor_port_priority
);
461 partner
->system
= lacpdu
->actor_system
;
462 partner
->system_priority
= ntohs(lacpdu
->actor_system_priority
);
463 partner
->key
= ntohs(lacpdu
->actor_key
);
464 partner
->port_state
= lacpdu
->actor_state
;
466 /* set actor_oper_port_state.defaulted to FALSE */
467 port
->actor_oper_port_state
&= ~AD_STATE_DEFAULTED
;
469 /* set the partner sync. to on if the partner is sync,
470 * and the port is matched
472 if ((port
->sm_vars
& AD_PORT_MATCHED
)
473 && (lacpdu
->actor_state
& AD_STATE_SYNCHRONIZATION
))
474 partner
->port_state
|= AD_STATE_SYNCHRONIZATION
;
476 partner
->port_state
&= ~AD_STATE_SYNCHRONIZATION
;
481 * __record_default - record default parameters
482 * @port: the port we're looking at
484 * This function records the default parameter values for the partner carried
485 * in the Partner Admin parameters as the current partner operational parameter
486 * values and sets actor_oper_port_state.defaulted to TRUE.
488 static void __record_default(struct port
*port
)
491 /* record the partner admin parameters */
492 memcpy(&port
->partner_oper
, &port
->partner_admin
,
493 sizeof(struct port_params
));
495 /* set actor_oper_port_state.defaulted to true */
496 port
->actor_oper_port_state
|= AD_STATE_DEFAULTED
;
501 * __update_selected - update a port's Selected variable from a received lacpdu
502 * @lacpdu: the lacpdu we've received
503 * @port: the port we're looking at
505 * Update the value of the selected variable, using parameter values from a
506 * newly received lacpdu. The parameter values for the Actor carried in the
507 * received PDU are compared with the corresponding operational parameter
508 * values for the ports partner. If one or more of the comparisons shows that
509 * the value(s) received in the PDU differ from the current operational values,
510 * then selected is set to FALSE and actor_oper_port_state.synchronization is
511 * set to out_of_sync. Otherwise, selected remains unchanged.
513 static void __update_selected(struct lacpdu
*lacpdu
, struct port
*port
)
515 if (lacpdu
&& port
) {
516 const struct port_params
*partner
= &port
->partner_oper
;
518 /* check if any parameter is different then
519 * update the state machine selected variable.
521 if (ntohs(lacpdu
->actor_port
) != partner
->port_number
||
522 ntohs(lacpdu
->actor_port_priority
) != partner
->port_priority
||
523 !MAC_ADDRESS_EQUAL(&lacpdu
->actor_system
, &partner
->system
) ||
524 ntohs(lacpdu
->actor_system_priority
) != partner
->system_priority
||
525 ntohs(lacpdu
->actor_key
) != partner
->key
||
526 (lacpdu
->actor_state
& AD_STATE_AGGREGATION
) != (partner
->port_state
& AD_STATE_AGGREGATION
)) {
527 port
->sm_vars
&= ~AD_PORT_SELECTED
;
533 * __update_default_selected - update a port's Selected variable from Partner
534 * @port: the port we're looking at
536 * This function updates the value of the selected variable, using the partner
537 * administrative parameter values. The administrative values are compared with
538 * the corresponding operational parameter values for the partner. If one or
539 * more of the comparisons shows that the administrative value(s) differ from
540 * the current operational values, then Selected is set to FALSE and
541 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise,
542 * Selected remains unchanged.
544 static void __update_default_selected(struct port
*port
)
547 const struct port_params
*admin
= &port
->partner_admin
;
548 const struct port_params
*oper
= &port
->partner_oper
;
550 /* check if any parameter is different then
551 * update the state machine selected variable.
553 if (admin
->port_number
!= oper
->port_number
||
554 admin
->port_priority
!= oper
->port_priority
||
555 !MAC_ADDRESS_EQUAL(&admin
->system
, &oper
->system
) ||
556 admin
->system_priority
!= oper
->system_priority
||
557 admin
->key
!= oper
->key
||
558 (admin
->port_state
& AD_STATE_AGGREGATION
)
559 != (oper
->port_state
& AD_STATE_AGGREGATION
)) {
560 port
->sm_vars
&= ~AD_PORT_SELECTED
;
566 * __update_ntt - update a port's ntt variable from a received lacpdu
567 * @lacpdu: the lacpdu we've received
568 * @port: the port we're looking at
570 * Updates the value of the ntt variable, using parameter values from a newly
571 * received lacpdu. The parameter values for the partner carried in the
572 * received PDU are compared with the corresponding operational parameter
573 * values for the Actor. If one or more of the comparisons shows that the
574 * value(s) received in the PDU differ from the current operational values,
575 * then ntt is set to TRUE. Otherwise, ntt remains unchanged.
577 static void __update_ntt(struct lacpdu
*lacpdu
, struct port
*port
)
579 /* validate lacpdu and port */
580 if (lacpdu
&& port
) {
581 /* check if any parameter is different then
582 * update the port->ntt.
584 if ((ntohs(lacpdu
->partner_port
) != port
->actor_port_number
) ||
585 (ntohs(lacpdu
->partner_port_priority
) != port
->actor_port_priority
) ||
586 !MAC_ADDRESS_EQUAL(&(lacpdu
->partner_system
), &(port
->actor_system
)) ||
587 (ntohs(lacpdu
->partner_system_priority
) != port
->actor_system_priority
) ||
588 (ntohs(lacpdu
->partner_key
) != port
->actor_oper_port_key
) ||
589 ((lacpdu
->partner_state
& AD_STATE_LACP_ACTIVITY
) != (port
->actor_oper_port_state
& AD_STATE_LACP_ACTIVITY
)) ||
590 ((lacpdu
->partner_state
& AD_STATE_LACP_TIMEOUT
) != (port
->actor_oper_port_state
& AD_STATE_LACP_TIMEOUT
)) ||
591 ((lacpdu
->partner_state
& AD_STATE_SYNCHRONIZATION
) != (port
->actor_oper_port_state
& AD_STATE_SYNCHRONIZATION
)) ||
592 ((lacpdu
->partner_state
& AD_STATE_AGGREGATION
) != (port
->actor_oper_port_state
& AD_STATE_AGGREGATION
))
600 * __agg_ports_are_ready - check if all ports in an aggregator are ready
601 * @aggregator: the aggregator we're looking at
604 static int __agg_ports_are_ready(struct aggregator
*aggregator
)
610 /* scan all ports in this aggregator to verify if they are
613 for (port
= aggregator
->lag_ports
;
615 port
= port
->next_port_in_aggregator
) {
616 if (!(port
->sm_vars
& AD_PORT_READY_N
)) {
627 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator
628 * @aggregator: the aggregator we're looking at
629 * @val: Should the ports' ready bit be set on or off
632 static void __set_agg_ports_ready(struct aggregator
*aggregator
, int val
)
636 for (port
= aggregator
->lag_ports
; port
;
637 port
= port
->next_port_in_aggregator
) {
639 port
->sm_vars
|= AD_PORT_READY
;
641 port
->sm_vars
&= ~AD_PORT_READY
;
646 * __get_agg_bandwidth - get the total bandwidth of an aggregator
647 * @aggregator: the aggregator we're looking at
650 static u32
__get_agg_bandwidth(struct aggregator
*aggregator
)
654 if (aggregator
->num_of_ports
) {
655 switch (__get_link_speed(aggregator
->lag_ports
)) {
656 case AD_LINK_SPEED_BITMASK_1MBPS
:
657 bandwidth
= aggregator
->num_of_ports
;
659 case AD_LINK_SPEED_BITMASK_10MBPS
:
660 bandwidth
= aggregator
->num_of_ports
* 10;
662 case AD_LINK_SPEED_BITMASK_100MBPS
:
663 bandwidth
= aggregator
->num_of_ports
* 100;
665 case AD_LINK_SPEED_BITMASK_1000MBPS
:
666 bandwidth
= aggregator
->num_of_ports
* 1000;
668 case AD_LINK_SPEED_BITMASK_10000MBPS
:
669 bandwidth
= aggregator
->num_of_ports
* 10000;
672 bandwidth
= 0; /* to silence the compiler */
679 * __get_active_agg - get the current active aggregator
680 * @aggregator: the aggregator we're looking at
682 * Caller must hold RCU lock.
684 static struct aggregator
*__get_active_agg(struct aggregator
*aggregator
)
686 struct bonding
*bond
= aggregator
->slave
->bond
;
687 struct list_head
*iter
;
690 bond_for_each_slave_rcu(bond
, slave
, iter
)
691 if (SLAVE_AD_INFO(slave
).aggregator
.is_active
)
692 return &(SLAVE_AD_INFO(slave
).aggregator
);
698 * __update_lacpdu_from_port - update a port's lacpdu fields
699 * @port: the port we're looking at
701 static inline void __update_lacpdu_from_port(struct port
*port
)
703 struct lacpdu
*lacpdu
= &port
->lacpdu
;
704 const struct port_params
*partner
= &port
->partner_oper
;
706 /* update current actual Actor parameters
707 * lacpdu->subtype initialized
708 * lacpdu->version_number initialized
709 * lacpdu->tlv_type_actor_info initialized
710 * lacpdu->actor_information_length initialized
713 lacpdu
->actor_system_priority
= htons(port
->actor_system_priority
);
714 lacpdu
->actor_system
= port
->actor_system
;
715 lacpdu
->actor_key
= htons(port
->actor_oper_port_key
);
716 lacpdu
->actor_port_priority
= htons(port
->actor_port_priority
);
717 lacpdu
->actor_port
= htons(port
->actor_port_number
);
718 lacpdu
->actor_state
= port
->actor_oper_port_state
;
720 /* lacpdu->reserved_3_1 initialized
721 * lacpdu->tlv_type_partner_info initialized
722 * lacpdu->partner_information_length initialized
725 lacpdu
->partner_system_priority
= htons(partner
->system_priority
);
726 lacpdu
->partner_system
= partner
->system
;
727 lacpdu
->partner_key
= htons(partner
->key
);
728 lacpdu
->partner_port_priority
= htons(partner
->port_priority
);
729 lacpdu
->partner_port
= htons(partner
->port_number
);
730 lacpdu
->partner_state
= partner
->port_state
;
732 /* lacpdu->reserved_3_2 initialized
733 * lacpdu->tlv_type_collector_info initialized
734 * lacpdu->collector_information_length initialized
735 * collector_max_delay initialized
736 * reserved_12[12] initialized
737 * tlv_type_terminator initialized
738 * terminator_length initialized
739 * reserved_50[50] initialized
743 /* ================= main 802.3ad protocol code ========================= */
746 * ad_lacpdu_send - send out a lacpdu packet on a given port
747 * @port: the port we're looking at
749 * Returns: 0 on success
752 static int ad_lacpdu_send(struct port
*port
)
754 struct slave
*slave
= port
->slave
;
756 struct lacpdu_header
*lacpdu_header
;
757 int length
= sizeof(struct lacpdu_header
);
759 skb
= dev_alloc_skb(length
);
763 skb
->dev
= slave
->dev
;
764 skb_reset_mac_header(skb
);
765 skb
->network_header
= skb
->mac_header
+ ETH_HLEN
;
766 skb
->protocol
= PKT_TYPE_LACPDU
;
767 skb
->priority
= TC_PRIO_CONTROL
;
769 lacpdu_header
= (struct lacpdu_header
*)skb_put(skb
, length
);
771 memcpy(lacpdu_header
->hdr
.h_dest
, lacpdu_mcast_addr
, ETH_ALEN
);
772 /* Note: source address is set to be the member's PERMANENT address,
773 * because we use it to identify loopback lacpdus in receive.
775 memcpy(lacpdu_header
->hdr
.h_source
, slave
->perm_hwaddr
, ETH_ALEN
);
776 lacpdu_header
->hdr
.h_proto
= PKT_TYPE_LACPDU
;
778 lacpdu_header
->lacpdu
= port
->lacpdu
;
786 * ad_marker_send - send marker information/response on a given port
787 * @port: the port we're looking at
788 * @marker: marker data to send
790 * Returns: 0 on success
793 static int ad_marker_send(struct port
*port
, struct bond_marker
*marker
)
795 struct slave
*slave
= port
->slave
;
797 struct bond_marker_header
*marker_header
;
798 int length
= sizeof(struct bond_marker_header
);
800 skb
= dev_alloc_skb(length
+ 16);
804 skb_reserve(skb
, 16);
806 skb
->dev
= slave
->dev
;
807 skb_reset_mac_header(skb
);
808 skb
->network_header
= skb
->mac_header
+ ETH_HLEN
;
809 skb
->protocol
= PKT_TYPE_LACPDU
;
811 marker_header
= (struct bond_marker_header
*)skb_put(skb
, length
);
813 memcpy(marker_header
->hdr
.h_dest
, lacpdu_mcast_addr
, ETH_ALEN
);
814 /* Note: source address is set to be the member's PERMANENT address,
815 * because we use it to identify loopback MARKERs in receive.
817 memcpy(marker_header
->hdr
.h_source
, slave
->perm_hwaddr
, ETH_ALEN
);
818 marker_header
->hdr
.h_proto
= PKT_TYPE_LACPDU
;
820 marker_header
->marker
= *marker
;
828 * ad_mux_machine - handle a port's mux state machine
829 * @port: the port we're looking at
831 static void ad_mux_machine(struct port
*port
)
833 mux_states_t last_state
;
835 /* keep current State Machine state to compare later if it was
838 last_state
= port
->sm_mux_state
;
840 if (port
->sm_vars
& AD_PORT_BEGIN
) {
841 port
->sm_mux_state
= AD_MUX_DETACHED
;
843 switch (port
->sm_mux_state
) {
844 case AD_MUX_DETACHED
:
845 if ((port
->sm_vars
& AD_PORT_SELECTED
)
846 || (port
->sm_vars
& AD_PORT_STANDBY
))
847 /* if SELECTED or STANDBY */
848 port
->sm_mux_state
= AD_MUX_WAITING
;
851 /* if SELECTED == FALSE return to DETACH state */
852 if (!(port
->sm_vars
& AD_PORT_SELECTED
)) {
853 port
->sm_vars
&= ~AD_PORT_READY_N
;
854 /* in order to withhold the Selection Logic to
855 * check all ports READY_N value every callback
856 * cycle to update ready variable, we check
857 * READY_N and update READY here
859 __set_agg_ports_ready(port
->aggregator
, __agg_ports_are_ready(port
->aggregator
));
860 port
->sm_mux_state
= AD_MUX_DETACHED
;
864 /* check if the wait_while_timer expired */
865 if (port
->sm_mux_timer_counter
866 && !(--port
->sm_mux_timer_counter
))
867 port
->sm_vars
|= AD_PORT_READY_N
;
869 /* in order to withhold the selection logic to check
870 * all ports READY_N value every callback cycle to
871 * update ready variable, we check READY_N and update
874 __set_agg_ports_ready(port
->aggregator
, __agg_ports_are_ready(port
->aggregator
));
876 /* if the wait_while_timer expired, and the port is
877 * in READY state, move to ATTACHED state
879 if ((port
->sm_vars
& AD_PORT_READY
)
880 && !port
->sm_mux_timer_counter
)
881 port
->sm_mux_state
= AD_MUX_ATTACHED
;
883 case AD_MUX_ATTACHED
:
884 /* check also if agg_select_timer expired (so the
885 * enable port will take place only after this timer)
887 if ((port
->sm_vars
& AD_PORT_SELECTED
) &&
888 (port
->partner_oper
.port_state
& AD_STATE_SYNCHRONIZATION
) &&
889 !__check_agg_selection_timer(port
)) {
890 port
->sm_mux_state
= AD_MUX_COLLECTING_DISTRIBUTING
;
891 } else if (!(port
->sm_vars
& AD_PORT_SELECTED
) ||
892 (port
->sm_vars
& AD_PORT_STANDBY
)) {
893 /* if UNSELECTED or STANDBY */
894 port
->sm_vars
&= ~AD_PORT_READY_N
;
895 /* in order to withhold the selection logic to
896 * check all ports READY_N value every callback
897 * cycle to update ready variable, we check
898 * READY_N and update READY here
900 __set_agg_ports_ready(port
->aggregator
, __agg_ports_are_ready(port
->aggregator
));
901 port
->sm_mux_state
= AD_MUX_DETACHED
;
904 case AD_MUX_COLLECTING_DISTRIBUTING
:
905 if (!(port
->sm_vars
& AD_PORT_SELECTED
) ||
906 (port
->sm_vars
& AD_PORT_STANDBY
) ||
907 !(port
->partner_oper
.port_state
& AD_STATE_SYNCHRONIZATION
)) {
908 port
->sm_mux_state
= AD_MUX_ATTACHED
;
910 /* if port state hasn't changed make
911 * sure that a collecting distributing
912 * port in an active aggregator is enabled
914 if (port
->aggregator
&&
915 port
->aggregator
->is_active
&&
916 !__port_is_enabled(port
)) {
927 /* check if the state machine was changed */
928 if (port
->sm_mux_state
!= last_state
) {
929 pr_debug("Mux Machine: Port=%d, Last State=%d, Curr State=%d\n",
930 port
->actor_port_number
, last_state
,
932 switch (port
->sm_mux_state
) {
933 case AD_MUX_DETACHED
:
934 port
->actor_oper_port_state
&= ~AD_STATE_SYNCHRONIZATION
;
935 ad_disable_collecting_distributing(port
);
936 port
->actor_oper_port_state
&= ~AD_STATE_COLLECTING
;
937 port
->actor_oper_port_state
&= ~AD_STATE_DISTRIBUTING
;
941 port
->sm_mux_timer_counter
= __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER
, 0);
943 case AD_MUX_ATTACHED
:
944 port
->actor_oper_port_state
|= AD_STATE_SYNCHRONIZATION
;
945 port
->actor_oper_port_state
&= ~AD_STATE_COLLECTING
;
946 port
->actor_oper_port_state
&= ~AD_STATE_DISTRIBUTING
;
947 ad_disable_collecting_distributing(port
);
950 case AD_MUX_COLLECTING_DISTRIBUTING
:
951 port
->actor_oper_port_state
|= AD_STATE_COLLECTING
;
952 port
->actor_oper_port_state
|= AD_STATE_DISTRIBUTING
;
953 ad_enable_collecting_distributing(port
);
963 * ad_rx_machine - handle a port's rx State Machine
964 * @lacpdu: the lacpdu we've received
965 * @port: the port we're looking at
967 * If lacpdu arrived, stop previous timer (if exists) and set the next state as
968 * CURRENT. If timer expired set the state machine in the proper state.
969 * In other cases, this function checks if we need to switch to other state.
/*
 * ad_rx_machine - run one step of the receive state machine for a port.
 * @lacpdu: LACPDU received on the port, or NULL when no frame arrived
 *          (bond_3ad_state_machine_handler() calls this with NULL)
 * @port: the port whose sm_rx_state is evaluated and updated
 *
 * Phase 1 chooses the next sm_rx_state: AD_PORT_BEGIN selects
 * AD_RX_INITIALIZE; a port that is not enabled and not AD_PORT_MOVED selects
 * AD_RX_PORT_DISABLED; an arriving @lacpdu in EXPIRED/DEFAULTED/CURRENT
 * zeroes sm_rx_timer_counter and selects AD_RX_CURRENT; otherwise the timer
 * counter is decremented and timer-expiry / per-state transitions apply.
 *
 * Phase 2 runs when the state changed or @lacpdu is non-NULL and performs
 * the per-state actions on sm_vars, partner_oper.port_state,
 * actor_oper_port_state and sm_rx_timer_counter.  When @lacpdu's
 * actor_system equals the port's own actor_system a loopback error is
 * logged with pr_err().
 *
 * NOTE(review): the embedded line numbers skip values (e.g. 971 -> 973,
 * 994 -> 996, 999 -> 1001), so braces, else/break statements and some case
 * labels are not visible in this listing - confirm against the full file.
 */
971 static void ad_rx_machine(struct lacpdu
*lacpdu
, struct port
*port
)
973 rx_states_t last_state
;
975 /* keep current State Machine state to compare later if it was
978 last_state
= port
->sm_rx_state
;
980 /* check if state machine should change state */
982 /* first, check if port was reinitialized */
983 if (port
->sm_vars
& AD_PORT_BEGIN
)
984 port
->sm_rx_state
= AD_RX_INITIALIZE
;
985 /* check if port is not enabled */
986 else if (!(port
->sm_vars
& AD_PORT_BEGIN
)
987 && !port
->is_enabled
&& !(port
->sm_vars
& AD_PORT_MOVED
))
988 port
->sm_rx_state
= AD_RX_PORT_DISABLED
;
989 /* check if new lacpdu arrived */
990 else if (lacpdu
&& ((port
->sm_rx_state
== AD_RX_EXPIRED
) ||
991 (port
->sm_rx_state
== AD_RX_DEFAULTED
) ||
992 (port
->sm_rx_state
== AD_RX_CURRENT
))) {
993 port
->sm_rx_timer_counter
= 0;
994 port
->sm_rx_state
= AD_RX_CURRENT
;
996 /* if timer is on, and if it is expired */
997 if (port
->sm_rx_timer_counter
&&
998 !(--port
->sm_rx_timer_counter
)) {
999 switch (port
->sm_rx_state
) {
1001 port
->sm_rx_state
= AD_RX_DEFAULTED
;
1004 port
->sm_rx_state
= AD_RX_EXPIRED
;
1010 /* if no lacpdu arrived and no timer is on */
1011 switch (port
->sm_rx_state
) {
1012 case AD_RX_PORT_DISABLED
:
1013 if (port
->sm_vars
& AD_PORT_MOVED
)
1014 port
->sm_rx_state
= AD_RX_INITIALIZE
;
1015 else if (port
->is_enabled
1017 & AD_PORT_LACP_ENABLED
))
1018 port
->sm_rx_state
= AD_RX_EXPIRED
;
1019 else if (port
->is_enabled
1021 & AD_PORT_LACP_ENABLED
) == 0))
1022 port
->sm_rx_state
= AD_RX_LACP_DISABLED
;
1031 /* check if the State machine was changed or new lacpdu arrived */
1032 if ((port
->sm_rx_state
!= last_state
) || (lacpdu
)) {
1033 pr_debug("Rx Machine: Port=%d, Last State=%d, Curr State=%d\n",
1034 port
->actor_port_number
, last_state
,
1036 switch (port
->sm_rx_state
) {
1037 case AD_RX_INITIALIZE
:
1038 if (!(port
->actor_oper_port_key
& AD_DUPLEX_KEY_BITS
))
1039 port
->sm_vars
&= ~AD_PORT_LACP_ENABLED
;
1041 port
->sm_vars
|= AD_PORT_LACP_ENABLED
;
1042 port
->sm_vars
&= ~AD_PORT_SELECTED
;
1043 __record_default(port
);
1044 port
->actor_oper_port_state
&= ~AD_STATE_EXPIRED
;
1045 port
->sm_vars
&= ~AD_PORT_MOVED
;
1046 port
->sm_rx_state
= AD_RX_PORT_DISABLED
;
1049 case AD_RX_PORT_DISABLED
:
1050 port
->sm_vars
&= ~AD_PORT_MATCHED
;
1052 case AD_RX_LACP_DISABLED
:
1053 port
->sm_vars
&= ~AD_PORT_SELECTED
;
1054 __record_default(port
);
1055 port
->partner_oper
.port_state
&= ~AD_STATE_AGGREGATION
;
1056 port
->sm_vars
|= AD_PORT_MATCHED
;
1057 port
->actor_oper_port_state
&= ~AD_STATE_EXPIRED
;
/*
 * NOTE(review): the statements numbered 1066-1070 below set
 * AD_STATE_EXPIRED and restart the rx timer with AD_SHORT_TIMEOUT, so they
 * look like the EXPIRED-state actions (the case label is not visible).
 * The 802.3ad receive machine also sets the partner's LACP_Timeout to
 * Short Timeout in EXPIRED; only AD_STATE_LACP_ACTIVITY is set on the
 * partner state here - confirm whether that is intended.
 */
1060 /* Reset of the Synchronization flag (Standard 43.4.12)
1061 * This reset cause to disable this port in the
1062 * COLLECTING_DISTRIBUTING state of the mux machine in
1063 * case of EXPIRED even if LINK_DOWN didn't arrive for
1066 port
->partner_oper
.port_state
&= ~AD_STATE_SYNCHRONIZATION
;
1067 port
->sm_vars
&= ~AD_PORT_MATCHED
;
1068 port
->partner_oper
.port_state
|= AD_STATE_LACP_ACTIVITY
;
1069 port
->sm_rx_timer_counter
= __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER
, (u16
)(AD_SHORT_TIMEOUT
));
1070 port
->actor_oper_port_state
|= AD_STATE_EXPIRED
;
1072 case AD_RX_DEFAULTED
:
1073 __update_default_selected(port
);
1074 __record_default(port
);
1075 port
->sm_vars
|= AD_PORT_MATCHED
;
1076 port
->actor_oper_port_state
&= ~AD_STATE_EXPIRED
;
1079 /* detect loopback situation */
1080 if (MAC_ADDRESS_EQUAL(&(lacpdu
->actor_system
),
1081 &(port
->actor_system
))) {
1082 pr_err("%s: An illegal loopback occurred on adapter (%s).\nCheck the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n",
1083 port
->slave
->bond
->dev
->name
,
1084 port
->slave
->dev
->name
);
1087 __update_selected(lacpdu
, port
);
1088 __update_ntt(lacpdu
, port
);
1089 __record_pdu(lacpdu
, port
);
1090 port
->sm_rx_timer_counter
= __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER
, (u16
)(port
->actor_oper_port_state
& AD_STATE_LACP_TIMEOUT
));
1091 port
->actor_oper_port_state
&= ~AD_STATE_EXPIRED
;
1100 * ad_tx_machine - handle a port's tx state machine
1101 * @port: the port we're looking at
/*
 * ad_tx_machine - transmit state machine step for @port.
 *
 * Decrements sm_tx_timer_counter while it is non-zero.  When it reaches
 * zero and both port->ntt and AD_PORT_LACP_ENABLED (in sm_vars) are set,
 * the LACPDU is refreshed with __update_lacpdu_from_port() and sent with
 * ad_lacpdu_send(); a non-negative return is logged via pr_debug().  The
 * counter is reloaded with ad_ticks_per_sec / AD_MAX_TX_IN_SECOND.
 *
 * NOTE(review): the comment numbered 1117 talks about marking ntt false,
 * but no such statement is visible (the embedded numbers skip 1119-1122) -
 * confirm against the full file.
 */
1103 static void ad_tx_machine(struct port
*port
)
1105 /* check if tx timer expired, to verify that we do not send more than
1106 * 3 packets per second
1108 if (port
->sm_tx_timer_counter
&& !(--port
->sm_tx_timer_counter
)) {
1109 /* check if there is something to send */
1110 if (port
->ntt
&& (port
->sm_vars
& AD_PORT_LACP_ENABLED
)) {
1111 __update_lacpdu_from_port(port
);
1113 if (ad_lacpdu_send(port
) >= 0) {
1114 pr_debug("Sent LACPDU on port %d\n",
1115 port
->actor_port_number
);
1117 /* mark ntt as false, so it will not be sent
1118 * again until demanded
1123 /* restart tx timer(to verify that we will not exceed
1124 * AD_MAX_TX_IN_SECOND
1126 port
->sm_tx_timer_counter
= ad_ticks_per_sec
/AD_MAX_TX_IN_SECOND
;
1131 * ad_periodic_machine - handle a port's periodic state machine
1132 * @port: the port we're looking at
1134 * Turn ntt flag on periodically to perform periodic transmission of lacpdu's.
/*
 * ad_periodic_machine - periodic-transmission state machine step for @port.
 *
 * Remembers the current sm_periodic_state, then:
 *  - selects AD_NO_PERIODIC when AD_PORT_BEGIN is set, AD_PORT_LACP_ENABLED
 *    is clear, the port is not enabled, or neither the actor nor the partner
 *    has AD_STATE_LACP_ACTIVITY set;
 *  - otherwise, while sm_periodic_timer_counter is non-zero, decrements it
 *    and selects AD_PERIODIC_TX on expiry, or switches between
 *    AD_FAST_PERIODIC and AD_SLOW_PERIODIC according to the partner's
 *    AD_STATE_LACP_TIMEOUT bit;
 *  - otherwise moves on from AD_NO_PERIODIC / AD_PERIODIC_TX.
 * When the state differs from the remembered one, the timer counter is
 * reloaded: 0 for AD_NO_PERIODIC, and __ad_timer_to_ticks(AD_PERIODIC_TIMER,
 * ...) - 1 for the fast and slow periods.
 *
 * NOTE(review): the embedded line numbers skip, so else/break statements,
 * braces and the AD_PERIODIC_TX action are not visible here - confirm.
 */
1136 static void ad_periodic_machine(struct port
*port
)
1138 periodic_states_t last_state
;
1140 /* keep current state machine state to compare later if it was changed */
1141 last_state
= port
->sm_periodic_state
;
1143 /* check if port was reinitialized */
1144 if (((port
->sm_vars
& AD_PORT_BEGIN
) || !(port
->sm_vars
& AD_PORT_LACP_ENABLED
) || !port
->is_enabled
) ||
1145 (!(port
->actor_oper_port_state
& AD_STATE_LACP_ACTIVITY
) && !(port
->partner_oper
.port_state
& AD_STATE_LACP_ACTIVITY
))
1147 port
->sm_periodic_state
= AD_NO_PERIODIC
;
1149 /* check if state machine should change state */
1150 else if (port
->sm_periodic_timer_counter
) {
1151 /* check if periodic state machine expired */
1152 if (!(--port
->sm_periodic_timer_counter
)) {
1153 /* if expired then do tx */
1154 port
->sm_periodic_state
= AD_PERIODIC_TX
;
1156 /* If not expired, check if there is some new timeout
1157 * parameter from the partner state
1159 switch (port
->sm_periodic_state
) {
1160 case AD_FAST_PERIODIC
:
1161 if (!(port
->partner_oper
.port_state
1162 & AD_STATE_LACP_TIMEOUT
))
1163 port
->sm_periodic_state
= AD_SLOW_PERIODIC
;
1165 case AD_SLOW_PERIODIC
:
1166 if ((port
->partner_oper
.port_state
& AD_STATE_LACP_TIMEOUT
)) {
1167 port
->sm_periodic_timer_counter
= 0;
1168 port
->sm_periodic_state
= AD_PERIODIC_TX
;
1176 switch (port
->sm_periodic_state
) {
1177 case AD_NO_PERIODIC
:
1178 port
->sm_periodic_state
= AD_FAST_PERIODIC
;
1180 case AD_PERIODIC_TX
:
1181 if (!(port
->partner_oper
.port_state
&
1182 AD_STATE_LACP_TIMEOUT
))
1183 port
->sm_periodic_state
= AD_SLOW_PERIODIC
;
1185 port
->sm_periodic_state
= AD_FAST_PERIODIC
;
1192 /* check if the state machine was changed */
1193 if (port
->sm_periodic_state
!= last_state
) {
1194 pr_debug("Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n",
1195 port
->actor_port_number
, last_state
,
1196 port
->sm_periodic_state
);
1197 switch (port
->sm_periodic_state
) {
1198 case AD_NO_PERIODIC
:
1199 port
->sm_periodic_timer_counter
= 0;
1201 case AD_FAST_PERIODIC
:
1202 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1203 port
->sm_periodic_timer_counter
= __ad_timer_to_ticks(AD_PERIODIC_TIMER
, (u16
)(AD_FAST_PERIODIC_TIME
))-1;
1205 case AD_SLOW_PERIODIC
:
1206 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1207 port
->sm_periodic_timer_counter
= __ad_timer_to_ticks(AD_PERIODIC_TIMER
, (u16
)(AD_SLOW_PERIODIC_TIME
))-1;
1209 case AD_PERIODIC_TX
:
1219 * ad_port_selection_logic - select aggregation groups
1220 * @port: the port we're looking at
1222 * Select aggregation groups, and assign each port to its aggregator. The
1223 * selection logic is called in the initialization (after all the handshakes),
1224 * and after every lacpdu receive (if selected is off).
/*
 * ad_port_selection_logic - attach @port to a suitable aggregator.
 *
 * Steps visible in this listing:
 *  1. Nothing is done for a port that already has AD_PORT_SELECTED set.
 *  2. If the port has an aggregator, the port is unlinked from that
 *     aggregator's lag_ports list (num_of_ports is decremented, the port's
 *     aggregator / next_port_in_aggregator /
 *     actor_port_aggregator_identifier are cleared) and the aggregator is
 *     reset with ad_clear_agg() once its list is empty.  A pr_warn() is
 *     issued when the port was not found on the list.
 *  3. Every slave's aggregator is examined: the first one without
 *     lag_ports is remembered as free_aggregator; one whose actor key,
 *     partner system, partner system priority and partner key match the
 *     port's gets the port pushed on the head of its lag_ports list and
 *     the port is marked AD_PORT_SELECTED.
 *  4. If none matched, free_aggregator (when available) is populated from
 *     the port's keys and partner data, is_individual is derived from
 *     AD_DUPLEX_KEY_BITS, and the port is marked AD_PORT_SELECTED;
 *     otherwise pr_err() reports that no aggregator was found.
 *  5. __set_agg_ports_ready() is called with the result of
 *     __agg_ports_are_ready(), then ad_agg_selection_logic() runs on
 *     __get_first_agg(port).
 *
 * NOTE(review): the embedded line numbers skip, so return/else/break
 * statements, braces and parts of the match condition (e.g. 1308,
 * 1311-1312) are not visible - confirm against the full file.
 */
1226 static void ad_port_selection_logic(struct port
*port
)
1228 struct aggregator
*aggregator
, *free_aggregator
= NULL
, *temp_aggregator
;
1229 struct port
*last_port
= NULL
, *curr_port
;
1230 struct list_head
*iter
;
1231 struct bonding
*bond
;
1232 struct slave
*slave
;
1235 /* if the port is already Selected, do nothing */
1236 if (port
->sm_vars
& AD_PORT_SELECTED
)
1239 bond
= __get_bond_by_port(port
);
1241 /* if the port is connected to other aggregator, detach it */
1242 if (port
->aggregator
) {
1243 /* detach the port from its former aggregator */
1244 temp_aggregator
= port
->aggregator
;
1245 for (curr_port
= temp_aggregator
->lag_ports
; curr_port
;
1246 last_port
= curr_port
,
1247 curr_port
= curr_port
->next_port_in_aggregator
) {
1248 if (curr_port
== port
) {
1249 temp_aggregator
->num_of_ports
--;
1250 /* if it is the first port attached to the
1254 temp_aggregator
->lag_ports
=
1255 port
->next_port_in_aggregator
;
1257 /* not the first port attached to the
1260 last_port
->next_port_in_aggregator
=
1261 port
->next_port_in_aggregator
;
1264 /* clear the port's relations to this
1267 port
->aggregator
= NULL
;
1268 port
->next_port_in_aggregator
= NULL
;
1269 port
->actor_port_aggregator_identifier
= 0;
1271 pr_debug("Port %d left LAG %d\n",
1272 port
->actor_port_number
,
1273 temp_aggregator
->aggregator_identifier
);
1274 /* if the aggregator is empty, clear its
1275 * parameters, and set it ready to be attached
1277 if (!temp_aggregator
->lag_ports
)
1278 ad_clear_agg(temp_aggregator
);
1283 /* meaning: the port was related to an aggregator
1284 * but was not on the aggregator port list
1286 pr_warn("%s: Warning: Port %d (on %s) was related to aggregator %d but was not on its port list\n",
1287 port
->slave
->bond
->dev
->name
,
1288 port
->actor_port_number
,
1289 port
->slave
->dev
->name
,
1290 port
->aggregator
->aggregator_identifier
);
1293 /* search on all aggregators for a suitable aggregator for this port */
1294 bond_for_each_slave(bond
, slave
, iter
) {
1295 aggregator
= &(SLAVE_AD_INFO(slave
).aggregator
);
1297 /* keep a free aggregator for later use(if needed) */
1298 if (!aggregator
->lag_ports
) {
1299 if (!free_aggregator
)
1300 free_aggregator
= aggregator
;
1303 /* check if current aggregator suits us */
1304 if (((aggregator
->actor_oper_aggregator_key
== port
->actor_oper_port_key
) && /* if all parameters match AND */
1305 MAC_ADDRESS_EQUAL(&(aggregator
->partner_system
), &(port
->partner_oper
.system
)) &&
1306 (aggregator
->partner_system_priority
== port
->partner_oper
.system_priority
) &&
1307 (aggregator
->partner_oper_aggregator_key
== port
->partner_oper
.key
)
1309 ((!MAC_ADDRESS_EQUAL(&(port
->partner_oper
.system
), &(null_mac_addr
)) && /* partner answers */
1310 !aggregator
->is_individual
) /* but is not individual OR */
1313 /* attach to the founded aggregator */
1314 port
->aggregator
= aggregator
;
1315 port
->actor_port_aggregator_identifier
=
1316 port
->aggregator
->aggregator_identifier
;
1317 port
->next_port_in_aggregator
= aggregator
->lag_ports
;
1318 port
->aggregator
->num_of_ports
++;
1319 aggregator
->lag_ports
= port
;
1320 pr_debug("Port %d joined LAG %d(existing LAG)\n",
1321 port
->actor_port_number
,
1322 port
->aggregator
->aggregator_identifier
);
1324 /* mark this port as selected */
1325 port
->sm_vars
|= AD_PORT_SELECTED
;
1331 /* the port couldn't find an aggregator - attach it to a new
1335 if (free_aggregator
) {
1336 /* assign port a new aggregator */
1337 port
->aggregator
= free_aggregator
;
1338 port
->actor_port_aggregator_identifier
=
1339 port
->aggregator
->aggregator_identifier
;
1341 /* update the new aggregator's parameters
1342 * if port was responsed from the end-user
1344 if (port
->actor_oper_port_key
& AD_DUPLEX_KEY_BITS
)
1345 /* if port is full duplex */
1346 port
->aggregator
->is_individual
= false;
1348 port
->aggregator
->is_individual
= true;
1350 port
->aggregator
->actor_admin_aggregator_key
= port
->actor_admin_port_key
;
1351 port
->aggregator
->actor_oper_aggregator_key
= port
->actor_oper_port_key
;
1352 port
->aggregator
->partner_system
=
1353 port
->partner_oper
.system
;
1354 port
->aggregator
->partner_system_priority
=
1355 port
->partner_oper
.system_priority
;
1356 port
->aggregator
->partner_oper_aggregator_key
= port
->partner_oper
.key
;
1357 port
->aggregator
->receive_state
= 1;
1358 port
->aggregator
->transmit_state
= 1;
1359 port
->aggregator
->lag_ports
= port
;
1360 port
->aggregator
->num_of_ports
++;
1362 /* mark this port as selected */
1363 port
->sm_vars
|= AD_PORT_SELECTED
;
1365 pr_debug("Port %d joined LAG %d(new LAG)\n",
1366 port
->actor_port_number
,
1367 port
->aggregator
->aggregator_identifier
);
1369 pr_err("%s: Port %d (on %s) did not find a suitable aggregator\n",
1370 port
->slave
->bond
->dev
->name
,
1371 port
->actor_port_number
, port
->slave
->dev
->name
);
1374 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE
1375 * in all aggregator's ports, else set ready=FALSE in all
1376 * aggregator's ports
1378 __set_agg_ports_ready(port
->aggregator
,
1379 __agg_ports_are_ready(port
->aggregator
));
1381 aggregator
= __get_first_agg(port
);
1382 ad_agg_selection_logic(aggregator
);
1385 /* Decide if "agg" is a better choice for the new active aggregator than
1386 * the current best, according to the ad_select policy.
/*
 * ad_agg_selection_test - compare a candidate aggregator with the best so far.
 * @best: best aggregator found so far (rule 0 below covers "no best")
 * @curr: candidate aggregator
 *
 * Returns a struct aggregator pointer.  The comparisons visible here are,
 * in order: is_individual of both, __agg_has_partner() of both, and then
 * the policy from __get_agg_selection_mode(curr->lag_ports): num_of_ports
 * for the count policy, and __get_agg_bandwidth() for BOND_AD_STABLE and
 * BOND_AD_BANDWIDTH.  An unknown mode is reported with pr_warn().
 *
 * NOTE(review): the return statements, the check for a missing @best and
 * the BOND_AD_COUNT case label are not visible (line numbers skip) -
 * confirm which of @best/@curr each branch returns.
 */
1388 static struct aggregator
*ad_agg_selection_test(struct aggregator
*best
,
1389 struct aggregator
*curr
)
1391 /* 0. If no best, select current.
1393 * 1. If the current agg is not individual, and the best is
1394 * individual, select current.
1396 * 2. If current agg is individual and the best is not, keep best.
1398 * 3. Therefore, current and best are both individual or both not
1401 * 3a. If current agg partner replied, and best agg partner did not,
1404 * 3b. If current agg partner did not reply and best agg partner
1405 * did reply, keep best.
1407 * 4. Therefore, current and best both have partner replies or
1408 * both do not, so perform selection policy:
1410 * BOND_AD_COUNT: Select by count of ports. If count is equal,
1411 * select by bandwidth.
1413 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth.
1418 if (!curr
->is_individual
&& best
->is_individual
)
1421 if (curr
->is_individual
&& !best
->is_individual
)
1424 if (__agg_has_partner(curr
) && !__agg_has_partner(best
))
1427 if (!__agg_has_partner(curr
) && __agg_has_partner(best
))
1430 switch (__get_agg_selection_mode(curr
->lag_ports
)) {
1432 if (curr
->num_of_ports
> best
->num_of_ports
)
1435 if (curr
->num_of_ports
< best
->num_of_ports
)
1439 case BOND_AD_STABLE
:
1440 case BOND_AD_BANDWIDTH
:
1441 if (__get_agg_bandwidth(curr
) > __get_agg_bandwidth(best
))
1447 pr_warn("%s: Impossible agg select mode %d\n",
1448 curr
->slave
->bond
->dev
->name
,
1449 __get_agg_selection_mode(curr
->lag_ports
));
/*
 * agg_device_up - report whether the aggregator's first port is usable.
 * @agg: aggregator to test
 *
 * Takes the head of agg->lag_ports and returns non-zero only when that
 * port's slave device passes both netif_running() and netif_carrier_ok().
 *
 * NOTE(review): lines 1459-1462 are not visible between the declaration
 * and the return; whether an empty lag_ports list is handled there cannot
 * be told from this listing - confirm.
 */
1456 static int agg_device_up(const struct aggregator
*agg
)
1458 struct port
*port
= agg
->lag_ports
;
1463 return netif_running(port
->slave
->dev
) &&
1464 netif_carrier_ok(port
->slave
->dev
);
1468 * ad_agg_selection_logic - select an aggregation group for a team
1469 * @agg: the aggregator we're looking at
1471 * It is assumed that only one aggregator may be selected for a team.
1473 * The logic of this function is to select the aggregator according to
1474 * the ad_select policy:
1476 * BOND_AD_STABLE: select the aggregator with the most ports attached to
1477 * it, and to reselect the active aggregator only if the previous
1478 * aggregator has no more ports related to it.
1480 * BOND_AD_BANDWIDTH: select the aggregator with the highest total
1481 * bandwidth, and reselect whenever a link state change takes place or the
1482 * set of slaves in the bond changes.
1484 * BOND_AD_COUNT: select the aggregator with largest number of ports
1485 * (slaves), and reselect whenever a link state change takes place or the
1486 * set of slaves in the bond changes.
1488 * FIXME: this function MUST be called with the first agg in the bond, or
1489 * __get_active_agg() won't work correctly. This function should be better
1490 * called with the bond itself, and retrieve the first agg from it.
/*
 * ad_agg_selection_logic - choose the active aggregator of a bond.
 * @agg: an aggregator of the bond (the FIXME in the header comment asks
 *       for the first one); it is reused as the loop cursor below
 *
 * Steps visible in this listing:
 *  1. active = __get_active_agg(agg); it seeds "best" only when
 *     agg_device_up(active) is true.
 *  2. Every slave's aggregator that has ports and whose device is up is
 *     compared against best with ad_agg_selection_test().
 *  3. Under BOND_AD_STABLE the current active aggregator is kept
 *     (is_active = 1) when it still has an enabled first port and either
 *     has a partner or neither it nor best has one, subject to the
 *     actor_oper_aggregator_key test numbered 1526-1527.
 *  4. If best equals active, active stays marked is_active.
 *  5. Otherwise best is logged, a warning is printed when best is
 *     individual, best->is_active is set, and the former active
 *     aggregator's ports are disabled with __disable_port().
 *  6. The active aggregator is looked up again via
 *     __get_active_agg(origin); when it has no partner, each of its ports
 *     is enabled with __enable_port().
 *  7. bond_3ad_set_carrier(bond) is called.
 *
 * NOTE(review): the declaration of "port", the assignment of "origin",
 * NULL checks on best/active, and else/brace lines are not visible (line
 * numbers skip) - confirm against the full file.
 */
1492 static void ad_agg_selection_logic(struct aggregator
*agg
)
1494 struct aggregator
*best
, *active
, *origin
;
1495 struct bonding
*bond
= agg
->slave
->bond
;
1496 struct list_head
*iter
;
1497 struct slave
*slave
;
1502 active
= __get_active_agg(agg
);
1503 best
= (active
&& agg_device_up(active
)) ? active
: NULL
;
1505 bond_for_each_slave_rcu(bond
, slave
, iter
) {
1506 agg
= &(SLAVE_AD_INFO(slave
).aggregator
);
1510 if (agg
->num_of_ports
&& agg_device_up(agg
))
1511 best
= ad_agg_selection_test(best
, agg
);
1515 __get_agg_selection_mode(best
->lag_ports
) == BOND_AD_STABLE
) {
1516 /* For the STABLE policy, don't replace the old active
1517 * aggregator if it's still active (it has an answering
1518 * partner) or if both the best and active don't have an
1519 * answering partner.
1521 if (active
&& active
->lag_ports
&&
1522 active
->lag_ports
->is_enabled
&&
1523 (__agg_has_partner(active
) ||
1524 (!__agg_has_partner(active
) &&
1525 !__agg_has_partner(best
)))) {
1526 if (!(!active
->actor_oper_aggregator_key
&&
1527 best
->actor_oper_aggregator_key
)) {
1529 active
->is_active
= 1;
1534 if (best
&& (best
== active
)) {
1536 active
->is_active
= 1;
1539 /* if there is new best aggregator, activate it */
1541 pr_debug("best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1542 best
->aggregator_identifier
, best
->num_of_ports
,
1543 best
->actor_oper_aggregator_key
,
1544 best
->partner_oper_aggregator_key
,
1545 best
->is_individual
, best
->is_active
);
1546 pr_debug("best ports %p slave %p %s\n",
1547 best
->lag_ports
, best
->slave
,
1548 best
->slave
? best
->slave
->dev
->name
: "NULL");
1550 bond_for_each_slave_rcu(bond
, slave
, iter
) {
1551 agg
= &(SLAVE_AD_INFO(slave
).aggregator
);
1553 pr_debug("Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1554 agg
->aggregator_identifier
, agg
->num_of_ports
,
1555 agg
->actor_oper_aggregator_key
,
1556 agg
->partner_oper_aggregator_key
,
1557 agg
->is_individual
, agg
->is_active
);
1560 /* check if any partner replys */
1561 if (best
->is_individual
) {
1562 pr_warn("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n",
1564 best
->slave
->bond
->dev
->name
: "NULL");
1567 best
->is_active
= 1;
1568 pr_debug("LAG %d chosen as the active LAG\n",
1569 best
->aggregator_identifier
);
1570 pr_debug("Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1571 best
->aggregator_identifier
, best
->num_of_ports
,
1572 best
->actor_oper_aggregator_key
,
1573 best
->partner_oper_aggregator_key
,
1574 best
->is_individual
, best
->is_active
);
1576 /* disable the ports that were related to the former
1580 for (port
= active
->lag_ports
; port
;
1581 port
= port
->next_port_in_aggregator
) {
1582 __disable_port(port
);
1587 /* if the selected aggregator is of join individuals
1588 * (partner_system is NULL), enable their ports
1590 active
= __get_active_agg(origin
);
1593 if (!__agg_has_partner(active
)) {
1594 for (port
= active
->lag_ports
; port
;
1595 port
= port
->next_port_in_aggregator
) {
1596 __enable_port(port
);
1603 bond_3ad_set_carrier(bond
);
1607 * ad_clear_agg - clear a given aggregator's parameters
1608 * @aggregator: the aggregator we're looking at
/*
 * ad_clear_agg - reset an aggregator so it can be attached to again.
 * @aggregator: aggregator to reset
 *
 * Clears is_individual, both actor keys, the partner system (set to
 * null_mac_addr), partner priority and key, receive/transmit state, the
 * lag_ports list head, is_active and num_of_ports, then logs the
 * aggregator_identifier, which is left untouched.
 *
 * NOTE(review): lines 1611-1612 are not visible; whether a NULL
 * @aggregator is tolerated cannot be told from this listing - confirm.
 */
1610 static void ad_clear_agg(struct aggregator
*aggregator
)
1613 aggregator
->is_individual
= false;
1614 aggregator
->actor_admin_aggregator_key
= 0;
1615 aggregator
->actor_oper_aggregator_key
= 0;
1616 aggregator
->partner_system
= null_mac_addr
;
1617 aggregator
->partner_system_priority
= 0;
1618 aggregator
->partner_oper_aggregator_key
= 0;
1619 aggregator
->receive_state
= 0;
1620 aggregator
->transmit_state
= 0;
1621 aggregator
->lag_ports
= NULL
;
1622 aggregator
->is_active
= 0;
1623 aggregator
->num_of_ports
= 0;
1624 pr_debug("LAG %d was cleared\n",
1625 aggregator
->aggregator_identifier
);
1630 * ad_initialize_agg - initialize a given aggregator's parameters
1631 * @aggregator: the aggregator we're looking at
/*
 * ad_initialize_agg - bring an aggregator to its initial state.
 * @aggregator: aggregator to initialize
 *
 * Runs ad_clear_agg() and additionally resets the fields that
 * ad_clear_agg() leaves alone: aggregator_mac_address (null_mac_addr),
 * aggregator_identifier (0) and the owning slave pointer (NULL).
 *
 * NOTE(review): lines 1634-1635 are not visible (possibly a NULL guard) -
 * confirm.
 */
1633 static void ad_initialize_agg(struct aggregator
*aggregator
)
1636 ad_clear_agg(aggregator
);
1638 aggregator
->aggregator_mac_address
= null_mac_addr
;
1639 aggregator
->aggregator_identifier
= 0;
1640 aggregator
->slave
= NULL
;
1645 * ad_initialize_port - initialize a given port's parameters
1646 * @port: the port we're looking at
1647 * @lacp_fast: boolean. whether fast periodic should be used
/*
 * ad_initialize_port - set a port's parameters to their defaults.
 * @port: port to initialize
 * @lacp_fast: fast-periodic selector (see NOTE below)
 *
 * Two static const templates are used: "tmpl" (partner parameters with
 * system_priority 0xffff and port_priority 0xff) is copied into both
 * partner_admin and partner_oper, and "lacpdu" (fixed TLV types/lengths,
 * version 1, collector_max_delay from AD_COLLECTOR_MAX_DELAY) is copied
 * into port->lacpdu.  Actor fields get default numbers, priorities and
 * keys; admin and oper port state start as
 * AD_STATE_AGGREGATION | AD_STATE_LACP_ACTIVITY.  All state machine states
 * and timer counters are zeroed, the aggregator links are cleared and
 * is_enabled is set to true.
 *
 * NOTE(review): AD_STATE_LACP_TIMEOUT is OR-ed into actor_oper_port_state
 * at 1685; the condition guarding it (presumably on @lacp_fast) is not
 * visible - confirm.  sm_vars is set to the literal 0x3; presumably this
 * is AD_PORT_BEGIN | AD_PORT_LACP_ENABLED - verify against the flag
 * definitions.
 */
1649 static void ad_initialize_port(struct port
*port
, int lacp_fast
)
1651 static const struct port_params tmpl
= {
1652 .system_priority
= 0xffff,
1655 .port_priority
= 0xff,
1658 static const struct lacpdu lacpdu
= {
1660 .version_number
= 0x01,
1661 .tlv_type_actor_info
= 0x01,
1662 .actor_information_length
= 0x14,
1663 .tlv_type_partner_info
= 0x02,
1664 .partner_information_length
= 0x14,
1665 .tlv_type_collector_info
= 0x03,
1666 .collector_information_length
= 0x10,
1667 .collector_max_delay
= htons(AD_COLLECTOR_MAX_DELAY
),
1671 port
->actor_port_number
= 1;
1672 port
->actor_port_priority
= 0xff;
1673 port
->actor_system
= null_mac_addr
;
1674 port
->actor_system_priority
= 0xffff;
1675 port
->actor_port_aggregator_identifier
= 0;
1677 port
->actor_admin_port_key
= 1;
1678 port
->actor_oper_port_key
= 1;
1679 port
->actor_admin_port_state
= AD_STATE_AGGREGATION
|
1680 AD_STATE_LACP_ACTIVITY
;
1681 port
->actor_oper_port_state
= AD_STATE_AGGREGATION
|
1682 AD_STATE_LACP_ACTIVITY
;
1685 port
->actor_oper_port_state
|= AD_STATE_LACP_TIMEOUT
;
1687 memcpy(&port
->partner_admin
, &tmpl
, sizeof(tmpl
));
1688 memcpy(&port
->partner_oper
, &tmpl
, sizeof(tmpl
));
1690 port
->is_enabled
= true;
1691 /* private parameters */
1692 port
->sm_vars
= 0x3;
1693 port
->sm_rx_state
= 0;
1694 port
->sm_rx_timer_counter
= 0;
1695 port
->sm_periodic_state
= 0;
1696 port
->sm_periodic_timer_counter
= 0;
1697 port
->sm_mux_state
= 0;
1698 port
->sm_mux_timer_counter
= 0;
1699 port
->sm_tx_state
= 0;
1700 port
->sm_tx_timer_counter
= 0;
1702 port
->aggregator
= NULL
;
1703 port
->next_port_in_aggregator
= NULL
;
1704 port
->transaction_id
= 0;
1706 memcpy(&port
->lacpdu
, &lacpdu
, sizeof(lacpdu
));
1711 * ad_enable_collecting_distributing - enable a port's transmit/receive
1712 * @port: the port we're looking at
1714 * Enable @port if it's in an active aggregator
/*
 * ad_enable_collecting_distributing - enable @port for traffic.
 *
 * The port is enabled with __enable_port() only when its aggregator is
 * marked is_active; the port number and aggregator identifier are logged
 * first.  port->aggregator is dereferenced without a NULL test here.
 */
1716 static void ad_enable_collecting_distributing(struct port
*port
)
1718 if (port
->aggregator
->is_active
) {
1719 pr_debug("Enabling port %d(LAG %d)\n",
1720 port
->actor_port_number
,
1721 port
->aggregator
->aggregator_identifier
);
1722 __enable_port(port
);
1727 * ad_disable_collecting_distributing - disable a port's transmit/receive
1728 * @port: the port we're looking at
/*
 * ad_disable_collecting_distributing - disable @port for traffic.
 *
 * The port is disabled with __disable_port() only when it has an
 * aggregator whose partner_system differs from null_mac_addr, i.e. ports
 * of an aggregator without a recorded partner are left as they are.
 */
1730 static void ad_disable_collecting_distributing(struct port
*port
)
1732 if (port
->aggregator
&&
1733 !MAC_ADDRESS_EQUAL(&(port
->aggregator
->partner_system
),
1734 &(null_mac_addr
))) {
1735 pr_debug("Disabling port %d(LAG %d)\n",
1736 port
->actor_port_number
,
1737 port
->aggregator
->aggregator_identifier
);
1738 __disable_port(port
);
1743 * ad_marker_info_received - handle receive of a Marker information frame
1744 * @marker_info: Marker info received
1745 * @port: the port we're looking at
/*
 * ad_marker_info_received - answer a received Marker information frame.
 * @marker_info: the received marker PDU
 *
 * Copies @marker_info into a local struct bond_marker, rewrites its
 * tlv_type to AD_MARKER_RESPONSE_SUBTYPE and transmits the copy with
 * ad_marker_send(); a non-negative return is logged via pr_debug().  The
 * received PDU itself is not modified.
 *
 * NOTE(review): the body uses "port", but the line that would declare it
 * as the second parameter (1748) is not visible - confirm.
 */
1747 static void ad_marker_info_received(struct bond_marker
*marker_info
,
1750 struct bond_marker marker
;
1752 /* copy the received marker data to the response marker */
1753 memcpy(&marker
, marker_info
, sizeof(struct bond_marker
));
1754 /* change the marker subtype to marker response */
1755 marker
.tlv_type
= AD_MARKER_RESPONSE_SUBTYPE
;
1757 /* send the marker response */
1758 if (ad_marker_send(port
, &marker
) >= 0) {
1759 pr_debug("Sent Marker Response on port %d\n",
1760 port
->actor_port_number
);
1765 * ad_marker_response_received - handle receive of a marker response frame
1766 * @marker: marker PDU received
1767 * @port: the port we're looking at
1769 * This function does nothing since we decided not to implement send and handle
1770 * response for marker PDU's, in this stage, but only to respond to marker
/*
 * ad_marker_response_received - placeholder for Marker response handling.
 * @marker: the received marker response PDU
 *
 * No statements are visible in the body; the only content is the comment
 * saying the feature is intentionally not implemented.
 *
 * NOTE(review): the remainder of the parameter list (line 1774) is not
 * visible in this listing - confirm.
 */
1773 static void ad_marker_response_received(struct bond_marker
*marker
,
1778 /* DO NOTHING, SINCE WE DECIDED NOT TO IMPLEMENT THIS FEATURE FOR NOW */
1781 /* ========= AD exported functions to the main bonding code ========= */
/*
 * bond_3ad_initialize() uses this constant as a factor of the timeout it
 * hands to bond_3ad_initiate_agg_selection().
 */
1783 /* Check aggregators status in team every T seconds */
1784 #define AD_AGGREGATOR_SELECTION_TIMER 8
1787 * bond_3ad_initiate_agg_selection - initiate aggregator selection
1788 * @bond: bonding struct
1790 * Set the aggregation selection timer, to initiate an agg selection in
1791 * the very near future. Called during first initialization, and during
1792 * any down to up transitions of the bond.
/*
 * Stores @timeout in the bond's agg_select_timer.
 * bond_3ad_state_machine_handler() decrements that counter on each run and
 * performs the aggregator selection when it reaches zero, so @timeout is
 * counted in handler invocations.
 */
1794 void bond_3ad_initiate_agg_selection(struct bonding
*bond
, int timeout
)
1796 BOND_AD_INFO(bond
).agg_select_timer
= timeout
;
/*
 * File-scope counter for aggregator ids: bond_3ad_initialize() resets it
 * to 0 and bond_3ad_bind_slave() pre-increments it for each new aggregator.
 */
1799 static u16 aggregator_identifier
;
1802 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures
1803 * @bond: bonding struct to work on
1804 * @tick_resolution: tick duration (millisecond resolution)
1806 * Can be called only after the mac address of the bond is set.
/*
 * bond_3ad_initialize - set up the bond-wide 802.3ad state.
 * @bond: bond to initialize
 * @tick_resolution: value stored in ad_ticks_per_sec
 *
 * Work is done only when the bond's recorded sys_mac_addr differs from
 * bond->dev->dev_addr (the "not initialized yet" test).  In that case the
 * aggregator_identifier counter is reset, sys_priority is set to 0xFFFF,
 * sys_mac_addr is copied from the device address, ad_ticks_per_sec is set
 * from @tick_resolution and an aggregator selection is scheduled through
 * bond_3ad_initiate_agg_selection().
 *
 * NOTE(review): the second factor of the timeout expression (line 1826)
 * is not visible in this listing - confirm.
 */
1808 void bond_3ad_initialize(struct bonding
*bond
, u16 tick_resolution
)
1810 /* check that the bond is not initialized yet */
1811 if (!MAC_ADDRESS_EQUAL(&(BOND_AD_INFO(bond
).system
.sys_mac_addr
),
1812 bond
->dev
->dev_addr
)) {
1814 aggregator_identifier
= 0;
1816 BOND_AD_INFO(bond
).system
.sys_priority
= 0xFFFF;
1817 BOND_AD_INFO(bond
).system
.sys_mac_addr
= *((struct mac_addr
*)bond
->dev
->dev_addr
);
1819 /* initialize how many times this module is called in one
1820 * second (should be about every 100ms)
1822 ad_ticks_per_sec
= tick_resolution
;
1824 bond_3ad_initiate_agg_selection(bond
,
1825 AD_AGGREGATOR_SELECTION_TIMER
*
1831 * bond_3ad_bind_slave - initialize a slave's port
1832 * @slave: slave struct to work on
1834 * Returns: nothing (bond_3ad_bind_slave() is declared void)
/*
 * bond_3ad_bind_slave - initialize the 802.3ad port and aggregator of a slave.
 * @slave: slave being added to the bond
 *
 * Work is done only when the slave's port does not already point back at
 * @slave.  The port is initialized with ad_initialize_port() using the
 * bond's lacp_fast parameter, its locks are initialized, and it is bound to
 * @slave.  The admin key is built from __get_duplex() in the low bit and
 * __get_link_speed() shifted left by one, and copied to the oper key; a
 * port without AD_DUPLEX_KEY_BITS has AD_PORT_LACP_ENABLED cleared.  The
 * actor system is the bond's sys_mac_addr, the tx timer is preloaded, and
 * the port starts disabled.  The slave's aggregator is then initialized,
 * given the bond device address and the next aggregator_identifier, and
 * bound to @slave with no ports.
 *
 * NOTE(review): the declaration of "port" (line 1840) is not visible in
 * this listing - confirm.
 */
1837 void bond_3ad_bind_slave(struct slave
*slave
)
1839 struct bonding
*bond
= bond_get_bond_by_slave(slave
);
1841 struct aggregator
*aggregator
;
1843 /* check that the slave has not been initialized yet. */
1844 if (SLAVE_AD_INFO(slave
).port
.slave
!= slave
) {
1846 /* port initialization */
1847 port
= &(SLAVE_AD_INFO(slave
).port
);
1849 ad_initialize_port(port
, bond
->params
.lacp_fast
);
1851 __initialize_port_locks(slave
);
1852 port
->slave
= slave
;
1853 port
->actor_port_number
= SLAVE_AD_INFO(slave
).id
;
1854 /* key is determined according to the link speed, duplex and user key(which
1855 * is yet not supported)
1857 port
->actor_admin_port_key
= 0;
1858 port
->actor_admin_port_key
|= __get_duplex(port
);
1859 port
->actor_admin_port_key
|= (__get_link_speed(port
) << 1);
1860 port
->actor_oper_port_key
= port
->actor_admin_port_key
;
1861 /* if the port is not full duplex, then the port should be not
1864 if (!(port
->actor_oper_port_key
& AD_DUPLEX_KEY_BITS
))
1865 port
->sm_vars
&= ~AD_PORT_LACP_ENABLED
;
1866 /* actor system is the bond's system */
1867 port
->actor_system
= BOND_AD_INFO(bond
).system
.sys_mac_addr
;
1868 /* tx timer(to verify that no more than MAX_TX_IN_SECOND
1869 * lacpdu's are sent in one second)
1871 port
->sm_tx_timer_counter
= ad_ticks_per_sec
/AD_MAX_TX_IN_SECOND
;
1872 port
->aggregator
= NULL
;
1873 port
->next_port_in_aggregator
= NULL
;
1875 __disable_port(port
);
1877 /* aggregator initialization */
1878 aggregator
= &(SLAVE_AD_INFO(slave
).aggregator
);
1880 ad_initialize_agg(aggregator
);
1882 aggregator
->aggregator_mac_address
= *((struct mac_addr
*)bond
->dev
->dev_addr
);
1883 aggregator
->aggregator_identifier
= (++aggregator_identifier
);
1884 aggregator
->slave
= slave
;
1885 aggregator
->is_active
= 0;
1886 aggregator
->num_of_ports
= 0;
1891 * bond_3ad_unbind_slave - deinitialize a slave's port
1892 * @slave: slave struct to work on
1894 * Search for the aggregator that is related to this port, remove the
1895 * aggregator and assign another aggregator for other port related to it
1896 * (if any), and remove the port.
/*
 * bond_3ad_unbind_slave - tear down the 802.3ad state of a departing slave.
 * @slave: slave being removed from the bond
 *
 * Steps visible in this listing:
 *  1. The port clears AD_STATE_AGGREGATION in its oper state and sends one
 *     LACPDU so the partner learns it is no longer aggregatable.
 *  2. If the slave's own aggregator holds ports other than this one, a
 *     replacement aggregator (empty, or holding only this port) is searched
 *     among all slaves; when found, the aggregator's parameters and port
 *     list are moved to it, every listed port is re-pointed at it, the old
 *     aggregator is cleared, and a new active aggregator is selected if an
 *     active one was displaced.  When none is found a warning is printed.
 *  3. If this port is the aggregator's only port, the aggregator is
 *     cleared and, if it was active, ad_agg_selection_logic() is run.
 *  4. Finally the port is located on whichever aggregator's lag_ports list
 *     contains it and unlinked; an aggregator left with zero ports is
 *     cleared, followed by re-selection if it was active.
 *
 * NOTE(review): the uninitialized-port test (line 1911), return/else/break
 * statements, braces and any initialization of prev_port are not visible
 * (line numbers skip) - confirm against the full file.
 */
1898 void bond_3ad_unbind_slave(struct slave
*slave
)
1900 struct port
*port
, *prev_port
, *temp_port
;
1901 struct aggregator
*aggregator
, *new_aggregator
, *temp_aggregator
;
1902 int select_new_active_agg
= 0;
1903 struct bonding
*bond
= slave
->bond
;
1904 struct slave
*slave_iter
;
1905 struct list_head
*iter
;
1907 aggregator
= &(SLAVE_AD_INFO(slave
).aggregator
);
1908 port
= &(SLAVE_AD_INFO(slave
).port
);
1910 /* if slave is null, the whole port is not initialized */
1912 pr_warn("Warning: %s: Trying to unbind an uninitialized port on %s\n",
1913 slave
->bond
->dev
->name
, slave
->dev
->name
);
1917 pr_debug("Unbinding Link Aggregation Group %d\n",
1918 aggregator
->aggregator_identifier
);
1920 /* Tell the partner that this port is not suitable for aggregation */
1921 port
->actor_oper_port_state
&= ~AD_STATE_AGGREGATION
;
1922 __update_lacpdu_from_port(port
);
1923 ad_lacpdu_send(port
);
1925 /* check if this aggregator is occupied */
1926 if (aggregator
->lag_ports
) {
1927 /* check if there are other ports related to this aggregator
1928 * except the port related to this slave(thats ensure us that
1929 * there is a reason to search for new aggregator, and that we
1932 if ((aggregator
->lag_ports
!= port
) ||
1933 (aggregator
->lag_ports
->next_port_in_aggregator
)) {
1934 /* find new aggregator for the related port(s) */
1935 bond_for_each_slave(bond
, slave_iter
, iter
) {
1936 new_aggregator
= &(SLAVE_AD_INFO(slave_iter
).aggregator
);
1937 /* if the new aggregator is empty, or it is
1938 * connected to our port only
1940 if (!new_aggregator
->lag_ports
||
1941 ((new_aggregator
->lag_ports
== port
) &&
1942 !new_aggregator
->lag_ports
->next_port_in_aggregator
))
1946 new_aggregator
= NULL
;
1948 /* if new aggregator found, copy the aggregator's
1949 * parameters and connect the related lag_ports to the
1952 if ((new_aggregator
) && ((!new_aggregator
->lag_ports
) || ((new_aggregator
->lag_ports
== port
) && !new_aggregator
->lag_ports
->next_port_in_aggregator
))) {
1953 pr_debug("Some port(s) related to LAG %d - replaceing with LAG %d\n",
1954 aggregator
->aggregator_identifier
,
1955 new_aggregator
->aggregator_identifier
);
1957 if ((new_aggregator
->lag_ports
== port
) &&
1958 new_aggregator
->is_active
) {
1959 pr_info("%s: Removing an active aggregator\n",
1960 aggregator
->slave
->bond
->dev
->name
);
1961 select_new_active_agg
= 1;
1964 new_aggregator
->is_individual
= aggregator
->is_individual
;
1965 new_aggregator
->actor_admin_aggregator_key
= aggregator
->actor_admin_aggregator_key
;
1966 new_aggregator
->actor_oper_aggregator_key
= aggregator
->actor_oper_aggregator_key
;
1967 new_aggregator
->partner_system
= aggregator
->partner_system
;
1968 new_aggregator
->partner_system_priority
= aggregator
->partner_system_priority
;
1969 new_aggregator
->partner_oper_aggregator_key
= aggregator
->partner_oper_aggregator_key
;
1970 new_aggregator
->receive_state
= aggregator
->receive_state
;
1971 new_aggregator
->transmit_state
= aggregator
->transmit_state
;
1972 new_aggregator
->lag_ports
= aggregator
->lag_ports
;
1973 new_aggregator
->is_active
= aggregator
->is_active
;
1974 new_aggregator
->num_of_ports
= aggregator
->num_of_ports
;
1976 /* update the information that is written on
1977 * the ports about the aggregator
1979 for (temp_port
= aggregator
->lag_ports
; temp_port
;
1980 temp_port
= temp_port
->next_port_in_aggregator
) {
1981 temp_port
->aggregator
= new_aggregator
;
1982 temp_port
->actor_port_aggregator_identifier
= new_aggregator
->aggregator_identifier
;
1985 ad_clear_agg(aggregator
);
1987 if (select_new_active_agg
)
1988 ad_agg_selection_logic(__get_first_agg(port
));
1990 pr_warn("%s: Warning: unbinding aggregator, and could not find a new aggregator for its ports\n",
1991 slave
->bond
->dev
->name
);
1994 /* in case that the only port related to this
1995 * aggregator is the one we want to remove
1997 select_new_active_agg
= aggregator
->is_active
;
1998 ad_clear_agg(aggregator
);
1999 if (select_new_active_agg
) {
2000 pr_info("%s: Removing an active aggregator\n",
2001 slave
->bond
->dev
->name
);
2002 /* select new active aggregator */
2003 temp_aggregator
= __get_first_agg(port
);
2004 if (temp_aggregator
)
2005 ad_agg_selection_logic(temp_aggregator
);
2010 pr_debug("Unbinding port %d\n", port
->actor_port_number
);
2012 /* find the aggregator that this port is connected to */
2013 bond_for_each_slave(bond
, slave_iter
, iter
) {
2014 temp_aggregator
= &(SLAVE_AD_INFO(slave_iter
).aggregator
);
2016 /* search the port in the aggregator's related ports */
2017 for (temp_port
= temp_aggregator
->lag_ports
; temp_port
;
2018 prev_port
= temp_port
,
2019 temp_port
= temp_port
->next_port_in_aggregator
) {
2020 if (temp_port
== port
) {
2021 /* the aggregator found - detach the port from
2025 prev_port
->next_port_in_aggregator
= temp_port
->next_port_in_aggregator
;
2027 temp_aggregator
->lag_ports
= temp_port
->next_port_in_aggregator
;
2028 temp_aggregator
->num_of_ports
--;
2029 if (temp_aggregator
->num_of_ports
== 0) {
2030 select_new_active_agg
= temp_aggregator
->is_active
;
2031 ad_clear_agg(temp_aggregator
);
2032 if (select_new_active_agg
) {
2033 pr_info("%s: Removing an active aggregator\n",
2034 slave
->bond
->dev
->name
);
2035 /* select new active aggregator */
2036 ad_agg_selection_logic(__get_first_agg(port
));
2047 * bond_3ad_state_machine_handler - handle state machines timeout
2048 * @bond: bonding struct to work on
2050 * The state machine handling concept in this module is to check every tick
2051 * which state machine should operate any function. The execution order is
2052 * round robin, so when we have an interaction between state machines, the
2053 * reply of one to each other might be delayed until next tick.
2055 * This function also completes the initialization when the agg_select_timer
2056 * times out, and it selects an aggregator for the ports that are yet not
2057 * related to any aggregator, and selects the active aggregator for a bond.
/*
 * bond_3ad_state_machine_handler - delayed-work entry that runs the
 * 802.3ad state machines of every slave port.
 * @work: work item embedded in struct bonding (recovered via container_of)
 *
 * Under read_lock(&bond->lock):
 *  - the bond's agg_select_timer is decremented while non-zero; when it
 *    reaches zero the first slave's port is used to locate the first
 *    aggregator, ad_agg_selection_logic() runs on it and
 *    bond_3ad_set_carrier() is called;
 *  - for every slave port, with the port's state machine lock held, the
 *    rx (with a NULL lacpdu), periodic, port selection, mux and tx
 *    machines run in that order, after which AD_PORT_BEGIN is cleared.
 * After unlocking, the work is re-queued on bond->wq with a delay of
 * ad_delta_in_ticks.
 *
 * NOTE(review): the declaration of "port", the uninitialized-port tests
 * that precede the two warnings, and the jump taken when the bond has no
 * slaves are not visible (line numbers skip) - confirm.
 */
2059 void bond_3ad_state_machine_handler(struct work_struct
*work
)
2061 struct bonding
*bond
= container_of(work
, struct bonding
,
2063 struct aggregator
*aggregator
;
2064 struct list_head
*iter
;
2065 struct slave
*slave
;
2068 read_lock(&bond
->lock
);
2071 /* check if there are any slaves */
2072 if (!bond_has_slaves(bond
))
2075 /* check if agg_select_timer timer after initialize is timed out */
2076 if (BOND_AD_INFO(bond
).agg_select_timer
&&
2077 !(--BOND_AD_INFO(bond
).agg_select_timer
)) {
2078 slave
= bond_first_slave_rcu(bond
);
2079 port
= slave
? &(SLAVE_AD_INFO(slave
).port
) : NULL
;
2081 /* select the active aggregator for the bond */
2084 pr_warn("%s: Warning: bond's first port is uninitialized\n",
2089 aggregator
= __get_first_agg(port
);
2090 ad_agg_selection_logic(aggregator
);
2092 bond_3ad_set_carrier(bond
);
2095 /* for each port run the state machines */
2096 bond_for_each_slave_rcu(bond
, slave
, iter
) {
2097 port
= &(SLAVE_AD_INFO(slave
).port
);
2099 pr_warn("%s: Warning: Found an uninitialized port\n",
2104 /* Lock around state machines to protect data accessed
2105 * by all (e.g., port->sm_vars). ad_rx_machine may run
2106 * concurrently due to incoming LACPDU.
2108 __get_state_machine_lock(port
);
2110 ad_rx_machine(NULL
, port
);
2111 ad_periodic_machine(port
);
2112 ad_port_selection_logic(port
);
2113 ad_mux_machine(port
);
2114 ad_tx_machine(port
);
2116 /* turn off the BEGIN bit, since we already handled it */
2117 if (port
->sm_vars
& AD_PORT_BEGIN
)
2118 port
->sm_vars
&= ~AD_PORT_BEGIN
;
2120 __release_state_machine_lock(port
);
2125 read_unlock(&bond
->lock
);
2126 queue_delayed_work(bond
->wq
, &bond
->ad_work
, ad_delta_in_ticks
);
2130 * bond_3ad_rx_indication - handle a received frame
2131 * @lacpdu: received lacpdu
2132 * @slave: slave struct to work on
2133 * @length: length of the data received
2135 * It is assumed that frames that were sent on this NIC are not returned as new
2136 * received frames (loopback). Since only the payload is given to this
2137 * function, it cannot check for loopback.
2139 static int bond_3ad_rx_indication(struct lacpdu
*lacpdu
, struct slave
*slave
,
2143 int ret
= RX_HANDLER_ANOTHER
;
2145 if (length
>= sizeof(struct lacpdu
)) {
2147 port
= &(SLAVE_AD_INFO(slave
).port
);
2150 pr_warn("%s: Warning: port of slave %s is uninitialized\n",
2151 slave
->dev
->name
, slave
->bond
->dev
->name
);
2155 switch (lacpdu
->subtype
) {
2156 case AD_TYPE_LACPDU
:
2157 ret
= RX_HANDLER_CONSUMED
;
2158 pr_debug("Received LACPDU on port %d\n",
2159 port
->actor_port_number
);
2160 /* Protect against concurrent state machines */
2161 __get_state_machine_lock(port
);
2162 ad_rx_machine(lacpdu
, port
);
2163 __release_state_machine_lock(port
);
2166 case AD_TYPE_MARKER
:
2167 ret
= RX_HANDLER_CONSUMED
;
2168 /* No need to convert fields to Little Endian since we
2169 * don't use the marker's fields.
2172 switch (((struct bond_marker
*)lacpdu
)->tlv_type
) {
2173 case AD_MARKER_INFORMATION_SUBTYPE
:
2174 pr_debug("Received Marker Information on port %d\n",
2175 port
->actor_port_number
);
2176 ad_marker_info_received((struct bond_marker
*)lacpdu
, port
);
2179 case AD_MARKER_RESPONSE_SUBTYPE
:
2180 pr_debug("Received Marker Response on port %d\n",
2181 port
->actor_port_number
);
2182 ad_marker_response_received((struct bond_marker
*)lacpdu
, port
);
2186 pr_debug("Received an unknown Marker subtype on slot %d\n",
2187 port
->actor_port_number
);
2195 * bond_3ad_adapter_speed_changed - handle a slave's speed change indication
2196 * @slave: slave struct to work on
2198 * Handle reselection of aggregator (if needed) for this port.
2200 void bond_3ad_adapter_speed_changed(struct slave
*slave
)
2204 port
= &(SLAVE_AD_INFO(slave
).port
);
2206 /* if slave is null, the whole port is not initialized */
2208 pr_warn("Warning: %s: speed changed for uninitialized port on %s\n",
2209 slave
->bond
->dev
->name
, slave
->dev
->name
);
2213 __get_state_machine_lock(port
);
2215 port
->actor_admin_port_key
&= ~AD_SPEED_KEY_BITS
;
2216 port
->actor_oper_port_key
= port
->actor_admin_port_key
|=
2217 (__get_link_speed(port
) << 1);
2218 pr_debug("Port %d changed speed\n", port
->actor_port_number
);
2219 /* there is no need to reselect a new aggregator, just signal the
2220 * state machines to reinitialize
2222 port
->sm_vars
|= AD_PORT_BEGIN
;
2224 __release_state_machine_lock(port
);
2228 * bond_3ad_adapter_duplex_changed - handle a slave's duplex change indication
2229 * @slave: slave struct to work on
2231 * Handle reselection of aggregator (if needed) for this port.
2233 void bond_3ad_adapter_duplex_changed(struct slave
*slave
)
2237 port
= &(SLAVE_AD_INFO(slave
).port
);
2239 /* if slave is null, the whole port is not initialized */
2241 pr_warn("%s: Warning: duplex changed for uninitialized port on %s\n",
2242 slave
->bond
->dev
->name
, slave
->dev
->name
);
2246 __get_state_machine_lock(port
);
2248 port
->actor_admin_port_key
&= ~AD_DUPLEX_KEY_BITS
;
2249 port
->actor_oper_port_key
= port
->actor_admin_port_key
|=
2251 pr_debug("Port %d changed duplex\n", port
->actor_port_number
);
2252 /* there is no need to reselect a new aggregator, just signal the
2253 * state machines to reinitialize
2255 port
->sm_vars
|= AD_PORT_BEGIN
;
2257 __release_state_machine_lock(port
);
2261 * bond_3ad_handle_link_change - handle a slave's link status change indication
2262 * @slave: slave struct to work on
2263 * @link: whether the link is now up or down
2265 * Handle reselection of aggregator (if needed) for this port.
2267 void bond_3ad_handle_link_change(struct slave
*slave
, char link
)
2271 port
= &(SLAVE_AD_INFO(slave
).port
);
2273 /* if slave is null, the whole port is not initialized */
2275 pr_warn("Warning: %s: link status changed for uninitialized port on %s\n",
2276 slave
->bond
->dev
->name
, slave
->dev
->name
);
2280 __get_state_machine_lock(port
);
2281 /* on link down we are zeroing duplex and speed since
2282 * some of the adaptors(ce1000.lan) report full duplex/speed
2283 * instead of N/A(duplex) / 0(speed).
2285 * on link up we are forcing recheck on the duplex and speed since
2286 * some of the adaptors(ce1000.lan) report.
2288 if (link
== BOND_LINK_UP
) {
2289 port
->is_enabled
= true;
2290 port
->actor_admin_port_key
&= ~AD_DUPLEX_KEY_BITS
;
2291 port
->actor_oper_port_key
= port
->actor_admin_port_key
|=
2293 port
->actor_admin_port_key
&= ~AD_SPEED_KEY_BITS
;
2294 port
->actor_oper_port_key
= port
->actor_admin_port_key
|=
2295 (__get_link_speed(port
) << 1);
2297 /* link has failed */
2298 port
->is_enabled
= false;
2299 port
->actor_admin_port_key
&= ~AD_DUPLEX_KEY_BITS
;
2300 port
->actor_oper_port_key
= (port
->actor_admin_port_key
&=
2301 ~AD_SPEED_KEY_BITS
);
2303 pr_debug("Port %d changed link status to %s",
2304 port
->actor_port_number
,
2305 (link
== BOND_LINK_UP
) ? "UP" : "DOWN");
2306 /* there is no need to reselect a new aggregator, just signal the
2307 * state machines to reinitialize
2309 port
->sm_vars
|= AD_PORT_BEGIN
;
2311 __release_state_machine_lock(port
);
2315 * bond_3ad_set_carrier - set link state for bonding master
2316 * @bond: bonding structure
2318 * if we have an active aggregator, we're up, if not, we're down.
2319 * Presumes that we cannot have an active aggregator if there are
2320 * no slaves with link up.
2322 * This behavior complies with IEEE 802.3 section 43.3.9.
2324 * Called by bond_set_carrier(). Return zero if carrier state does not
2325 * change, nonzero if it does.
2327 int bond_3ad_set_carrier(struct bonding
*bond
)
2329 struct aggregator
*active
;
2330 struct slave
*first_slave
;
2334 first_slave
= bond_first_slave_rcu(bond
);
2339 active
= __get_active_agg(&(SLAVE_AD_INFO(first_slave
).aggregator
));
2341 /* are enough slaves available to consider link up? */
2342 if (active
->num_of_ports
< bond
->params
.min_links
) {
2343 if (netif_carrier_ok(bond
->dev
)) {
2344 netif_carrier_off(bond
->dev
);
2347 } else if (!netif_carrier_ok(bond
->dev
)) {
2348 netif_carrier_on(bond
->dev
);
2351 } else if (netif_carrier_ok(bond
->dev
)) {
2352 netif_carrier_off(bond
->dev
);
2360 * __bond_3ad_get_active_agg_info - get information of the active aggregator
2361 * @bond: bonding struct to work on
2362 * @ad_info: ad_info struct to fill with the bond's info
2364 * Returns: 0 on success
2367 int __bond_3ad_get_active_agg_info(struct bonding
*bond
,
2368 struct ad_info
*ad_info
)
2370 struct aggregator
*aggregator
= NULL
;
2371 struct list_head
*iter
;
2372 struct slave
*slave
;
2375 bond_for_each_slave_rcu(bond
, slave
, iter
) {
2376 port
= &(SLAVE_AD_INFO(slave
).port
);
2377 if (port
->aggregator
&& port
->aggregator
->is_active
) {
2378 aggregator
= port
->aggregator
;
2384 ad_info
->aggregator_id
= aggregator
->aggregator_identifier
;
2385 ad_info
->ports
= aggregator
->num_of_ports
;
2386 ad_info
->actor_key
= aggregator
->actor_oper_aggregator_key
;
2387 ad_info
->partner_key
= aggregator
->partner_oper_aggregator_key
;
2388 memcpy(ad_info
->partner_system
,
2389 aggregator
->partner_system
.mac_addr_value
, ETH_ALEN
);
2396 /* Wrapper used to hold bond->lock so no slave manipulation can occur */
2397 int bond_3ad_get_active_agg_info(struct bonding
*bond
, struct ad_info
*ad_info
)
2402 ret
= __bond_3ad_get_active_agg_info(bond
, ad_info
);
2408 int bond_3ad_xmit_xor(struct sk_buff
*skb
, struct net_device
*dev
)
2410 struct bonding
*bond
= netdev_priv(dev
);
2411 struct slave
*slave
, *first_ok_slave
;
2412 struct aggregator
*agg
;
2413 struct ad_info ad_info
;
2414 struct list_head
*iter
;
2419 if (__bond_3ad_get_active_agg_info(bond
, &ad_info
)) {
2420 pr_debug("%s: Error: __bond_3ad_get_active_agg_info failed\n",
2425 slaves_in_agg
= ad_info
.ports
;
2426 agg_id
= ad_info
.aggregator_id
;
2428 if (slaves_in_agg
== 0) {
2429 pr_debug("%s: Error: active aggregator is empty\n", dev
->name
);
2433 slave_agg_no
= bond_xmit_hash(bond
, skb
, slaves_in_agg
);
2434 first_ok_slave
= NULL
;
2436 bond_for_each_slave_rcu(bond
, slave
, iter
) {
2437 agg
= SLAVE_AD_INFO(slave
).port
.aggregator
;
2438 if (!agg
|| agg
->aggregator_identifier
!= agg_id
)
2441 if (slave_agg_no
>= 0) {
2442 if (!first_ok_slave
&& SLAVE_IS_OK(slave
))
2443 first_ok_slave
= slave
;
2448 if (SLAVE_IS_OK(slave
)) {
2449 bond_dev_queue_xmit(bond
, skb
, slave
->dev
);
2454 if (slave_agg_no
>= 0) {
2455 pr_err("%s: Error: Couldn't find a slave to tx on for aggregator ID %d\n",
2460 /* we couldn't find any suitable slave after the agg_no, so use the
2461 * first suitable found, if found.
2464 bond_dev_queue_xmit(bond
, skb
, first_ok_slave
->dev
);
2469 return NETDEV_TX_OK
;
2471 /* no suitable interface, frame not sent */
2476 int bond_3ad_lacpdu_recv(const struct sk_buff
*skb
, struct bonding
*bond
,
2477 struct slave
*slave
)
2479 int ret
= RX_HANDLER_ANOTHER
;
2480 struct lacpdu
*lacpdu
, _lacpdu
;
2482 if (skb
->protocol
!= PKT_TYPE_LACPDU
)
2485 lacpdu
= skb_header_pointer(skb
, 0, sizeof(_lacpdu
), &_lacpdu
);
2489 read_lock(&bond
->lock
);
2490 ret
= bond_3ad_rx_indication(lacpdu
, slave
, skb
->len
);
2491 read_unlock(&bond
->lock
);
2496 * bond_3ad_update_lacp_rate - change the lacp rate
2497 * @bond: bonding struct
2499 * When the lacp_rate parameter is modified via sysfs,
2500 * update actor_oper_port_state of each port.
2502 * Hold slave->state_machine_lock,
2503 * so we can modify port->actor_oper_port_state,
2504 * no matter whether the bond is up or down.
2506 void bond_3ad_update_lacp_rate(struct bonding
*bond
)
2508 struct port
*port
= NULL
;
2509 struct list_head
*iter
;
2510 struct slave
*slave
;
2513 lacp_fast
= bond
->params
.lacp_fast
;
2514 bond_for_each_slave(bond
, slave
, iter
) {
2515 port
= &(SLAVE_AD_INFO(slave
).port
);
2516 __get_state_machine_lock(port
);
2518 port
->actor_oper_port_state
|= AD_STATE_LACP_TIMEOUT
;
2520 port
->actor_oper_port_state
&= ~AD_STATE_LACP_TIMEOUT
;
2521 __release_state_machine_lock(port
);