powerpc/mm/4k: don't allocate larger pmd page table for 4k
[linux/fpc-iii.git] / drivers / net / bonding / bond_3ad.c
blobedc70ffad6607ac06d0a40b48316bef554c5f4c2
/*
 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License as published by the Free
 * Software Foundation; either version 2 of the License, or (at your option)
 * any later version.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc., 59
 * Temple Place - Suite 330, Boston, MA 02111-1307, USA.
 *
 * The full GNU General Public License is included in this distribution in the
 * file called LICENSE.
 */
23 #include <linux/skbuff.h>
24 #include <linux/if_ether.h>
25 #include <linux/netdevice.h>
26 #include <linux/spinlock.h>
27 #include <linux/ethtool.h>
28 #include <linux/etherdevice.h>
29 #include <linux/if_bonding.h>
30 #include <linux/pkt_sched.h>
31 #include <net/net_namespace.h>
32 #include <net/bonding.h>
33 #include <net/bond_3ad.h>
/* General definitions */
#define AD_SHORT_TIMEOUT           1
#define AD_LONG_TIMEOUT            0
#define AD_STANDBY                 0x2
#define AD_MAX_TX_IN_SECOND        3
#define AD_COLLECTOR_MAX_DELAY     0

/* Timer definitions (43.4.4 in the 802.3ad standard).
 * These are multiplied by ad_ticks_per_sec in __ad_timer_to_ticks().
 */
#define AD_FAST_PERIODIC_TIME      1
#define AD_SLOW_PERIODIC_TIME      30
#define AD_SHORT_TIMEOUT_TIME      (3*AD_FAST_PERIODIC_TIME)
#define AD_LONG_TIMEOUT_TIME       (3*AD_SLOW_PERIODIC_TIME)
#define AD_CHURN_DETECTION_TIME    60
#define AD_AGGREGATE_WAIT_TIME     2

/* Port state definitions (43.4.2.2 in the 802.3ad standard).
 * One bit each; tested against the actor/partner port_state bytes.
 */
#define AD_STATE_LACP_ACTIVITY   0x1
#define AD_STATE_LACP_TIMEOUT    0x2
#define AD_STATE_AGGREGATION     0x4
#define AD_STATE_SYNCHRONIZATION 0x8
#define AD_STATE_COLLECTING      0x10
#define AD_STATE_DISTRIBUTING    0x20
#define AD_STATE_DEFAULTED       0x40
#define AD_STATE_EXPIRED         0x80

/* Port Variables definitions used by the State Machines (43.4.7 in the
 * 802.3ad standard). One bit each; stored in port->sm_vars.
 */
#define AD_PORT_BEGIN           0x1
#define AD_PORT_LACP_ENABLED    0x2
#define AD_PORT_ACTOR_CHURN     0x4
#define AD_PORT_PARTNER_CHURN   0x8
#define AD_PORT_READY           0x10
#define AD_PORT_READY_N         0x20
#define AD_PORT_MATCHED         0x40
#define AD_PORT_STANDBY         0x80
#define AD_PORT_SELECTED        0x100
#define AD_PORT_MOVED           0x200
#define AD_PORT_CHURNED         (AD_PORT_ACTOR_CHURN | AD_PORT_PARTNER_CHURN)

/* Port Key definitions
 * key is determined according to the link speed, duplex and
 * user key (which is yet not supported)
 *           --------------------------------------------------------------
 * Port key  | User key (10 bits)           | Speed (5 bits)      | Duplex|
 *           --------------------------------------------------------------
 *           |15                           6|5                   1|0
 */
#define  AD_DUPLEX_KEY_MASKS    0x1
#define  AD_SPEED_KEY_MASKS     0x3E
#define  AD_USER_KEY_MASKS      0xFFC0
/* Link speed codes as returned by __get_link_speed(). Values start at 1
 * so that 0 can stand for "link down / unknown speed".
 */
enum ad_link_speed_type {
	AD_LINK_SPEED_1MBPS = 1,
	AD_LINK_SPEED_10MBPS,
	AD_LINK_SPEED_100MBPS,
	AD_LINK_SPEED_1000MBPS,
	AD_LINK_SPEED_2500MBPS,
	AD_LINK_SPEED_10000MBPS,
	AD_LINK_SPEED_20000MBPS,
	AD_LINK_SPEED_40000MBPS,
	AD_LINK_SPEED_56000MBPS,
	AD_LINK_SPEED_100000MBPS,
};
/* compare MAC addresses; A and B are pointers to the address bytes.
 * Arguments are parenthesized so that expression arguments cast correctly.
 */
#define MAC_ADDRESS_EQUAL(A, B)	\
	ether_addr_equal_64bits((const u8 *)(A), (const u8 *)(B))
104 static const u8 null_mac_addr[ETH_ALEN + 2] __long_aligned = {
105 0, 0, 0, 0, 0, 0
107 static u16 ad_ticks_per_sec;
108 static const int ad_delta_in_ticks = (AD_TIMER_INTERVAL * HZ) / 1000;
110 static const u8 lacpdu_mcast_addr[ETH_ALEN + 2] __long_aligned =
111 MULTICAST_LACPDU_ADDR;
113 /* ================= main 802.3ad protocol functions ================== */
114 static int ad_lacpdu_send(struct port *port);
115 static int ad_marker_send(struct port *port, struct bond_marker *marker);
116 static void ad_mux_machine(struct port *port, bool *update_slave_arr);
117 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port);
118 static void ad_tx_machine(struct port *port);
119 static void ad_periodic_machine(struct port *port);
120 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr);
121 static void ad_agg_selection_logic(struct aggregator *aggregator,
122 bool *update_slave_arr);
123 static void ad_clear_agg(struct aggregator *aggregator);
124 static void ad_initialize_agg(struct aggregator *aggregator);
125 static void ad_initialize_port(struct port *port, int lacp_fast);
126 static void ad_enable_collecting_distributing(struct port *port,
127 bool *update_slave_arr);
128 static void ad_disable_collecting_distributing(struct port *port,
129 bool *update_slave_arr);
130 static void ad_marker_info_received(struct bond_marker *marker_info,
131 struct port *port);
132 static void ad_marker_response_received(struct bond_marker *marker,
133 struct port *port);
134 static void ad_update_actor_keys(struct port *port, bool reset);
/* ================= api to bonding and kernel code ================== */
140 * __get_bond_by_port - get the port's bonding struct
141 * @port: the port we're looking at
143 * Return @port's bonding struct, or %NULL if it can't be found.
145 static inline struct bonding *__get_bond_by_port(struct port *port)
147 if (port->slave == NULL)
148 return NULL;
150 return bond_get_bond_by_slave(port->slave);
154 * __get_first_agg - get the first aggregator in the bond
155 * @bond: the bond we're looking at
157 * Return the aggregator of the first slave in @bond, or %NULL if it can't be
158 * found.
159 * The caller must hold RCU or RTNL lock.
161 static inline struct aggregator *__get_first_agg(struct port *port)
163 struct bonding *bond = __get_bond_by_port(port);
164 struct slave *first_slave;
165 struct aggregator *agg;
167 /* If there's no bond for this port, or bond has no slaves */
168 if (bond == NULL)
169 return NULL;
171 rcu_read_lock();
172 first_slave = bond_first_slave_rcu(bond);
173 agg = first_slave ? &(SLAVE_AD_INFO(first_slave)->aggregator) : NULL;
174 rcu_read_unlock();
176 return agg;
180 * __agg_has_partner - see if we have a partner
181 * @agg: the agregator we're looking at
183 * Return nonzero if aggregator has a partner (denoted by a non-zero ether
184 * address for the partner). Return 0 if not.
186 static inline int __agg_has_partner(struct aggregator *agg)
188 return !is_zero_ether_addr(agg->partner_system.mac_addr_value);
192 * __disable_port - disable the port's slave
193 * @port: the port we're looking at
195 static inline void __disable_port(struct port *port)
197 bond_set_slave_inactive_flags(port->slave, BOND_SLAVE_NOTIFY_LATER);
201 * __enable_port - enable the port's slave, if it's up
202 * @port: the port we're looking at
204 static inline void __enable_port(struct port *port)
206 struct slave *slave = port->slave;
208 if ((slave->link == BOND_LINK_UP) && bond_slave_is_up(slave))
209 bond_set_slave_active_flags(slave, BOND_SLAVE_NOTIFY_LATER);
213 * __port_is_enabled - check if the port's slave is in active state
214 * @port: the port we're looking at
216 static inline int __port_is_enabled(struct port *port)
218 return bond_is_active_slave(port->slave);
222 * __get_agg_selection_mode - get the aggregator selection mode
223 * @port: the port we're looking at
225 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT.
227 static inline u32 __get_agg_selection_mode(struct port *port)
229 struct bonding *bond = __get_bond_by_port(port);
231 if (bond == NULL)
232 return BOND_AD_STABLE;
234 return bond->params.ad_select;
238 * __check_agg_selection_timer - check if the selection timer has expired
239 * @port: the port we're looking at
241 static inline int __check_agg_selection_timer(struct port *port)
243 struct bonding *bond = __get_bond_by_port(port);
245 if (bond == NULL)
246 return 0;
248 return BOND_AD_INFO(bond).agg_select_timer ? 1 : 0;
252 * __get_link_speed - get a port's speed
253 * @port: the port we're looking at
255 * Return @port's speed in 802.3ad enum format. i.e. one of:
256 * 0,
257 * %AD_LINK_SPEED_10MBPS,
258 * %AD_LINK_SPEED_100MBPS,
259 * %AD_LINK_SPEED_1000MBPS,
260 * %AD_LINK_SPEED_2500MBPS,
261 * %AD_LINK_SPEED_10000MBPS
262 * %AD_LINK_SPEED_20000MBPS
263 * %AD_LINK_SPEED_40000MBPS
264 * %AD_LINK_SPEED_56000MBPS
265 * %AD_LINK_SPEED_100000MBPS
267 static u16 __get_link_speed(struct port *port)
269 struct slave *slave = port->slave;
270 u16 speed;
272 /* this if covers only a special case: when the configuration starts
273 * with link down, it sets the speed to 0.
274 * This is done in spite of the fact that the e100 driver reports 0
275 * to be compatible with MVT in the future.
277 if (slave->link != BOND_LINK_UP)
278 speed = 0;
279 else {
280 switch (slave->speed) {
281 case SPEED_10:
282 speed = AD_LINK_SPEED_10MBPS;
283 break;
285 case SPEED_100:
286 speed = AD_LINK_SPEED_100MBPS;
287 break;
289 case SPEED_1000:
290 speed = AD_LINK_SPEED_1000MBPS;
291 break;
293 case SPEED_2500:
294 speed = AD_LINK_SPEED_2500MBPS;
295 break;
297 case SPEED_10000:
298 speed = AD_LINK_SPEED_10000MBPS;
299 break;
301 case SPEED_20000:
302 speed = AD_LINK_SPEED_20000MBPS;
303 break;
305 case SPEED_40000:
306 speed = AD_LINK_SPEED_40000MBPS;
307 break;
309 case SPEED_56000:
310 speed = AD_LINK_SPEED_56000MBPS;
311 break;
313 case SPEED_100000:
314 speed = AD_LINK_SPEED_100000MBPS;
315 break;
317 default:
318 /* unknown speed value from ethtool. shouldn't happen */
319 speed = 0;
320 break;
324 netdev_dbg(slave->bond->dev, "Port %d Received link speed %d update from adapter\n",
325 port->actor_port_number, speed);
326 return speed;
330 * __get_duplex - get a port's duplex
331 * @port: the port we're looking at
333 * Return @port's duplex in 802.3ad bitmask format. i.e.:
334 * 0x01 if in full duplex
335 * 0x00 otherwise
337 static u8 __get_duplex(struct port *port)
339 struct slave *slave = port->slave;
340 u8 retval = 0x0;
342 /* handling a special case: when the configuration starts with
343 * link down, it sets the duplex to 0.
345 if (slave->link == BOND_LINK_UP) {
346 switch (slave->duplex) {
347 case DUPLEX_FULL:
348 retval = 0x1;
349 netdev_dbg(slave->bond->dev, "Port %d Received status full duplex update from adapter\n",
350 port->actor_port_number);
351 break;
352 case DUPLEX_HALF:
353 default:
354 retval = 0x0;
355 netdev_dbg(slave->bond->dev, "Port %d Received status NOT full duplex update from adapter\n",
356 port->actor_port_number);
357 break;
360 return retval;
363 static void __ad_actor_update_port(struct port *port)
365 const struct bonding *bond = bond_get_bond_by_slave(port->slave);
367 port->actor_system = BOND_AD_INFO(bond).system.sys_mac_addr;
368 port->actor_system_priority = BOND_AD_INFO(bond).system.sys_priority;
/* Conversions */
374 * __ad_timer_to_ticks - convert a given timer type to AD module ticks
375 * @timer_type: which timer to operate
376 * @par: timer parameter. see below
378 * If @timer_type is %current_while_timer, @par indicates long/short timer.
379 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME,
380 * %SLOW_PERIODIC_TIME.
382 static u16 __ad_timer_to_ticks(u16 timer_type, u16 par)
384 u16 retval = 0; /* to silence the compiler */
386 switch (timer_type) {
387 case AD_CURRENT_WHILE_TIMER: /* for rx machine usage */
388 if (par)
389 retval = (AD_SHORT_TIMEOUT_TIME*ad_ticks_per_sec);
390 else
391 retval = (AD_LONG_TIMEOUT_TIME*ad_ticks_per_sec);
392 break;
393 case AD_ACTOR_CHURN_TIMER: /* for local churn machine */
394 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
395 break;
396 case AD_PERIODIC_TIMER: /* for periodic machine */
397 retval = (par*ad_ticks_per_sec); /* long timeout */
398 break;
399 case AD_PARTNER_CHURN_TIMER: /* for remote churn machine */
400 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
401 break;
402 case AD_WAIT_WHILE_TIMER: /* for selection machine */
403 retval = (AD_AGGREGATE_WAIT_TIME*ad_ticks_per_sec);
404 break;
407 return retval;
/* ================= ad_rx_machine helper functions ================== */
414 * __choose_matched - update a port's matched variable from a received lacpdu
415 * @lacpdu: the lacpdu we've received
416 * @port: the port we're looking at
418 * Update the value of the matched variable, using parameter values from a
419 * newly received lacpdu. Parameter values for the partner carried in the
420 * received PDU are compared with the corresponding operational parameter
421 * values for the actor. Matched is set to TRUE if all of these parameters
422 * match and the PDU parameter partner_state.aggregation has the same value as
423 * actor_oper_port_state.aggregation and lacp will actively maintain the link
424 * in the aggregation. Matched is also set to TRUE if the value of
425 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates
426 * an individual link and lacp will actively maintain the link. Otherwise,
427 * matched is set to FALSE. LACP is considered to be actively maintaining the
428 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both
429 * the actor's actor_oper_port_state.lacp_activity and the PDU's
430 * partner_state.lacp_activity variables are TRUE.
432 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is
433 * used here to implement the language from 802.3ad 43.4.9 that requires
434 * recordPDU to "match" the LACPDU parameters to the stored values.
436 static void __choose_matched(struct lacpdu *lacpdu, struct port *port)
438 /* check if all parameters are alike
439 * or this is individual link(aggregation == FALSE)
440 * then update the state machine Matched variable.
442 if (((ntohs(lacpdu->partner_port) == port->actor_port_number) &&
443 (ntohs(lacpdu->partner_port_priority) == port->actor_port_priority) &&
444 MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) &&
445 (ntohs(lacpdu->partner_system_priority) == port->actor_system_priority) &&
446 (ntohs(lacpdu->partner_key) == port->actor_oper_port_key) &&
447 ((lacpdu->partner_state & AD_STATE_AGGREGATION) == (port->actor_oper_port_state & AD_STATE_AGGREGATION))) ||
448 ((lacpdu->actor_state & AD_STATE_AGGREGATION) == 0)
450 port->sm_vars |= AD_PORT_MATCHED;
451 } else {
452 port->sm_vars &= ~AD_PORT_MATCHED;
457 * __record_pdu - record parameters from a received lacpdu
458 * @lacpdu: the lacpdu we've received
459 * @port: the port we're looking at
461 * Record the parameter values for the Actor carried in a received lacpdu as
462 * the current partner operational parameter values and sets
463 * actor_oper_port_state.defaulted to FALSE.
465 static void __record_pdu(struct lacpdu *lacpdu, struct port *port)
467 if (lacpdu && port) {
468 struct port_params *partner = &port->partner_oper;
470 __choose_matched(lacpdu, port);
471 /* record the new parameter values for the partner
472 * operational
474 partner->port_number = ntohs(lacpdu->actor_port);
475 partner->port_priority = ntohs(lacpdu->actor_port_priority);
476 partner->system = lacpdu->actor_system;
477 partner->system_priority = ntohs(lacpdu->actor_system_priority);
478 partner->key = ntohs(lacpdu->actor_key);
479 partner->port_state = lacpdu->actor_state;
481 /* set actor_oper_port_state.defaulted to FALSE */
482 port->actor_oper_port_state &= ~AD_STATE_DEFAULTED;
484 /* set the partner sync. to on if the partner is sync,
485 * and the port is matched
487 if ((port->sm_vars & AD_PORT_MATCHED) &&
488 (lacpdu->actor_state & AD_STATE_SYNCHRONIZATION)) {
489 partner->port_state |= AD_STATE_SYNCHRONIZATION;
490 pr_debug("%s partner sync=1\n", port->slave->dev->name);
491 } else {
492 partner->port_state &= ~AD_STATE_SYNCHRONIZATION;
493 pr_debug("%s partner sync=0\n", port->slave->dev->name);
499 * __record_default - record default parameters
500 * @port: the port we're looking at
502 * This function records the default parameter values for the partner carried
503 * in the Partner Admin parameters as the current partner operational parameter
504 * values and sets actor_oper_port_state.defaulted to TRUE.
506 static void __record_default(struct port *port)
508 if (port) {
509 /* record the partner admin parameters */
510 memcpy(&port->partner_oper, &port->partner_admin,
511 sizeof(struct port_params));
513 /* set actor_oper_port_state.defaulted to true */
514 port->actor_oper_port_state |= AD_STATE_DEFAULTED;
519 * __update_selected - update a port's Selected variable from a received lacpdu
520 * @lacpdu: the lacpdu we've received
521 * @port: the port we're looking at
523 * Update the value of the selected variable, using parameter values from a
524 * newly received lacpdu. The parameter values for the Actor carried in the
525 * received PDU are compared with the corresponding operational parameter
526 * values for the ports partner. If one or more of the comparisons shows that
527 * the value(s) received in the PDU differ from the current operational values,
528 * then selected is set to FALSE and actor_oper_port_state.synchronization is
529 * set to out_of_sync. Otherwise, selected remains unchanged.
531 static void __update_selected(struct lacpdu *lacpdu, struct port *port)
533 if (lacpdu && port) {
534 const struct port_params *partner = &port->partner_oper;
536 /* check if any parameter is different then
537 * update the state machine selected variable.
539 if (ntohs(lacpdu->actor_port) != partner->port_number ||
540 ntohs(lacpdu->actor_port_priority) != partner->port_priority ||
541 !MAC_ADDRESS_EQUAL(&lacpdu->actor_system, &partner->system) ||
542 ntohs(lacpdu->actor_system_priority) != partner->system_priority ||
543 ntohs(lacpdu->actor_key) != partner->key ||
544 (lacpdu->actor_state & AD_STATE_AGGREGATION) != (partner->port_state & AD_STATE_AGGREGATION)) {
545 port->sm_vars &= ~AD_PORT_SELECTED;
551 * __update_default_selected - update a port's Selected variable from Partner
552 * @port: the port we're looking at
554 * This function updates the value of the selected variable, using the partner
555 * administrative parameter values. The administrative values are compared with
556 * the corresponding operational parameter values for the partner. If one or
557 * more of the comparisons shows that the administrative value(s) differ from
558 * the current operational values, then Selected is set to FALSE and
559 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise,
560 * Selected remains unchanged.
562 static void __update_default_selected(struct port *port)
564 if (port) {
565 const struct port_params *admin = &port->partner_admin;
566 const struct port_params *oper = &port->partner_oper;
568 /* check if any parameter is different then
569 * update the state machine selected variable.
571 if (admin->port_number != oper->port_number ||
572 admin->port_priority != oper->port_priority ||
573 !MAC_ADDRESS_EQUAL(&admin->system, &oper->system) ||
574 admin->system_priority != oper->system_priority ||
575 admin->key != oper->key ||
576 (admin->port_state & AD_STATE_AGGREGATION)
577 != (oper->port_state & AD_STATE_AGGREGATION)) {
578 port->sm_vars &= ~AD_PORT_SELECTED;
584 * __update_ntt - update a port's ntt variable from a received lacpdu
585 * @lacpdu: the lacpdu we've received
586 * @port: the port we're looking at
588 * Updates the value of the ntt variable, using parameter values from a newly
589 * received lacpdu. The parameter values for the partner carried in the
590 * received PDU are compared with the corresponding operational parameter
591 * values for the Actor. If one or more of the comparisons shows that the
592 * value(s) received in the PDU differ from the current operational values,
593 * then ntt is set to TRUE. Otherwise, ntt remains unchanged.
595 static void __update_ntt(struct lacpdu *lacpdu, struct port *port)
597 /* validate lacpdu and port */
598 if (lacpdu && port) {
599 /* check if any parameter is different then
600 * update the port->ntt.
602 if ((ntohs(lacpdu->partner_port) != port->actor_port_number) ||
603 (ntohs(lacpdu->partner_port_priority) != port->actor_port_priority) ||
604 !MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) ||
605 (ntohs(lacpdu->partner_system_priority) != port->actor_system_priority) ||
606 (ntohs(lacpdu->partner_key) != port->actor_oper_port_key) ||
607 ((lacpdu->partner_state & AD_STATE_LACP_ACTIVITY) != (port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY)) ||
608 ((lacpdu->partner_state & AD_STATE_LACP_TIMEOUT) != (port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT)) ||
609 ((lacpdu->partner_state & AD_STATE_SYNCHRONIZATION) != (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) ||
610 ((lacpdu->partner_state & AD_STATE_AGGREGATION) != (port->actor_oper_port_state & AD_STATE_AGGREGATION))
612 port->ntt = true;
618 * __agg_ports_are_ready - check if all ports in an aggregator are ready
619 * @aggregator: the aggregator we're looking at
622 static int __agg_ports_are_ready(struct aggregator *aggregator)
624 struct port *port;
625 int retval = 1;
627 if (aggregator) {
628 /* scan all ports in this aggregator to verfy if they are
629 * all ready.
631 for (port = aggregator->lag_ports;
632 port;
633 port = port->next_port_in_aggregator) {
634 if (!(port->sm_vars & AD_PORT_READY_N)) {
635 retval = 0;
636 break;
641 return retval;
645 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator
646 * @aggregator: the aggregator we're looking at
647 * @val: Should the ports' ready bit be set on or off
650 static void __set_agg_ports_ready(struct aggregator *aggregator, int val)
652 struct port *port;
654 for (port = aggregator->lag_ports; port;
655 port = port->next_port_in_aggregator) {
656 if (val)
657 port->sm_vars |= AD_PORT_READY;
658 else
659 port->sm_vars &= ~AD_PORT_READY;
663 static int __agg_active_ports(struct aggregator *agg)
665 struct port *port;
666 int active = 0;
668 for (port = agg->lag_ports; port;
669 port = port->next_port_in_aggregator) {
670 if (port->is_enabled)
671 active++;
674 return active;
678 * __get_agg_bandwidth - get the total bandwidth of an aggregator
679 * @aggregator: the aggregator we're looking at
682 static u32 __get_agg_bandwidth(struct aggregator *aggregator)
684 int nports = __agg_active_ports(aggregator);
685 u32 bandwidth = 0;
687 if (nports) {
688 switch (__get_link_speed(aggregator->lag_ports)) {
689 case AD_LINK_SPEED_1MBPS:
690 bandwidth = nports;
691 break;
692 case AD_LINK_SPEED_10MBPS:
693 bandwidth = nports * 10;
694 break;
695 case AD_LINK_SPEED_100MBPS:
696 bandwidth = nports * 100;
697 break;
698 case AD_LINK_SPEED_1000MBPS:
699 bandwidth = nports * 1000;
700 break;
701 case AD_LINK_SPEED_2500MBPS:
702 bandwidth = nports * 2500;
703 break;
704 case AD_LINK_SPEED_10000MBPS:
705 bandwidth = nports * 10000;
706 break;
707 case AD_LINK_SPEED_20000MBPS:
708 bandwidth = nports * 20000;
709 break;
710 case AD_LINK_SPEED_40000MBPS:
711 bandwidth = nports * 40000;
712 break;
713 case AD_LINK_SPEED_56000MBPS:
714 bandwidth = nports * 56000;
715 break;
716 case AD_LINK_SPEED_100000MBPS:
717 bandwidth = nports * 100000;
718 break;
719 default:
720 bandwidth = 0; /* to silence the compiler */
723 return bandwidth;
727 * __get_active_agg - get the current active aggregator
728 * @aggregator: the aggregator we're looking at
730 * Caller must hold RCU lock.
732 static struct aggregator *__get_active_agg(struct aggregator *aggregator)
734 struct bonding *bond = aggregator->slave->bond;
735 struct list_head *iter;
736 struct slave *slave;
738 bond_for_each_slave_rcu(bond, slave, iter)
739 if (SLAVE_AD_INFO(slave)->aggregator.is_active)
740 return &(SLAVE_AD_INFO(slave)->aggregator);
742 return NULL;
746 * __update_lacpdu_from_port - update a port's lacpdu fields
747 * @port: the port we're looking at
749 static inline void __update_lacpdu_from_port(struct port *port)
751 struct lacpdu *lacpdu = &port->lacpdu;
752 const struct port_params *partner = &port->partner_oper;
754 /* update current actual Actor parameters
755 * lacpdu->subtype initialized
756 * lacpdu->version_number initialized
757 * lacpdu->tlv_type_actor_info initialized
758 * lacpdu->actor_information_length initialized
761 lacpdu->actor_system_priority = htons(port->actor_system_priority);
762 lacpdu->actor_system = port->actor_system;
763 lacpdu->actor_key = htons(port->actor_oper_port_key);
764 lacpdu->actor_port_priority = htons(port->actor_port_priority);
765 lacpdu->actor_port = htons(port->actor_port_number);
766 lacpdu->actor_state = port->actor_oper_port_state;
767 pr_debug("update lacpdu: %s, actor port state %x\n",
768 port->slave->dev->name, port->actor_oper_port_state);
770 /* lacpdu->reserved_3_1 initialized
771 * lacpdu->tlv_type_partner_info initialized
772 * lacpdu->partner_information_length initialized
775 lacpdu->partner_system_priority = htons(partner->system_priority);
776 lacpdu->partner_system = partner->system;
777 lacpdu->partner_key = htons(partner->key);
778 lacpdu->partner_port_priority = htons(partner->port_priority);
779 lacpdu->partner_port = htons(partner->port_number);
780 lacpdu->partner_state = partner->port_state;
782 /* lacpdu->reserved_3_2 initialized
783 * lacpdu->tlv_type_collector_info initialized
784 * lacpdu->collector_information_length initialized
785 * collector_max_delay initialized
786 * reserved_12[12] initialized
787 * tlv_type_terminator initialized
788 * terminator_length initialized
789 * reserved_50[50] initialized
/* ================= main 802.3ad protocol code ========================= */
796 * ad_lacpdu_send - send out a lacpdu packet on a given port
797 * @port: the port we're looking at
799 * Returns: 0 on success
800 * < 0 on error
802 static int ad_lacpdu_send(struct port *port)
804 struct slave *slave = port->slave;
805 struct sk_buff *skb;
806 struct lacpdu_header *lacpdu_header;
807 int length = sizeof(struct lacpdu_header);
809 skb = dev_alloc_skb(length);
810 if (!skb)
811 return -ENOMEM;
813 skb->dev = slave->dev;
814 skb_reset_mac_header(skb);
815 skb->network_header = skb->mac_header + ETH_HLEN;
816 skb->protocol = PKT_TYPE_LACPDU;
817 skb->priority = TC_PRIO_CONTROL;
819 lacpdu_header = (struct lacpdu_header *)skb_put(skb, length);
821 ether_addr_copy(lacpdu_header->hdr.h_dest, lacpdu_mcast_addr);
822 /* Note: source address is set to be the member's PERMANENT address,
823 * because we use it to identify loopback lacpdus in receive.
825 ether_addr_copy(lacpdu_header->hdr.h_source, slave->perm_hwaddr);
826 lacpdu_header->hdr.h_proto = PKT_TYPE_LACPDU;
828 lacpdu_header->lacpdu = port->lacpdu;
830 dev_queue_xmit(skb);
832 return 0;
836 * ad_marker_send - send marker information/response on a given port
837 * @port: the port we're looking at
838 * @marker: marker data to send
840 * Returns: 0 on success
841 * < 0 on error
843 static int ad_marker_send(struct port *port, struct bond_marker *marker)
845 struct slave *slave = port->slave;
846 struct sk_buff *skb;
847 struct bond_marker_header *marker_header;
848 int length = sizeof(struct bond_marker_header);
850 skb = dev_alloc_skb(length + 16);
851 if (!skb)
852 return -ENOMEM;
854 skb_reserve(skb, 16);
856 skb->dev = slave->dev;
857 skb_reset_mac_header(skb);
858 skb->network_header = skb->mac_header + ETH_HLEN;
859 skb->protocol = PKT_TYPE_LACPDU;
861 marker_header = (struct bond_marker_header *)skb_put(skb, length);
863 ether_addr_copy(marker_header->hdr.h_dest, lacpdu_mcast_addr);
864 /* Note: source address is set to be the member's PERMANENT address,
865 * because we use it to identify loopback MARKERs in receive.
867 ether_addr_copy(marker_header->hdr.h_source, slave->perm_hwaddr);
868 marker_header->hdr.h_proto = PKT_TYPE_LACPDU;
870 marker_header->marker = *marker;
872 dev_queue_xmit(skb);
874 return 0;
878 * ad_mux_machine - handle a port's mux state machine
879 * @port: the port we're looking at
880 * @update_slave_arr: Does slave array need update?
882 static void ad_mux_machine(struct port *port, bool *update_slave_arr)
884 mux_states_t last_state;
886 /* keep current State Machine state to compare later if it was
887 * changed
889 last_state = port->sm_mux_state;
891 if (port->sm_vars & AD_PORT_BEGIN) {
892 port->sm_mux_state = AD_MUX_DETACHED;
893 } else {
894 switch (port->sm_mux_state) {
895 case AD_MUX_DETACHED:
896 if ((port->sm_vars & AD_PORT_SELECTED)
897 || (port->sm_vars & AD_PORT_STANDBY))
898 /* if SELECTED or STANDBY */
899 port->sm_mux_state = AD_MUX_WAITING;
900 break;
901 case AD_MUX_WAITING:
902 /* if SELECTED == FALSE return to DETACH state */
903 if (!(port->sm_vars & AD_PORT_SELECTED)) {
904 port->sm_vars &= ~AD_PORT_READY_N;
905 /* in order to withhold the Selection Logic to
906 * check all ports READY_N value every callback
907 * cycle to update ready variable, we check
908 * READY_N and update READY here
910 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
911 port->sm_mux_state = AD_MUX_DETACHED;
912 break;
915 /* check if the wait_while_timer expired */
916 if (port->sm_mux_timer_counter
917 && !(--port->sm_mux_timer_counter))
918 port->sm_vars |= AD_PORT_READY_N;
920 /* in order to withhold the selection logic to check
921 * all ports READY_N value every callback cycle to
922 * update ready variable, we check READY_N and update
923 * READY here
925 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
927 /* if the wait_while_timer expired, and the port is
928 * in READY state, move to ATTACHED state
930 if ((port->sm_vars & AD_PORT_READY)
931 && !port->sm_mux_timer_counter)
932 port->sm_mux_state = AD_MUX_ATTACHED;
933 break;
934 case AD_MUX_ATTACHED:
935 /* check also if agg_select_timer expired (so the
936 * edable port will take place only after this timer)
938 if ((port->sm_vars & AD_PORT_SELECTED) &&
939 (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) &&
940 !__check_agg_selection_timer(port)) {
941 if (port->aggregator->is_active)
942 port->sm_mux_state =
943 AD_MUX_COLLECTING_DISTRIBUTING;
944 } else if (!(port->sm_vars & AD_PORT_SELECTED) ||
945 (port->sm_vars & AD_PORT_STANDBY)) {
946 /* if UNSELECTED or STANDBY */
947 port->sm_vars &= ~AD_PORT_READY_N;
948 /* in order to withhold the selection logic to
949 * check all ports READY_N value every callback
950 * cycle to update ready variable, we check
951 * READY_N and update READY here
953 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
954 port->sm_mux_state = AD_MUX_DETACHED;
955 } else if (port->aggregator->is_active) {
956 port->actor_oper_port_state |=
957 AD_STATE_SYNCHRONIZATION;
959 break;
960 case AD_MUX_COLLECTING_DISTRIBUTING:
961 if (!(port->sm_vars & AD_PORT_SELECTED) ||
962 (port->sm_vars & AD_PORT_STANDBY) ||
963 !(port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) ||
964 !(port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) {
965 port->sm_mux_state = AD_MUX_ATTACHED;
966 } else {
967 /* if port state hasn't changed make
968 * sure that a collecting distributing
969 * port in an active aggregator is enabled
971 if (port->aggregator &&
972 port->aggregator->is_active &&
973 !__port_is_enabled(port)) {
975 __enable_port(port);
978 break;
979 default:
980 break;
984 /* check if the state machine was changed */
985 if (port->sm_mux_state != last_state) {
986 pr_debug("Mux Machine: Port=%d (%s), Last State=%d, Curr State=%d\n",
987 port->actor_port_number,
988 port->slave->dev->name,
989 last_state,
990 port->sm_mux_state);
991 switch (port->sm_mux_state) {
992 case AD_MUX_DETACHED:
993 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
994 ad_disable_collecting_distributing(port,
995 update_slave_arr);
996 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
997 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
998 port->ntt = true;
999 break;
1000 case AD_MUX_WAITING:
1001 port->sm_mux_timer_counter = __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER, 0);
1002 break;
1003 case AD_MUX_ATTACHED:
1004 if (port->aggregator->is_active)
1005 port->actor_oper_port_state |=
1006 AD_STATE_SYNCHRONIZATION;
1007 else
1008 port->actor_oper_port_state &=
1009 ~AD_STATE_SYNCHRONIZATION;
1010 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
1011 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
1012 ad_disable_collecting_distributing(port,
1013 update_slave_arr);
1014 port->ntt = true;
1015 break;
1016 case AD_MUX_COLLECTING_DISTRIBUTING:
1017 port->actor_oper_port_state |= AD_STATE_COLLECTING;
1018 port->actor_oper_port_state |= AD_STATE_DISTRIBUTING;
1019 port->actor_oper_port_state |= AD_STATE_SYNCHRONIZATION;
1020 ad_enable_collecting_distributing(port,
1021 update_slave_arr);
1022 port->ntt = true;
1023 break;
1024 default:
1025 break;
1031 * ad_rx_machine - handle a port's rx State Machine
1032 * @lacpdu: the lacpdu we've received
1033 * @port: the port we're looking at
1035 * If lacpdu arrived, stop previous timer (if exists) and set the next state as
1036 * CURRENT. If timer expired set the state machine in the proper state.
1037 * In other cases, this function checks if we need to switch to other state.
1039 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port)
1041 rx_states_t last_state;
1043 /* keep current State Machine state to compare later if it was
1044 * changed
1046 last_state = port->sm_rx_state;
1048 /* check if state machine should change state */
1050 /* first, check if port was reinitialized */
1051 if (port->sm_vars & AD_PORT_BEGIN) {
1052 port->sm_rx_state = AD_RX_INITIALIZE;
1053 port->sm_vars |= AD_PORT_CHURNED;
1054 /* check if port is not enabled */
1055 } else if (!(port->sm_vars & AD_PORT_BEGIN)
1056 && !port->is_enabled && !(port->sm_vars & AD_PORT_MOVED))
1057 port->sm_rx_state = AD_RX_PORT_DISABLED;
1058 /* check if new lacpdu arrived */
1059 else if (lacpdu && ((port->sm_rx_state == AD_RX_EXPIRED) ||
1060 (port->sm_rx_state == AD_RX_DEFAULTED) ||
1061 (port->sm_rx_state == AD_RX_CURRENT))) {
1062 if (port->sm_rx_state != AD_RX_CURRENT)
1063 port->sm_vars |= AD_PORT_CHURNED;
1064 port->sm_rx_timer_counter = 0;
1065 port->sm_rx_state = AD_RX_CURRENT;
1066 } else {
1067 /* if timer is on, and if it is expired */
1068 if (port->sm_rx_timer_counter &&
1069 !(--port->sm_rx_timer_counter)) {
1070 switch (port->sm_rx_state) {
1071 case AD_RX_EXPIRED:
1072 port->sm_rx_state = AD_RX_DEFAULTED;
1073 break;
1074 case AD_RX_CURRENT:
1075 port->sm_rx_state = AD_RX_EXPIRED;
1076 break;
1077 default:
1078 break;
1080 } else {
1081 /* if no lacpdu arrived and no timer is on */
1082 switch (port->sm_rx_state) {
1083 case AD_RX_PORT_DISABLED:
1084 if (port->sm_vars & AD_PORT_MOVED)
1085 port->sm_rx_state = AD_RX_INITIALIZE;
1086 else if (port->is_enabled
1087 && (port->sm_vars
1088 & AD_PORT_LACP_ENABLED))
1089 port->sm_rx_state = AD_RX_EXPIRED;
1090 else if (port->is_enabled
1091 && ((port->sm_vars
1092 & AD_PORT_LACP_ENABLED) == 0))
1093 port->sm_rx_state = AD_RX_LACP_DISABLED;
1094 break;
1095 default:
1096 break;
1102 /* check if the State machine was changed or new lacpdu arrived */
1103 if ((port->sm_rx_state != last_state) || (lacpdu)) {
1104 pr_debug("Rx Machine: Port=%d (%s), Last State=%d, Curr State=%d\n",
1105 port->actor_port_number,
1106 port->slave->dev->name,
1107 last_state,
1108 port->sm_rx_state);
1109 switch (port->sm_rx_state) {
1110 case AD_RX_INITIALIZE:
1111 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS))
1112 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1113 else
1114 port->sm_vars |= AD_PORT_LACP_ENABLED;
1115 port->sm_vars &= ~AD_PORT_SELECTED;
1116 __record_default(port);
1117 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1118 port->sm_vars &= ~AD_PORT_MOVED;
1119 port->sm_rx_state = AD_RX_PORT_DISABLED;
1121 /* Fall Through */
1122 case AD_RX_PORT_DISABLED:
1123 port->sm_vars &= ~AD_PORT_MATCHED;
1124 break;
1125 case AD_RX_LACP_DISABLED:
1126 port->sm_vars &= ~AD_PORT_SELECTED;
1127 __record_default(port);
1128 port->partner_oper.port_state &= ~AD_STATE_AGGREGATION;
1129 port->sm_vars |= AD_PORT_MATCHED;
1130 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1131 break;
1132 case AD_RX_EXPIRED:
1133 /* Reset of the Synchronization flag (Standard 43.4.12)
1134 * This reset cause to disable this port in the
1135 * COLLECTING_DISTRIBUTING state of the mux machine in
1136 * case of EXPIRED even if LINK_DOWN didn't arrive for
1137 * the port.
1139 port->partner_oper.port_state &= ~AD_STATE_SYNCHRONIZATION;
1140 port->sm_vars &= ~AD_PORT_MATCHED;
1141 port->partner_oper.port_state |= AD_STATE_LACP_TIMEOUT;
1142 port->partner_oper.port_state |= AD_STATE_LACP_ACTIVITY;
1143 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT));
1144 port->actor_oper_port_state |= AD_STATE_EXPIRED;
1145 port->sm_vars |= AD_PORT_CHURNED;
1146 break;
1147 case AD_RX_DEFAULTED:
1148 __update_default_selected(port);
1149 __record_default(port);
1150 port->sm_vars |= AD_PORT_MATCHED;
1151 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1152 break;
1153 case AD_RX_CURRENT:
1154 /* detect loopback situation */
1155 if (MAC_ADDRESS_EQUAL(&(lacpdu->actor_system),
1156 &(port->actor_system))) {
1157 netdev_err(port->slave->bond->dev, "An illegal loopback occurred on adapter (%s)\n"
1158 "Check the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n",
1159 port->slave->dev->name);
1160 return;
1162 __update_selected(lacpdu, port);
1163 __update_ntt(lacpdu, port);
1164 __record_pdu(lacpdu, port);
1165 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT));
1166 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1167 break;
1168 default:
1169 break;
1175 * ad_churn_machine - handle port churn's state machine
1176 * @port: the port we're looking at
1179 static void ad_churn_machine(struct port *port)
1181 if (port->sm_vars & AD_PORT_CHURNED) {
1182 port->sm_vars &= ~AD_PORT_CHURNED;
1183 port->sm_churn_actor_state = AD_CHURN_MONITOR;
1184 port->sm_churn_partner_state = AD_CHURN_MONITOR;
1185 port->sm_churn_actor_timer_counter =
1186 __ad_timer_to_ticks(AD_ACTOR_CHURN_TIMER, 0);
1187 port->sm_churn_partner_timer_counter =
1188 __ad_timer_to_ticks(AD_PARTNER_CHURN_TIMER, 0);
1189 return;
1191 if (port->sm_churn_actor_timer_counter &&
1192 !(--port->sm_churn_actor_timer_counter) &&
1193 port->sm_churn_actor_state == AD_CHURN_MONITOR) {
1194 if (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION) {
1195 port->sm_churn_actor_state = AD_NO_CHURN;
1196 } else {
1197 port->churn_actor_count++;
1198 port->sm_churn_actor_state = AD_CHURN;
1201 if (port->sm_churn_partner_timer_counter &&
1202 !(--port->sm_churn_partner_timer_counter) &&
1203 port->sm_churn_partner_state == AD_CHURN_MONITOR) {
1204 if (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) {
1205 port->sm_churn_partner_state = AD_NO_CHURN;
1206 } else {
1207 port->churn_partner_count++;
1208 port->sm_churn_partner_state = AD_CHURN;
1214 * ad_tx_machine - handle a port's tx state machine
1215 * @port: the port we're looking at
1217 static void ad_tx_machine(struct port *port)
1219 /* check if tx timer expired, to verify that we do not send more than
1220 * 3 packets per second
1222 if (port->sm_tx_timer_counter && !(--port->sm_tx_timer_counter)) {
1223 /* check if there is something to send */
1224 if (port->ntt && (port->sm_vars & AD_PORT_LACP_ENABLED)) {
1225 __update_lacpdu_from_port(port);
1227 if (ad_lacpdu_send(port) >= 0) {
1228 pr_debug("Sent LACPDU on port %d\n",
1229 port->actor_port_number);
1231 /* mark ntt as false, so it will not be sent
1232 * again until demanded
1234 port->ntt = false;
1237 /* restart tx timer(to verify that we will not exceed
1238 * AD_MAX_TX_IN_SECOND
1240 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1245 * ad_periodic_machine - handle a port's periodic state machine
1246 * @port: the port we're looking at
1248 * Turn ntt flag on priodically to perform periodic transmission of lacpdu's.
1250 static void ad_periodic_machine(struct port *port)
1252 periodic_states_t last_state;
1254 /* keep current state machine state to compare later if it was changed */
1255 last_state = port->sm_periodic_state;
1257 /* check if port was reinitialized */
1258 if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) ||
1259 (!(port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & AD_STATE_LACP_ACTIVITY))
1261 port->sm_periodic_state = AD_NO_PERIODIC;
1263 /* check if state machine should change state */
1264 else if (port->sm_periodic_timer_counter) {
1265 /* check if periodic state machine expired */
1266 if (!(--port->sm_periodic_timer_counter)) {
1267 /* if expired then do tx */
1268 port->sm_periodic_state = AD_PERIODIC_TX;
1269 } else {
1270 /* If not expired, check if there is some new timeout
1271 * parameter from the partner state
1273 switch (port->sm_periodic_state) {
1274 case AD_FAST_PERIODIC:
1275 if (!(port->partner_oper.port_state
1276 & AD_STATE_LACP_TIMEOUT))
1277 port->sm_periodic_state = AD_SLOW_PERIODIC;
1278 break;
1279 case AD_SLOW_PERIODIC:
1280 if ((port->partner_oper.port_state & AD_STATE_LACP_TIMEOUT)) {
1281 port->sm_periodic_timer_counter = 0;
1282 port->sm_periodic_state = AD_PERIODIC_TX;
1284 break;
1285 default:
1286 break;
1289 } else {
1290 switch (port->sm_periodic_state) {
1291 case AD_NO_PERIODIC:
1292 port->sm_periodic_state = AD_FAST_PERIODIC;
1293 break;
1294 case AD_PERIODIC_TX:
1295 if (!(port->partner_oper.port_state &
1296 AD_STATE_LACP_TIMEOUT))
1297 port->sm_periodic_state = AD_SLOW_PERIODIC;
1298 else
1299 port->sm_periodic_state = AD_FAST_PERIODIC;
1300 break;
1301 default:
1302 break;
1306 /* check if the state machine was changed */
1307 if (port->sm_periodic_state != last_state) {
1308 pr_debug("Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n",
1309 port->actor_port_number, last_state,
1310 port->sm_periodic_state);
1311 switch (port->sm_periodic_state) {
1312 case AD_NO_PERIODIC:
1313 port->sm_periodic_timer_counter = 0;
1314 break;
1315 case AD_FAST_PERIODIC:
1316 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1317 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_FAST_PERIODIC_TIME))-1;
1318 break;
1319 case AD_SLOW_PERIODIC:
1320 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1321 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_SLOW_PERIODIC_TIME))-1;
1322 break;
1323 case AD_PERIODIC_TX:
1324 port->ntt = true;
1325 break;
1326 default:
1327 break;
1333 * ad_port_selection_logic - select aggregation groups
1334 * @port: the port we're looking at
1335 * @update_slave_arr: Does slave array need update?
1337 * Select aggregation groups, and assign each port for it's aggregetor. The
1338 * selection logic is called in the inititalization (after all the handshkes),
1339 * and after every lacpdu receive (if selected is off).
1341 static void ad_port_selection_logic(struct port *port, bool *update_slave_arr)
1343 struct aggregator *aggregator, *free_aggregator = NULL, *temp_aggregator;
1344 struct port *last_port = NULL, *curr_port;
1345 struct list_head *iter;
1346 struct bonding *bond;
1347 struct slave *slave;
1348 int found = 0;
1350 /* if the port is already Selected, do nothing */
1351 if (port->sm_vars & AD_PORT_SELECTED)
1352 return;
1354 bond = __get_bond_by_port(port);
1356 /* if the port is connected to other aggregator, detach it */
1357 if (port->aggregator) {
1358 /* detach the port from its former aggregator */
1359 temp_aggregator = port->aggregator;
1360 for (curr_port = temp_aggregator->lag_ports; curr_port;
1361 last_port = curr_port,
1362 curr_port = curr_port->next_port_in_aggregator) {
1363 if (curr_port == port) {
1364 temp_aggregator->num_of_ports--;
1365 /* if it is the first port attached to the
1366 * aggregator
1368 if (!last_port) {
1369 temp_aggregator->lag_ports =
1370 port->next_port_in_aggregator;
1371 } else {
1372 /* not the first port attached to the
1373 * aggregator
1375 last_port->next_port_in_aggregator =
1376 port->next_port_in_aggregator;
1379 /* clear the port's relations to this
1380 * aggregator
1382 port->aggregator = NULL;
1383 port->next_port_in_aggregator = NULL;
1384 port->actor_port_aggregator_identifier = 0;
1386 netdev_dbg(bond->dev, "Port %d left LAG %d\n",
1387 port->actor_port_number,
1388 temp_aggregator->aggregator_identifier);
1389 /* if the aggregator is empty, clear its
1390 * parameters, and set it ready to be attached
1392 if (!temp_aggregator->lag_ports)
1393 ad_clear_agg(temp_aggregator);
1394 break;
1397 if (!curr_port) {
1398 /* meaning: the port was related to an aggregator
1399 * but was not on the aggregator port list
1401 net_warn_ratelimited("%s: Warning: Port %d (on %s) was related to aggregator %d but was not on its port list\n",
1402 port->slave->bond->dev->name,
1403 port->actor_port_number,
1404 port->slave->dev->name,
1405 port->aggregator->aggregator_identifier);
1408 /* search on all aggregators for a suitable aggregator for this port */
1409 bond_for_each_slave(bond, slave, iter) {
1410 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
1412 /* keep a free aggregator for later use(if needed) */
1413 if (!aggregator->lag_ports) {
1414 if (!free_aggregator)
1415 free_aggregator = aggregator;
1416 continue;
1418 /* check if current aggregator suits us */
1419 if (((aggregator->actor_oper_aggregator_key == port->actor_oper_port_key) && /* if all parameters match AND */
1420 MAC_ADDRESS_EQUAL(&(aggregator->partner_system), &(port->partner_oper.system)) &&
1421 (aggregator->partner_system_priority == port->partner_oper.system_priority) &&
1422 (aggregator->partner_oper_aggregator_key == port->partner_oper.key)
1423 ) &&
1424 ((!MAC_ADDRESS_EQUAL(&(port->partner_oper.system), &(null_mac_addr)) && /* partner answers */
1425 !aggregator->is_individual) /* but is not individual OR */
1428 /* attach to the founded aggregator */
1429 port->aggregator = aggregator;
1430 port->actor_port_aggregator_identifier =
1431 port->aggregator->aggregator_identifier;
1432 port->next_port_in_aggregator = aggregator->lag_ports;
1433 port->aggregator->num_of_ports++;
1434 aggregator->lag_ports = port;
1435 netdev_dbg(bond->dev, "Port %d joined LAG %d(existing LAG)\n",
1436 port->actor_port_number,
1437 port->aggregator->aggregator_identifier);
1439 /* mark this port as selected */
1440 port->sm_vars |= AD_PORT_SELECTED;
1441 found = 1;
1442 break;
1446 /* the port couldn't find an aggregator - attach it to a new
1447 * aggregator
1449 if (!found) {
1450 if (free_aggregator) {
1451 /* assign port a new aggregator */
1452 port->aggregator = free_aggregator;
1453 port->actor_port_aggregator_identifier =
1454 port->aggregator->aggregator_identifier;
1456 /* update the new aggregator's parameters
1457 * if port was responsed from the end-user
1459 if (port->actor_oper_port_key & AD_DUPLEX_KEY_MASKS)
1460 /* if port is full duplex */
1461 port->aggregator->is_individual = false;
1462 else
1463 port->aggregator->is_individual = true;
1465 port->aggregator->actor_admin_aggregator_key =
1466 port->actor_admin_port_key;
1467 port->aggregator->actor_oper_aggregator_key =
1468 port->actor_oper_port_key;
1469 port->aggregator->partner_system =
1470 port->partner_oper.system;
1471 port->aggregator->partner_system_priority =
1472 port->partner_oper.system_priority;
1473 port->aggregator->partner_oper_aggregator_key = port->partner_oper.key;
1474 port->aggregator->receive_state = 1;
1475 port->aggregator->transmit_state = 1;
1476 port->aggregator->lag_ports = port;
1477 port->aggregator->num_of_ports++;
1479 /* mark this port as selected */
1480 port->sm_vars |= AD_PORT_SELECTED;
1482 netdev_dbg(bond->dev, "Port %d joined LAG %d(new LAG)\n",
1483 port->actor_port_number,
1484 port->aggregator->aggregator_identifier);
1485 } else {
1486 netdev_err(bond->dev, "Port %d (on %s) did not find a suitable aggregator\n",
1487 port->actor_port_number, port->slave->dev->name);
1490 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE
1491 * in all aggregator's ports, else set ready=FALSE in all
1492 * aggregator's ports
1494 __set_agg_ports_ready(port->aggregator,
1495 __agg_ports_are_ready(port->aggregator));
1497 aggregator = __get_first_agg(port);
1498 ad_agg_selection_logic(aggregator, update_slave_arr);
1500 if (!port->aggregator->is_active)
1501 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
1504 /* Decide if "agg" is a better choice for the new active aggregator that
1505 * the current best, according to the ad_select policy.
1507 static struct aggregator *ad_agg_selection_test(struct aggregator *best,
1508 struct aggregator *curr)
1510 /* 0. If no best, select current.
1512 * 1. If the current agg is not individual, and the best is
1513 * individual, select current.
1515 * 2. If current agg is individual and the best is not, keep best.
1517 * 3. Therefore, current and best are both individual or both not
1518 * individual, so:
1520 * 3a. If current agg partner replied, and best agg partner did not,
1521 * select current.
1523 * 3b. If current agg partner did not reply and best agg partner
1524 * did reply, keep best.
1526 * 4. Therefore, current and best both have partner replies or
1527 * both do not, so perform selection policy:
1529 * BOND_AD_COUNT: Select by count of ports. If count is equal,
1530 * select by bandwidth.
1532 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth.
1534 if (!best)
1535 return curr;
1537 if (!curr->is_individual && best->is_individual)
1538 return curr;
1540 if (curr->is_individual && !best->is_individual)
1541 return best;
1543 if (__agg_has_partner(curr) && !__agg_has_partner(best))
1544 return curr;
1546 if (!__agg_has_partner(curr) && __agg_has_partner(best))
1547 return best;
1549 switch (__get_agg_selection_mode(curr->lag_ports)) {
1550 case BOND_AD_COUNT:
1551 if (__agg_active_ports(curr) > __agg_active_ports(best))
1552 return curr;
1554 if (__agg_active_ports(curr) < __agg_active_ports(best))
1555 return best;
1557 /*FALLTHROUGH*/
1558 case BOND_AD_STABLE:
1559 case BOND_AD_BANDWIDTH:
1560 if (__get_agg_bandwidth(curr) > __get_agg_bandwidth(best))
1561 return curr;
1563 break;
1565 default:
1566 net_warn_ratelimited("%s: Impossible agg select mode %d\n",
1567 curr->slave->bond->dev->name,
1568 __get_agg_selection_mode(curr->lag_ports));
1569 break;
1572 return best;
1575 static int agg_device_up(const struct aggregator *agg)
1577 struct port *port = agg->lag_ports;
1579 if (!port)
1580 return 0;
1582 for (port = agg->lag_ports; port;
1583 port = port->next_port_in_aggregator) {
1584 if (netif_running(port->slave->dev) &&
1585 netif_carrier_ok(port->slave->dev))
1586 return 1;
1589 return 0;
1593 * ad_agg_selection_logic - select an aggregation group for a team
1594 * @aggregator: the aggregator we're looking at
1595 * @update_slave_arr: Does slave array need update?
1597 * It is assumed that only one aggregator may be selected for a team.
1599 * The logic of this function is to select the aggregator according to
1600 * the ad_select policy:
1602 * BOND_AD_STABLE: select the aggregator with the most ports attached to
1603 * it, and to reselect the active aggregator only if the previous
1604 * aggregator has no more ports related to it.
1606 * BOND_AD_BANDWIDTH: select the aggregator with the highest total
1607 * bandwidth, and reselect whenever a link state change takes place or the
1608 * set of slaves in the bond changes.
1610 * BOND_AD_COUNT: select the aggregator with largest number of ports
1611 * (slaves), and reselect whenever a link state change takes place or the
1612 * set of slaves in the bond changes.
1614 * FIXME: this function MUST be called with the first agg in the bond, or
1615 * __get_active_agg() won't work correctly. This function should be better
1616 * called with the bond itself, and retrieve the first agg from it.
1618 static void ad_agg_selection_logic(struct aggregator *agg,
1619 bool *update_slave_arr)
1621 struct aggregator *best, *active, *origin;
1622 struct bonding *bond = agg->slave->bond;
1623 struct list_head *iter;
1624 struct slave *slave;
1625 struct port *port;
1627 rcu_read_lock();
1628 origin = agg;
1629 active = __get_active_agg(agg);
1630 best = (active && agg_device_up(active)) ? active : NULL;
1632 bond_for_each_slave_rcu(bond, slave, iter) {
1633 agg = &(SLAVE_AD_INFO(slave)->aggregator);
1635 agg->is_active = 0;
1637 if (__agg_active_ports(agg) && agg_device_up(agg))
1638 best = ad_agg_selection_test(best, agg);
1641 if (best &&
1642 __get_agg_selection_mode(best->lag_ports) == BOND_AD_STABLE) {
1643 /* For the STABLE policy, don't replace the old active
1644 * aggregator if it's still active (it has an answering
1645 * partner) or if both the best and active don't have an
1646 * answering partner.
1648 if (active && active->lag_ports &&
1649 __agg_active_ports(active) &&
1650 (__agg_has_partner(active) ||
1651 (!__agg_has_partner(active) &&
1652 !__agg_has_partner(best)))) {
1653 if (!(!active->actor_oper_aggregator_key &&
1654 best->actor_oper_aggregator_key)) {
1655 best = NULL;
1656 active->is_active = 1;
1661 if (best && (best == active)) {
1662 best = NULL;
1663 active->is_active = 1;
1666 /* if there is new best aggregator, activate it */
1667 if (best) {
1668 netdev_dbg(bond->dev, "best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1669 best->aggregator_identifier, best->num_of_ports,
1670 best->actor_oper_aggregator_key,
1671 best->partner_oper_aggregator_key,
1672 best->is_individual, best->is_active);
1673 netdev_dbg(bond->dev, "best ports %p slave %p %s\n",
1674 best->lag_ports, best->slave,
1675 best->slave ? best->slave->dev->name : "NULL");
1677 bond_for_each_slave_rcu(bond, slave, iter) {
1678 agg = &(SLAVE_AD_INFO(slave)->aggregator);
1680 netdev_dbg(bond->dev, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1681 agg->aggregator_identifier, agg->num_of_ports,
1682 agg->actor_oper_aggregator_key,
1683 agg->partner_oper_aggregator_key,
1684 agg->is_individual, agg->is_active);
1687 /* check if any partner replys */
1688 if (best->is_individual) {
1689 net_warn_ratelimited("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n",
1690 best->slave ?
1691 best->slave->bond->dev->name : "NULL");
1694 best->is_active = 1;
1695 netdev_dbg(bond->dev, "LAG %d chosen as the active LAG\n",
1696 best->aggregator_identifier);
1697 netdev_dbg(bond->dev, "Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1698 best->aggregator_identifier, best->num_of_ports,
1699 best->actor_oper_aggregator_key,
1700 best->partner_oper_aggregator_key,
1701 best->is_individual, best->is_active);
1703 /* disable the ports that were related to the former
1704 * active_aggregator
1706 if (active) {
1707 for (port = active->lag_ports; port;
1708 port = port->next_port_in_aggregator) {
1709 __disable_port(port);
1712 /* Slave array needs update. */
1713 *update_slave_arr = true;
1716 /* if the selected aggregator is of join individuals
1717 * (partner_system is NULL), enable their ports
1719 active = __get_active_agg(origin);
1721 if (active) {
1722 if (!__agg_has_partner(active)) {
1723 for (port = active->lag_ports; port;
1724 port = port->next_port_in_aggregator) {
1725 __enable_port(port);
1730 rcu_read_unlock();
1732 bond_3ad_set_carrier(bond);
1736 * ad_clear_agg - clear a given aggregator's parameters
1737 * @aggregator: the aggregator we're looking at
1739 static void ad_clear_agg(struct aggregator *aggregator)
1741 if (aggregator) {
1742 aggregator->is_individual = false;
1743 aggregator->actor_admin_aggregator_key = 0;
1744 aggregator->actor_oper_aggregator_key = 0;
1745 eth_zero_addr(aggregator->partner_system.mac_addr_value);
1746 aggregator->partner_system_priority = 0;
1747 aggregator->partner_oper_aggregator_key = 0;
1748 aggregator->receive_state = 0;
1749 aggregator->transmit_state = 0;
1750 aggregator->lag_ports = NULL;
1751 aggregator->is_active = 0;
1752 aggregator->num_of_ports = 0;
1753 pr_debug("LAG %d was cleared\n",
1754 aggregator->aggregator_identifier);
1759 * ad_initialize_agg - initialize a given aggregator's parameters
1760 * @aggregator: the aggregator we're looking at
1762 static void ad_initialize_agg(struct aggregator *aggregator)
1764 if (aggregator) {
1765 ad_clear_agg(aggregator);
1767 eth_zero_addr(aggregator->aggregator_mac_address.mac_addr_value);
1768 aggregator->aggregator_identifier = 0;
1769 aggregator->slave = NULL;
1774 * ad_initialize_port - initialize a given port's parameters
1775 * @aggregator: the aggregator we're looking at
1776 * @lacp_fast: boolean. whether fast periodic should be used
1778 static void ad_initialize_port(struct port *port, int lacp_fast)
1780 static const struct port_params tmpl = {
1781 .system_priority = 0xffff,
1782 .key = 1,
1783 .port_number = 1,
1784 .port_priority = 0xff,
1785 .port_state = 1,
1787 static const struct lacpdu lacpdu = {
1788 .subtype = 0x01,
1789 .version_number = 0x01,
1790 .tlv_type_actor_info = 0x01,
1791 .actor_information_length = 0x14,
1792 .tlv_type_partner_info = 0x02,
1793 .partner_information_length = 0x14,
1794 .tlv_type_collector_info = 0x03,
1795 .collector_information_length = 0x10,
1796 .collector_max_delay = htons(AD_COLLECTOR_MAX_DELAY),
1799 if (port) {
1800 port->actor_port_priority = 0xff;
1801 port->actor_port_aggregator_identifier = 0;
1802 port->ntt = false;
1803 port->actor_admin_port_state = AD_STATE_AGGREGATION |
1804 AD_STATE_LACP_ACTIVITY;
1805 port->actor_oper_port_state = AD_STATE_AGGREGATION |
1806 AD_STATE_LACP_ACTIVITY;
1808 if (lacp_fast)
1809 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
1811 memcpy(&port->partner_admin, &tmpl, sizeof(tmpl));
1812 memcpy(&port->partner_oper, &tmpl, sizeof(tmpl));
1814 port->is_enabled = true;
1815 /* private parameters */
1816 port->sm_vars = AD_PORT_BEGIN | AD_PORT_LACP_ENABLED;
1817 port->sm_rx_state = 0;
1818 port->sm_rx_timer_counter = 0;
1819 port->sm_periodic_state = 0;
1820 port->sm_periodic_timer_counter = 0;
1821 port->sm_mux_state = 0;
1822 port->sm_mux_timer_counter = 0;
1823 port->sm_tx_state = 0;
1824 port->aggregator = NULL;
1825 port->next_port_in_aggregator = NULL;
1826 port->transaction_id = 0;
1828 port->sm_churn_actor_timer_counter = 0;
1829 port->sm_churn_actor_state = 0;
1830 port->churn_actor_count = 0;
1831 port->sm_churn_partner_timer_counter = 0;
1832 port->sm_churn_partner_state = 0;
1833 port->churn_partner_count = 0;
1835 memcpy(&port->lacpdu, &lacpdu, sizeof(lacpdu));
1840 * ad_enable_collecting_distributing - enable a port's transmit/receive
1841 * @port: the port we're looking at
1842 * @update_slave_arr: Does slave array need update?
1844 * Enable @port if it's in an active aggregator
1846 static void ad_enable_collecting_distributing(struct port *port,
1847 bool *update_slave_arr)
1849 if (port->aggregator->is_active) {
1850 pr_debug("Enabling port %d(LAG %d)\n",
1851 port->actor_port_number,
1852 port->aggregator->aggregator_identifier);
1853 __enable_port(port);
1854 /* Slave array needs update */
1855 *update_slave_arr = true;
1860 * ad_disable_collecting_distributing - disable a port's transmit/receive
1861 * @port: the port we're looking at
1862 * @update_slave_arr: Does slave array need update?
1864 static void ad_disable_collecting_distributing(struct port *port,
1865 bool *update_slave_arr)
1867 if (port->aggregator &&
1868 !MAC_ADDRESS_EQUAL(&(port->aggregator->partner_system),
1869 &(null_mac_addr))) {
1870 pr_debug("Disabling port %d(LAG %d)\n",
1871 port->actor_port_number,
1872 port->aggregator->aggregator_identifier);
1873 __disable_port(port);
1874 /* Slave array needs an update */
1875 *update_slave_arr = true;
1880 * ad_marker_info_received - handle receive of a Marker information frame
1881 * @marker_info: Marker info received
1882 * @port: the port we're looking at
1884 static void ad_marker_info_received(struct bond_marker *marker_info,
1885 struct port *port)
1887 struct bond_marker marker;
1889 /* copy the received marker data to the response marker */
1890 memcpy(&marker, marker_info, sizeof(struct bond_marker));
1891 /* change the marker subtype to marker response */
1892 marker.tlv_type = AD_MARKER_RESPONSE_SUBTYPE;
1894 /* send the marker response */
1895 if (ad_marker_send(port, &marker) >= 0) {
1896 pr_debug("Sent Marker Response on port %d\n",
1897 port->actor_port_number);
/**
 * ad_marker_response_received - handle receive of a marker response frame
 * @marker: marker PDU received (unused)
 * @port: the port we're looking at (unused)
 *
 * Intentionally empty: sending marker PDUs and handling their responses is
 * not implemented at this stage; only marker information frames are
 * answered.
 */
static void ad_marker_response_received(struct bond_marker *marker,
					struct port *port)
{
	/* DO NOTHING, SINCE WE DECIDED NOT TO IMPLEMENT THIS FEATURE FOR NOW */
}

1916 /* ========= AD exported functions to the main bonding code ========= */
/* Delay, in seconds, before the aggregator selection is run after initialization */
1919 #define AD_AGGREGATOR_SELECTION_TIMER 8
1922 * bond_3ad_initiate_agg_selection - initate aggregator selection
1923 * @bond: bonding struct
1925 * Set the aggregation selection timer, to initiate an agg selection in
1926 * the very near future. Called during first initialization, and during
1927 * any down to up transitions of the bond.
1929 void bond_3ad_initiate_agg_selection(struct bonding *bond, int timeout)
1931 BOND_AD_INFO(bond).agg_select_timer = timeout;
1935 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures
1936 * @bond: bonding struct to work on
1937 * @tick_resolution: tick duration (millisecond resolution)
1939 * Can be called only after the mac address of the bond is set.
1941 void bond_3ad_initialize(struct bonding *bond, u16 tick_resolution)
1943 /* check that the bond is not initialized yet */
1944 if (!MAC_ADDRESS_EQUAL(&(BOND_AD_INFO(bond).system.sys_mac_addr),
1945 bond->dev->dev_addr)) {
1947 BOND_AD_INFO(bond).aggregator_identifier = 0;
1949 BOND_AD_INFO(bond).system.sys_priority =
1950 bond->params.ad_actor_sys_prio;
1951 if (is_zero_ether_addr(bond->params.ad_actor_system))
1952 BOND_AD_INFO(bond).system.sys_mac_addr =
1953 *((struct mac_addr *)bond->dev->dev_addr);
1954 else
1955 BOND_AD_INFO(bond).system.sys_mac_addr =
1956 *((struct mac_addr *)bond->params.ad_actor_system);
1958 /* initialize how many times this module is called in one
1959 * second (should be about every 100ms)
1961 ad_ticks_per_sec = tick_resolution;
1963 bond_3ad_initiate_agg_selection(bond,
1964 AD_AGGREGATOR_SELECTION_TIMER *
1965 ad_ticks_per_sec);
1970 * bond_3ad_bind_slave - initialize a slave's port
1971 * @slave: slave struct to work on
1973 * Returns: 0 on success
1974 * < 0 on error
1976 void bond_3ad_bind_slave(struct slave *slave)
1978 struct bonding *bond = bond_get_bond_by_slave(slave);
1979 struct port *port;
1980 struct aggregator *aggregator;
1982 /* check that the slave has not been initialized yet. */
1983 if (SLAVE_AD_INFO(slave)->port.slave != slave) {
1985 /* port initialization */
1986 port = &(SLAVE_AD_INFO(slave)->port);
1988 ad_initialize_port(port, bond->params.lacp_fast);
1990 port->slave = slave;
1991 port->actor_port_number = SLAVE_AD_INFO(slave)->id;
1992 /* key is determined according to the link speed, duplex and
1993 * user key
1995 port->actor_admin_port_key = bond->params.ad_user_port_key << 6;
1996 ad_update_actor_keys(port, false);
1997 /* actor system is the bond's system */
1998 __ad_actor_update_port(port);
1999 /* tx timer(to verify that no more than MAX_TX_IN_SECOND
2000 * lacpdu's are sent in one second)
2002 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
2004 __disable_port(port);
2006 /* aggregator initialization */
2007 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
2009 ad_initialize_agg(aggregator);
2011 aggregator->aggregator_mac_address = *((struct mac_addr *)bond->dev->dev_addr);
2012 aggregator->aggregator_identifier = ++BOND_AD_INFO(bond).aggregator_identifier;
2013 aggregator->slave = slave;
2014 aggregator->is_active = 0;
2015 aggregator->num_of_ports = 0;
2020 * bond_3ad_unbind_slave - deinitialize a slave's port
2021 * @slave: slave struct to work on
2023 * Search for the aggregator that is related to this port, remove the
2024 * aggregator and assign another aggregator for other port related to it
2025 * (if any), and remove the port.
2027 void bond_3ad_unbind_slave(struct slave *slave)
2029 struct port *port, *prev_port, *temp_port;
2030 struct aggregator *aggregator, *new_aggregator, *temp_aggregator;
2031 int select_new_active_agg = 0;
2032 struct bonding *bond = slave->bond;
2033 struct slave *slave_iter;
2034 struct list_head *iter;
2035 bool dummy_slave_update; /* Ignore this value as caller updates array */
2037 /* Sync against bond_3ad_state_machine_handler() */
2038 spin_lock_bh(&bond->mode_lock);
2039 aggregator = &(SLAVE_AD_INFO(slave)->aggregator);
2040 port = &(SLAVE_AD_INFO(slave)->port);
2042 /* if slave is null, the whole port is not initialized */
2043 if (!port->slave) {
2044 netdev_warn(bond->dev, "Trying to unbind an uninitialized port on %s\n",
2045 slave->dev->name);
2046 goto out;
2049 netdev_dbg(bond->dev, "Unbinding Link Aggregation Group %d\n",
2050 aggregator->aggregator_identifier);
2052 /* Tell the partner that this port is not suitable for aggregation */
2053 port->actor_oper_port_state &= ~AD_STATE_AGGREGATION;
2054 __update_lacpdu_from_port(port);
2055 ad_lacpdu_send(port);
2057 /* check if this aggregator is occupied */
2058 if (aggregator->lag_ports) {
2059 /* check if there are other ports related to this aggregator
2060 * except the port related to this slave(thats ensure us that
2061 * there is a reason to search for new aggregator, and that we
2062 * will find one
2064 if ((aggregator->lag_ports != port) ||
2065 (aggregator->lag_ports->next_port_in_aggregator)) {
2066 /* find new aggregator for the related port(s) */
2067 bond_for_each_slave(bond, slave_iter, iter) {
2068 new_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
2069 /* if the new aggregator is empty, or it is
2070 * connected to our port only
2072 if (!new_aggregator->lag_ports ||
2073 ((new_aggregator->lag_ports == port) &&
2074 !new_aggregator->lag_ports->next_port_in_aggregator))
2075 break;
2077 if (!slave_iter)
2078 new_aggregator = NULL;
2080 /* if new aggregator found, copy the aggregator's
2081 * parameters and connect the related lag_ports to the
2082 * new aggregator
2084 if ((new_aggregator) && ((!new_aggregator->lag_ports) || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator))) {
2085 netdev_dbg(bond->dev, "Some port(s) related to LAG %d - replacing with LAG %d\n",
2086 aggregator->aggregator_identifier,
2087 new_aggregator->aggregator_identifier);
2089 if ((new_aggregator->lag_ports == port) &&
2090 new_aggregator->is_active) {
2091 netdev_info(bond->dev, "Removing an active aggregator\n");
2092 select_new_active_agg = 1;
2095 new_aggregator->is_individual = aggregator->is_individual;
2096 new_aggregator->actor_admin_aggregator_key = aggregator->actor_admin_aggregator_key;
2097 new_aggregator->actor_oper_aggregator_key = aggregator->actor_oper_aggregator_key;
2098 new_aggregator->partner_system = aggregator->partner_system;
2099 new_aggregator->partner_system_priority = aggregator->partner_system_priority;
2100 new_aggregator->partner_oper_aggregator_key = aggregator->partner_oper_aggregator_key;
2101 new_aggregator->receive_state = aggregator->receive_state;
2102 new_aggregator->transmit_state = aggregator->transmit_state;
2103 new_aggregator->lag_ports = aggregator->lag_ports;
2104 new_aggregator->is_active = aggregator->is_active;
2105 new_aggregator->num_of_ports = aggregator->num_of_ports;
2107 /* update the information that is written on
2108 * the ports about the aggregator
2110 for (temp_port = aggregator->lag_ports; temp_port;
2111 temp_port = temp_port->next_port_in_aggregator) {
2112 temp_port->aggregator = new_aggregator;
2113 temp_port->actor_port_aggregator_identifier = new_aggregator->aggregator_identifier;
2116 ad_clear_agg(aggregator);
2118 if (select_new_active_agg)
2119 ad_agg_selection_logic(__get_first_agg(port),
2120 &dummy_slave_update);
2121 } else {
2122 netdev_warn(bond->dev, "unbinding aggregator, and could not find a new aggregator for its ports\n");
2124 } else {
2125 /* in case that the only port related to this
2126 * aggregator is the one we want to remove
2128 select_new_active_agg = aggregator->is_active;
2129 ad_clear_agg(aggregator);
2130 if (select_new_active_agg) {
2131 netdev_info(bond->dev, "Removing an active aggregator\n");
2132 /* select new active aggregator */
2133 temp_aggregator = __get_first_agg(port);
2134 if (temp_aggregator)
2135 ad_agg_selection_logic(temp_aggregator,
2136 &dummy_slave_update);
2141 netdev_dbg(bond->dev, "Unbinding port %d\n", port->actor_port_number);
2143 /* find the aggregator that this port is connected to */
2144 bond_for_each_slave(bond, slave_iter, iter) {
2145 temp_aggregator = &(SLAVE_AD_INFO(slave_iter)->aggregator);
2146 prev_port = NULL;
2147 /* search the port in the aggregator's related ports */
2148 for (temp_port = temp_aggregator->lag_ports; temp_port;
2149 prev_port = temp_port,
2150 temp_port = temp_port->next_port_in_aggregator) {
2151 if (temp_port == port) {
2152 /* the aggregator found - detach the port from
2153 * this aggregator
2155 if (prev_port)
2156 prev_port->next_port_in_aggregator = temp_port->next_port_in_aggregator;
2157 else
2158 temp_aggregator->lag_ports = temp_port->next_port_in_aggregator;
2159 temp_aggregator->num_of_ports--;
2160 if (__agg_active_ports(temp_aggregator) == 0) {
2161 select_new_active_agg = temp_aggregator->is_active;
2162 ad_clear_agg(temp_aggregator);
2163 if (select_new_active_agg) {
2164 netdev_info(bond->dev, "Removing an active aggregator\n");
2165 /* select new active aggregator */
2166 ad_agg_selection_logic(__get_first_agg(port),
2167 &dummy_slave_update);
2170 break;
2174 port->slave = NULL;
2176 out:
2177 spin_unlock_bh(&bond->mode_lock);
2181 * bond_3ad_update_ad_actor_settings - reflect change of actor settings to ports
2182 * @bond: bonding struct to work on
2184 * If an ad_actor setting gets changed we need to update the individual port
2185 * settings so the bond device will use the new values when it gets upped.
2187 void bond_3ad_update_ad_actor_settings(struct bonding *bond)
2189 struct list_head *iter;
2190 struct slave *slave;
2192 ASSERT_RTNL();
2194 BOND_AD_INFO(bond).system.sys_priority = bond->params.ad_actor_sys_prio;
2195 if (is_zero_ether_addr(bond->params.ad_actor_system))
2196 BOND_AD_INFO(bond).system.sys_mac_addr =
2197 *((struct mac_addr *)bond->dev->dev_addr);
2198 else
2199 BOND_AD_INFO(bond).system.sys_mac_addr =
2200 *((struct mac_addr *)bond->params.ad_actor_system);
2202 spin_lock_bh(&bond->mode_lock);
2203 bond_for_each_slave(bond, slave, iter) {
2204 struct port *port = &(SLAVE_AD_INFO(slave))->port;
2206 __ad_actor_update_port(port);
2207 port->ntt = true;
2209 spin_unlock_bh(&bond->mode_lock);
2213 * bond_3ad_state_machine_handler - handle state machines timeout
2214 * @bond: bonding struct to work on
2216 * The state machine handling concept in this module is to check every tick
2217 * which state machine should operate any function. The execution order is
2218 * round robin, so when we have an interaction between state machines, the
2219 * reply of one to each other might be delayed until next tick.
2221 * This function also complete the initialization when the agg_select_timer
2222 * times out, and it selects an aggregator for the ports that are yet not
2223 * related to any aggregator, and selects the active aggregator for a bond.
2225 void bond_3ad_state_machine_handler(struct work_struct *work)
2227 struct bonding *bond = container_of(work, struct bonding,
2228 ad_work.work);
2229 struct aggregator *aggregator;
2230 struct list_head *iter;
2231 struct slave *slave;
2232 struct port *port;
2233 bool should_notify_rtnl = BOND_SLAVE_NOTIFY_LATER;
2234 bool update_slave_arr = false;
2236 /* Lock to protect data accessed by all (e.g., port->sm_vars) and
2237 * against running with bond_3ad_unbind_slave. ad_rx_machine may run
2238 * concurrently due to incoming LACPDU as well.
2240 spin_lock_bh(&bond->mode_lock);
2241 rcu_read_lock();
2243 /* check if there are any slaves */
2244 if (!bond_has_slaves(bond))
2245 goto re_arm;
2247 /* check if agg_select_timer timer after initialize is timed out */
2248 if (BOND_AD_INFO(bond).agg_select_timer &&
2249 !(--BOND_AD_INFO(bond).agg_select_timer)) {
2250 slave = bond_first_slave_rcu(bond);
2251 port = slave ? &(SLAVE_AD_INFO(slave)->port) : NULL;
2253 /* select the active aggregator for the bond */
2254 if (port) {
2255 if (!port->slave) {
2256 net_warn_ratelimited("%s: Warning: bond's first port is uninitialized\n",
2257 bond->dev->name);
2258 goto re_arm;
2261 aggregator = __get_first_agg(port);
2262 ad_agg_selection_logic(aggregator, &update_slave_arr);
2264 bond_3ad_set_carrier(bond);
2267 /* for each port run the state machines */
2268 bond_for_each_slave_rcu(bond, slave, iter) {
2269 port = &(SLAVE_AD_INFO(slave)->port);
2270 if (!port->slave) {
2271 net_warn_ratelimited("%s: Warning: Found an uninitialized port\n",
2272 bond->dev->name);
2273 goto re_arm;
2276 ad_rx_machine(NULL, port);
2277 ad_periodic_machine(port);
2278 ad_port_selection_logic(port, &update_slave_arr);
2279 ad_mux_machine(port, &update_slave_arr);
2280 ad_tx_machine(port);
2281 ad_churn_machine(port);
2283 /* turn off the BEGIN bit, since we already handled it */
2284 if (port->sm_vars & AD_PORT_BEGIN)
2285 port->sm_vars &= ~AD_PORT_BEGIN;
2288 re_arm:
2289 bond_for_each_slave_rcu(bond, slave, iter) {
2290 if (slave->should_notify) {
2291 should_notify_rtnl = BOND_SLAVE_NOTIFY_NOW;
2292 break;
2295 rcu_read_unlock();
2296 spin_unlock_bh(&bond->mode_lock);
2298 if (update_slave_arr)
2299 bond_slave_arr_work_rearm(bond, 0);
2301 if (should_notify_rtnl && rtnl_trylock()) {
2302 bond_slave_state_notify(bond);
2303 rtnl_unlock();
2305 queue_delayed_work(bond->wq, &bond->ad_work, ad_delta_in_ticks);
2309 * bond_3ad_rx_indication - handle a received frame
2310 * @lacpdu: received lacpdu
2311 * @slave: slave struct to work on
2312 * @length: length of the data received
2314 * It is assumed that frames that were sent on this NIC don't returned as new
2315 * received frames (loopback). Since only the payload is given to this
2316 * function, it check for loopback.
2318 static int bond_3ad_rx_indication(struct lacpdu *lacpdu, struct slave *slave,
2319 u16 length)
2321 struct port *port;
2322 int ret = RX_HANDLER_ANOTHER;
2324 if (length >= sizeof(struct lacpdu)) {
2326 port = &(SLAVE_AD_INFO(slave)->port);
2328 if (!port->slave) {
2329 net_warn_ratelimited("%s: Warning: port of slave %s is uninitialized\n",
2330 slave->dev->name, slave->bond->dev->name);
2331 return ret;
2334 switch (lacpdu->subtype) {
2335 case AD_TYPE_LACPDU:
2336 ret = RX_HANDLER_CONSUMED;
2337 netdev_dbg(slave->bond->dev,
2338 "Received LACPDU on port %d slave %s\n",
2339 port->actor_port_number,
2340 slave->dev->name);
2341 /* Protect against concurrent state machines */
2342 spin_lock(&slave->bond->mode_lock);
2343 ad_rx_machine(lacpdu, port);
2344 spin_unlock(&slave->bond->mode_lock);
2345 break;
2347 case AD_TYPE_MARKER:
2348 ret = RX_HANDLER_CONSUMED;
2349 /* No need to convert fields to Little Endian since we
2350 * don't use the marker's fields.
2353 switch (((struct bond_marker *)lacpdu)->tlv_type) {
2354 case AD_MARKER_INFORMATION_SUBTYPE:
2355 netdev_dbg(slave->bond->dev, "Received Marker Information on port %d\n",
2356 port->actor_port_number);
2357 ad_marker_info_received((struct bond_marker *)lacpdu, port);
2358 break;
2360 case AD_MARKER_RESPONSE_SUBTYPE:
2361 netdev_dbg(slave->bond->dev, "Received Marker Response on port %d\n",
2362 port->actor_port_number);
2363 ad_marker_response_received((struct bond_marker *)lacpdu, port);
2364 break;
2366 default:
2367 netdev_dbg(slave->bond->dev, "Received an unknown Marker subtype on slot %d\n",
2368 port->actor_port_number);
2372 return ret;
2376 * ad_update_actor_keys - Update the oper / admin keys for a port based on
2377 * its current speed and duplex settings.
2379 * @port: the port we'are looking at
2380 * @reset: Boolean to just reset the speed and the duplex part of the key
2382 * The logic to change the oper / admin keys is:
2383 * (a) A full duplex port can participate in LACP with partner.
2384 * (b) When the speed is changed, LACP need to be reinitiated.
2386 static void ad_update_actor_keys(struct port *port, bool reset)
2388 u8 duplex = 0;
2389 u16 ospeed = 0, speed = 0;
2390 u16 old_oper_key = port->actor_oper_port_key;
2392 port->actor_admin_port_key &= ~(AD_SPEED_KEY_MASKS|AD_DUPLEX_KEY_MASKS);
2393 if (!reset) {
2394 speed = __get_link_speed(port);
2395 ospeed = (old_oper_key & AD_SPEED_KEY_MASKS) >> 1;
2396 duplex = __get_duplex(port);
2397 port->actor_admin_port_key |= (speed << 1) | duplex;
2399 port->actor_oper_port_key = port->actor_admin_port_key;
2401 if (old_oper_key != port->actor_oper_port_key) {
2402 /* Only 'duplex' port participates in LACP */
2403 if (duplex)
2404 port->sm_vars |= AD_PORT_LACP_ENABLED;
2405 else
2406 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
2408 if (!reset) {
2409 if (!speed) {
2410 netdev_err(port->slave->dev,
2411 "speed changed to 0 for port %s",
2412 port->slave->dev->name);
2413 } else if (duplex && ospeed != speed) {
2414 /* Speed change restarts LACP state-machine */
2415 port->sm_vars |= AD_PORT_BEGIN;
2422 * bond_3ad_adapter_speed_duplex_changed - handle a slave's speed / duplex
2423 * change indication
2425 * @slave: slave struct to work on
2427 * Handle reselection of aggregator (if needed) for this port.
2429 void bond_3ad_adapter_speed_duplex_changed(struct slave *slave)
2431 struct port *port;
2433 port = &(SLAVE_AD_INFO(slave)->port);
2435 /* if slave is null, the whole port is not initialized */
2436 if (!port->slave) {
2437 netdev_warn(slave->bond->dev,
2438 "speed/duplex changed for uninitialized port %s\n",
2439 slave->dev->name);
2440 return;
2443 spin_lock_bh(&slave->bond->mode_lock);
2444 ad_update_actor_keys(port, false);
2445 netdev_dbg(slave->bond->dev, "Port %d slave %s changed speed/duplex\n",
2446 port->actor_port_number, slave->dev->name);
2447 spin_unlock_bh(&slave->bond->mode_lock);
2451 * bond_3ad_handle_link_change - handle a slave's link status change indication
2452 * @slave: slave struct to work on
2453 * @status: whether the link is now up or down
2455 * Handle reselection of aggregator (if needed) for this port.
2457 void bond_3ad_handle_link_change(struct slave *slave, char link)
2459 struct aggregator *agg;
2460 struct port *port;
2461 bool dummy;
2463 port = &(SLAVE_AD_INFO(slave)->port);
2465 /* if slave is null, the whole port is not initialized */
2466 if (!port->slave) {
2467 netdev_warn(slave->bond->dev, "link status changed for uninitialized port on %s\n",
2468 slave->dev->name);
2469 return;
2472 spin_lock_bh(&slave->bond->mode_lock);
2473 /* on link down we are zeroing duplex and speed since
2474 * some of the adaptors(ce1000.lan) report full duplex/speed
2475 * instead of N/A(duplex) / 0(speed).
2477 * on link up we are forcing recheck on the duplex and speed since
2478 * some of he adaptors(ce1000.lan) report.
2480 if (link == BOND_LINK_UP) {
2481 port->is_enabled = true;
2482 ad_update_actor_keys(port, false);
2483 } else {
2484 /* link has failed */
2485 port->is_enabled = false;
2486 ad_update_actor_keys(port, true);
2488 agg = __get_first_agg(port);
2489 ad_agg_selection_logic(agg, &dummy);
2491 netdev_dbg(slave->bond->dev, "Port %d changed link status to %s\n",
2492 port->actor_port_number,
2493 link == BOND_LINK_UP ? "UP" : "DOWN");
2495 spin_unlock_bh(&slave->bond->mode_lock);
2497 /* RTNL is held and mode_lock is released so it's safe
2498 * to update slave_array here.
2500 bond_update_slave_arr(slave->bond, NULL);
2504 * bond_3ad_set_carrier - set link state for bonding master
2505 * @bond - bonding structure
2507 * if we have an active aggregator, we're up, if not, we're down.
2508 * Presumes that we cannot have an active aggregator if there are
2509 * no slaves with link up.
2511 * This behavior complies with IEEE 802.3 section 43.3.9.
2513 * Called by bond_set_carrier(). Return zero if carrier state does not
2514 * change, nonzero if it does.
2516 int bond_3ad_set_carrier(struct bonding *bond)
2518 struct aggregator *active;
2519 struct slave *first_slave;
2520 int ret = 1;
2522 rcu_read_lock();
2523 first_slave = bond_first_slave_rcu(bond);
2524 if (!first_slave) {
2525 ret = 0;
2526 goto out;
2528 active = __get_active_agg(&(SLAVE_AD_INFO(first_slave)->aggregator));
2529 if (active) {
2530 /* are enough slaves available to consider link up? */
2531 if (__agg_active_ports(active) < bond->params.min_links) {
2532 if (netif_carrier_ok(bond->dev)) {
2533 netif_carrier_off(bond->dev);
2534 goto out;
2536 } else if (!netif_carrier_ok(bond->dev)) {
2537 netif_carrier_on(bond->dev);
2538 goto out;
2540 } else if (netif_carrier_ok(bond->dev)) {
2541 netif_carrier_off(bond->dev);
2543 out:
2544 rcu_read_unlock();
2545 return ret;
2549 * __bond_3ad_get_active_agg_info - get information of the active aggregator
2550 * @bond: bonding struct to work on
2551 * @ad_info: ad_info struct to fill with the bond's info
2553 * Returns: 0 on success
2554 * < 0 on error
2556 int __bond_3ad_get_active_agg_info(struct bonding *bond,
2557 struct ad_info *ad_info)
2559 struct aggregator *aggregator = NULL;
2560 struct list_head *iter;
2561 struct slave *slave;
2562 struct port *port;
2564 bond_for_each_slave_rcu(bond, slave, iter) {
2565 port = &(SLAVE_AD_INFO(slave)->port);
2566 if (port->aggregator && port->aggregator->is_active) {
2567 aggregator = port->aggregator;
2568 break;
2572 if (!aggregator)
2573 return -1;
2575 ad_info->aggregator_id = aggregator->aggregator_identifier;
2576 ad_info->ports = aggregator->num_of_ports;
2577 ad_info->actor_key = aggregator->actor_oper_aggregator_key;
2578 ad_info->partner_key = aggregator->partner_oper_aggregator_key;
2579 ether_addr_copy(ad_info->partner_system,
2580 aggregator->partner_system.mac_addr_value);
2581 return 0;
/* RCU-protected wrapper: runs __bond_3ad_get_active_agg_info() inside an
 * RCU read-side critical section and hands its return value back unchanged.
 */
int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info)
{
	int rc;

	rcu_read_lock();
	rc = __bond_3ad_get_active_agg_info(bond, ad_info);
	rcu_read_unlock();

	return rc;
}
2595 int bond_3ad_lacpdu_recv(const struct sk_buff *skb, struct bonding *bond,
2596 struct slave *slave)
2598 struct lacpdu *lacpdu, _lacpdu;
2600 if (skb->protocol != PKT_TYPE_LACPDU)
2601 return RX_HANDLER_ANOTHER;
2603 if (!MAC_ADDRESS_EQUAL(eth_hdr(skb)->h_dest, lacpdu_mcast_addr))
2604 return RX_HANDLER_ANOTHER;
2606 lacpdu = skb_header_pointer(skb, 0, sizeof(_lacpdu), &_lacpdu);
2607 if (!lacpdu)
2608 return RX_HANDLER_ANOTHER;
2610 return bond_3ad_rx_indication(lacpdu, slave, skb->len);
2614 * bond_3ad_update_lacp_rate - change the lacp rate
2615 * @bond - bonding struct
2617 * When modify lacp_rate parameter via sysfs,
2618 * update actor_oper_port_state of each port.
2620 * Hold bond->mode_lock,
2621 * so we can modify port->actor_oper_port_state,
2622 * no matter bond is up or down.
2624 void bond_3ad_update_lacp_rate(struct bonding *bond)
2626 struct port *port = NULL;
2627 struct list_head *iter;
2628 struct slave *slave;
2629 int lacp_fast;
2631 lacp_fast = bond->params.lacp_fast;
2632 spin_lock_bh(&bond->mode_lock);
2633 bond_for_each_slave(bond, slave, iter) {
2634 port = &(SLAVE_AD_INFO(slave)->port);
2635 if (lacp_fast)
2636 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
2637 else
2638 port->actor_oper_port_state &= ~AD_STATE_LACP_TIMEOUT;
2640 spin_unlock_bh(&bond->mode_lock);