On Tue, Nov 06, 2007 at 02:33:53AM -0800, akpm@linux-foundation.org wrote:
[mmotm.git] / drivers / net / bonding / bond_3ad.c
blobc3fa31c9f2a7440f893f60ba10e6007ac9150251
1 /*
2 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms of the GNU General Public License as published by the Free
6 * Software Foundation; either version 2 of the License, or (at your option)
7 * any later version.
9 * This program is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
12 * more details.
14 * You should have received a copy of the GNU General Public License along with
15 * this program; if not, write to the Free Software Foundation, Inc., 59
16 * Temple Place - Suite 330, Boston, MA 02111-1307, USA.
18 * The full GNU General Public License is included in this distribution in the
19 * file called LICENSE.
23 #include <linux/skbuff.h>
24 #include <linux/if_ether.h>
25 #include <linux/netdevice.h>
26 #include <linux/spinlock.h>
27 #include <linux/ethtool.h>
28 #include <linux/etherdevice.h>
29 #include <linux/if_bonding.h>
30 #include <linux/pkt_sched.h>
31 #include <net/net_namespace.h>
32 #include "bonding.h"
33 #include "bond_3ad.h"
/* General definitions */
#define AD_SHORT_TIMEOUT		1
#define AD_LONG_TIMEOUT			0
#define AD_STANDBY			0x2
#define AD_MAX_TX_IN_SECOND		3
#define AD_COLLECTOR_MAX_DELAY		0

/* Timer definitions (43.4.4 in the 802.3ad standard) */
#define AD_FAST_PERIODIC_TIME		1
#define AD_SLOW_PERIODIC_TIME		30
#define AD_SHORT_TIMEOUT_TIME		(3*AD_FAST_PERIODIC_TIME)
#define AD_LONG_TIMEOUT_TIME		(3*AD_SLOW_PERIODIC_TIME)
#define AD_CHURN_DETECTION_TIME		60
#define AD_AGGREGATE_WAIT_TIME		2

/* Port state definitions (43.4.2.2 in the 802.3ad standard) */
#define AD_STATE_LACP_ACTIVITY		0x1
#define AD_STATE_LACP_TIMEOUT		0x2
#define AD_STATE_AGGREGATION		0x4
#define AD_STATE_SYNCHRONIZATION	0x8
#define AD_STATE_COLLECTING		0x10
#define AD_STATE_DISTRIBUTING		0x20
#define AD_STATE_DEFAULTED		0x40
#define AD_STATE_EXPIRED		0x80

/*
 * Port variable definitions used by the state machines
 * (43.4.7 in the 802.3ad standard); these are the bits kept in sm_vars.
 */
#define AD_PORT_BEGIN			0x1
#define AD_PORT_LACP_ENABLED		0x2
#define AD_PORT_ACTOR_CHURN		0x4
#define AD_PORT_PARTNER_CHURN		0x8
#define AD_PORT_READY			0x10
#define AD_PORT_READY_N			0x20
#define AD_PORT_MATCHED			0x40
#define AD_PORT_STANDBY			0x80
#define AD_PORT_SELECTED		0x100
#define AD_PORT_MOVED			0x200

/*
 * Port Key definitions
 *
 * The key is determined according to the link speed, the duplex and the
 * user key (the user key is not supported yet):
 *
 *            ---------------------------------------------
 * Port key : |     User key      |    Speed     | Duplex |
 *            ---------------------------------------------
 *            16                  6              1        0
 */
#define AD_DUPLEX_KEY_BITS		0x1
#define AD_SPEED_KEY_BITS		0x3E
#define AD_USER_KEY_BITS		0xFFC0

/* dalloun */
#define AD_LINK_SPEED_BITMASK_1MBPS	0x1
#define AD_LINK_SPEED_BITMASK_10MBPS	0x2
#define AD_LINK_SPEED_BITMASK_100MBPS	0x4
#define AD_LINK_SPEED_BITMASK_1000MBPS	0x8
#define AD_LINK_SPEED_BITMASK_10000MBPS	0x10
/* endalloun */

/*
 * Compare MAC addresses: expands to memcmp() over ETH_ALEN bytes, so the
 * result is zero when the two addresses are equal.
 */
#define MAC_ADDRESS_COMPARE(A, B) memcmp(A, B, ETH_ALEN)
94 static struct mac_addr null_mac_addr = {{0, 0, 0, 0, 0, 0}};
95 static u16 ad_ticks_per_sec;
96 static const int ad_delta_in_ticks = (AD_TIMER_INTERVAL * HZ) / 1000;
98 static const u8 lacpdu_mcast_addr[ETH_ALEN] = MULTICAST_LACPDU_ADDR;
/* ================= main 802.3ad protocol functions ================== */

/* frame transmission */
static int ad_lacpdu_send(struct port *port);
static int ad_marker_send(struct port *port, struct bond_marker *marker);

/* per-port state machines */
static void ad_mux_machine(struct port *port);
static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port);
static void ad_tx_machine(struct port *port);
static void ad_periodic_machine(struct port *port);

/* selection logic */
static void ad_port_selection_logic(struct port *port);
static void ad_agg_selection_logic(struct aggregator *aggregator);

/* aggregator / port set-up and tear-down */
static void ad_clear_agg(struct aggregator *aggregator);
static void ad_initialize_agg(struct aggregator *aggregator);
static void ad_initialize_port(struct port *port, int lacp_fast);

/* collecting / distributing control */
static void ad_enable_collecting_distributing(struct port *port);
static void ad_disable_collecting_distributing(struct port *port);

/* marker protocol handling */
static void ad_marker_info_received(struct bond_marker *marker_info, struct port *port);
static void ad_marker_response_received(struct bond_marker *marker, struct port *port);
118 /////////////////////////////////////////////////////////////////////////////////
119 // ================= api to bonding and kernel code ==================
120 /////////////////////////////////////////////////////////////////////////////////
123 * __get_bond_by_port - get the port's bonding struct
124 * @port: the port we're looking at
126 * Return @port's bonding struct, or %NULL if it can't be found.
128 static inline struct bonding *__get_bond_by_port(struct port *port)
130 if (port->slave == NULL) {
131 return NULL;
134 return bond_get_bond_by_slave(port->slave);
138 * __get_first_port - get the first port in the bond
139 * @bond: the bond we're looking at
141 * Return the port of the first slave in @bond, or %NULL if it can't be found.
143 static inline struct port *__get_first_port(struct bonding *bond)
145 if (bond->slave_cnt == 0) {
146 return NULL;
149 return &(SLAVE_AD_INFO(bond->first_slave).port);
153 * __get_next_port - get the next port in the bond
154 * @port: the port we're looking at
156 * Return the port of the slave that is next in line of @port's slave in the
157 * bond, or %NULL if it can't be found.
159 static inline struct port *__get_next_port(struct port *port)
161 struct bonding *bond = __get_bond_by_port(port);
162 struct slave *slave = port->slave;
164 // If there's no bond for this port, or this is the last slave
165 if ((bond == NULL) || (slave->next == bond->first_slave)) {
166 return NULL;
169 return &(SLAVE_AD_INFO(slave->next).port);
173 * __get_first_agg - get the first aggregator in the bond
174 * @bond: the bond we're looking at
176 * Return the aggregator of the first slave in @bond, or %NULL if it can't be
177 * found.
179 static inline struct aggregator *__get_first_agg(struct port *port)
181 struct bonding *bond = __get_bond_by_port(port);
183 // If there's no bond for this port, or bond has no slaves
184 if ((bond == NULL) || (bond->slave_cnt == 0)) {
185 return NULL;
188 return &(SLAVE_AD_INFO(bond->first_slave).aggregator);
192 * __get_next_agg - get the next aggregator in the bond
193 * @aggregator: the aggregator we're looking at
195 * Return the aggregator of the slave that is next in line of @aggregator's
196 * slave in the bond, or %NULL if it can't be found.
198 static inline struct aggregator *__get_next_agg(struct aggregator *aggregator)
200 struct slave *slave = aggregator->slave;
201 struct bonding *bond = bond_get_bond_by_slave(slave);
203 // If there's no bond for this aggregator, or this is the last slave
204 if ((bond == NULL) || (slave->next == bond->first_slave)) {
205 return NULL;
208 return &(SLAVE_AD_INFO(slave->next).aggregator);
212 * __agg_has_partner
214 * Return nonzero if aggregator has a partner (denoted by a non-zero ether
215 * address for the partner). Return 0 if not.
217 static inline int __agg_has_partner(struct aggregator *agg)
219 return !is_zero_ether_addr(agg->partner_system.mac_addr_value);
223 * __disable_port - disable the port's slave
224 * @port: the port we're looking at
227 static inline void __disable_port(struct port *port)
229 bond_set_slave_inactive_flags(port->slave);
233 * __enable_port - enable the port's slave, if it's up
234 * @port: the port we're looking at
237 static inline void __enable_port(struct port *port)
239 struct slave *slave = port->slave;
241 if ((slave->link == BOND_LINK_UP) && IS_UP(slave->dev)) {
242 bond_set_slave_active_flags(slave);
247 * __port_is_enabled - check if the port's slave is in active state
248 * @port: the port we're looking at
251 static inline int __port_is_enabled(struct port *port)
253 return(port->slave->state == BOND_STATE_ACTIVE);
257 * __get_agg_selection_mode - get the aggregator selection mode
258 * @port: the port we're looking at
260 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT.
262 static inline u32 __get_agg_selection_mode(struct port *port)
264 struct bonding *bond = __get_bond_by_port(port);
266 if (bond == NULL) {
267 return BOND_AD_STABLE;
270 return BOND_AD_INFO(bond).agg_select_mode;
274 * __check_agg_selection_timer - check if the selection timer has expired
275 * @port: the port we're looking at
278 static inline int __check_agg_selection_timer(struct port *port)
280 struct bonding *bond = __get_bond_by_port(port);
282 if (bond == NULL) {
283 return 0;
286 return BOND_AD_INFO(bond).agg_select_timer ? 1 : 0;
290 * __get_rx_machine_lock - lock the port's RX machine
291 * @port: the port we're looking at
294 static inline void __get_rx_machine_lock(struct port *port)
296 spin_lock_bh(&(SLAVE_AD_INFO(port->slave).rx_machine_lock));
300 * __release_rx_machine_lock - unlock the port's RX machine
301 * @port: the port we're looking at
304 static inline void __release_rx_machine_lock(struct port *port)
306 spin_unlock_bh(&(SLAVE_AD_INFO(port->slave).rx_machine_lock));
310 * __get_link_speed - get a port's speed
311 * @port: the port we're looking at
313 * Return @port's speed in 802.3ad bitmask format. i.e. one of:
314 * 0,
315 * %AD_LINK_SPEED_BITMASK_10MBPS,
316 * %AD_LINK_SPEED_BITMASK_100MBPS,
317 * %AD_LINK_SPEED_BITMASK_1000MBPS,
318 * %AD_LINK_SPEED_BITMASK_10000MBPS
320 static u16 __get_link_speed(struct port *port)
322 struct slave *slave = port->slave;
323 u16 speed;
325 /* this if covers only a special case: when the configuration starts with
326 * link down, it sets the speed to 0.
327 * This is done in spite of the fact that the e100 driver reports 0 to be
328 * compatible with MVT in the future.*/
329 if (slave->link != BOND_LINK_UP) {
330 speed=0;
331 } else {
332 switch (slave->speed) {
333 case SPEED_10:
334 speed = AD_LINK_SPEED_BITMASK_10MBPS;
335 break;
337 case SPEED_100:
338 speed = AD_LINK_SPEED_BITMASK_100MBPS;
339 break;
341 case SPEED_1000:
342 speed = AD_LINK_SPEED_BITMASK_1000MBPS;
343 break;
345 case SPEED_10000:
346 speed = AD_LINK_SPEED_BITMASK_10000MBPS;
347 break;
349 default:
350 speed = 0; // unknown speed value from ethtool. shouldn't happen
351 break;
355 pr_debug("Port %d Received link speed %d update from adapter\n", port->actor_port_number, speed);
356 return speed;
360 * __get_duplex - get a port's duplex
361 * @port: the port we're looking at
363 * Return @port's duplex in 802.3ad bitmask format. i.e.:
364 * 0x01 if in full duplex
365 * 0x00 otherwise
367 static u8 __get_duplex(struct port *port)
369 struct slave *slave = port->slave;
371 u8 retval;
373 // handling a special case: when the configuration starts with
374 // link down, it sets the duplex to 0.
375 if (slave->link != BOND_LINK_UP) {
376 retval=0x0;
377 } else {
378 switch (slave->duplex) {
379 case DUPLEX_FULL:
380 retval=0x1;
381 pr_debug("Port %d Received status full duplex update from adapter\n", port->actor_port_number);
382 break;
383 case DUPLEX_HALF:
384 default:
385 retval=0x0;
386 pr_debug("Port %d Received status NOT full duplex update from adapter\n", port->actor_port_number);
387 break;
390 return retval;
394 * __initialize_port_locks - initialize a port's RX machine spinlock
395 * @port: the port we're looking at
398 static inline void __initialize_port_locks(struct port *port)
400 // make sure it isn't called twice
401 spin_lock_init(&(SLAVE_AD_INFO(port->slave).rx_machine_lock));
404 //conversions
407 * __ad_timer_to_ticks - convert a given timer type to AD module ticks
408 * @timer_type: which timer to operate
409 * @par: timer parameter. see below
411 * If @timer_type is %current_while_timer, @par indicates long/short timer.
412 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME,
413 * %SLOW_PERIODIC_TIME.
415 static u16 __ad_timer_to_ticks(u16 timer_type, u16 par)
417 u16 retval=0; //to silence the compiler
419 switch (timer_type) {
420 case AD_CURRENT_WHILE_TIMER: // for rx machine usage
421 if (par) { // for short or long timeout
422 retval = (AD_SHORT_TIMEOUT_TIME*ad_ticks_per_sec); // short timeout
423 } else {
424 retval = (AD_LONG_TIMEOUT_TIME*ad_ticks_per_sec); // long timeout
426 break;
427 case AD_ACTOR_CHURN_TIMER: // for local churn machine
428 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
429 break;
430 case AD_PERIODIC_TIMER: // for periodic machine
431 retval = (par*ad_ticks_per_sec); // long timeout
432 break;
433 case AD_PARTNER_CHURN_TIMER: // for remote churn machine
434 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
435 break;
436 case AD_WAIT_WHILE_TIMER: // for selection machine
437 retval = (AD_AGGREGATE_WAIT_TIME*ad_ticks_per_sec);
438 break;
440 return retval;
444 /////////////////////////////////////////////////////////////////////////////////
445 // ================= ad_rx_machine helper functions ==================
446 /////////////////////////////////////////////////////////////////////////////////
449 * __record_pdu - record parameters from a received lacpdu
450 * @lacpdu: the lacpdu we've received
451 * @port: the port we're looking at
453 * Record the parameter values for the Actor carried in a received lacpdu as
454 * the current partner operational parameter values and sets
455 * actor_oper_port_state.defaulted to FALSE.
457 static void __record_pdu(struct lacpdu *lacpdu, struct port *port)
459 if (lacpdu && port) {
460 struct port_params *partner = &port->partner_oper;
462 // record the new parameter values for the partner operational
463 partner->port_number = ntohs(lacpdu->actor_port);
464 partner->port_priority = ntohs(lacpdu->actor_port_priority);
465 partner->system = lacpdu->actor_system;
466 partner->system_priority = ntohs(lacpdu->actor_system_priority);
467 partner->key = ntohs(lacpdu->actor_key);
468 partner->port_state = lacpdu->actor_state;
470 // set actor_oper_port_state.defaulted to FALSE
471 port->actor_oper_port_state &= ~AD_STATE_DEFAULTED;
473 // set the partner sync. to on if the partner is sync. and the port is matched
474 if ((port->sm_vars & AD_PORT_MATCHED) && (lacpdu->actor_state & AD_STATE_SYNCHRONIZATION)) {
475 partner->port_state |= AD_STATE_SYNCHRONIZATION;
476 } else {
477 partner->port_state &= ~AD_STATE_SYNCHRONIZATION;
483 * __record_default - record default parameters
484 * @port: the port we're looking at
486 * This function records the default parameter values for the partner carried
487 * in the Partner Admin parameters as the current partner operational parameter
488 * values and sets actor_oper_port_state.defaulted to TRUE.
490 static void __record_default(struct port *port)
492 if (port) {
493 // record the partner admin parameters
494 memcpy(&port->partner_oper, &port->partner_admin,
495 sizeof(struct port_params));
497 // set actor_oper_port_state.defaulted to true
498 port->actor_oper_port_state |= AD_STATE_DEFAULTED;
503 * __update_selected - update a port's Selected variable from a received lacpdu
504 * @lacpdu: the lacpdu we've received
505 * @port: the port we're looking at
507 * Update the value of the selected variable, using parameter values from a
508 * newly received lacpdu. The parameter values for the Actor carried in the
509 * received PDU are compared with the corresponding operational parameter
510 * values for the ports partner. If one or more of the comparisons shows that
511 * the value(s) received in the PDU differ from the current operational values,
512 * then selected is set to FALSE and actor_oper_port_state.synchronization is
513 * set to out_of_sync. Otherwise, selected remains unchanged.
515 static void __update_selected(struct lacpdu *lacpdu, struct port *port)
517 if (lacpdu && port) {
518 const struct port_params *partner = &port->partner_oper;
520 // check if any parameter is different
521 if (ntohs(lacpdu->actor_port) != partner->port_number
522 || ntohs(lacpdu->actor_port_priority) != partner->port_priority
523 || MAC_ADDRESS_COMPARE(&lacpdu->actor_system, &partner->system)
524 || ntohs(lacpdu->actor_system_priority) != partner->system_priority
525 || ntohs(lacpdu->actor_key) != partner->key
526 || (lacpdu->actor_state & AD_STATE_AGGREGATION) != (partner->port_state & AD_STATE_AGGREGATION)) {
527 // update the state machine Selected variable
528 port->sm_vars &= ~AD_PORT_SELECTED;
534 * __update_default_selected - update a port's Selected variable from Partner
535 * @port: the port we're looking at
537 * This function updates the value of the selected variable, using the partner
538 * administrative parameter values. The administrative values are compared with
539 * the corresponding operational parameter values for the partner. If one or
540 * more of the comparisons shows that the administrative value(s) differ from
541 * the current operational values, then Selected is set to FALSE and
542 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise,
543 * Selected remains unchanged.
545 static void __update_default_selected(struct port *port)
547 if (port) {
548 const struct port_params *admin = &port->partner_admin;
549 const struct port_params *oper = &port->partner_oper;
551 // check if any parameter is different
552 if (admin->port_number != oper->port_number
553 || admin->port_priority != oper->port_priority
554 || MAC_ADDRESS_COMPARE(&admin->system, &oper->system)
555 || admin->system_priority != oper->system_priority
556 || admin->key != oper->key
557 || (admin->port_state & AD_STATE_AGGREGATION)
558 != (oper->port_state & AD_STATE_AGGREGATION)) {
559 // update the state machine Selected variable
560 port->sm_vars &= ~AD_PORT_SELECTED;
566 * __choose_matched - update a port's matched variable from a received lacpdu
567 * @lacpdu: the lacpdu we've received
568 * @port: the port we're looking at
570 * Update the value of the matched variable, using parameter values from a
571 * newly received lacpdu. Parameter values for the partner carried in the
572 * received PDU are compared with the corresponding operational parameter
573 * values for the actor. Matched is set to TRUE if all of these parameters
574 * match and the PDU parameter partner_state.aggregation has the same value as
575 * actor_oper_port_state.aggregation and lacp will actively maintain the link
576 * in the aggregation. Matched is also set to TRUE if the value of
577 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates
578 * an individual link and lacp will actively maintain the link. Otherwise,
579 * matched is set to FALSE. LACP is considered to be actively maintaining the
580 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both
581 * the actor's actor_oper_port_state.lacp_activity and the PDU's
582 * partner_state.lacp_activity variables are TRUE.
584 static void __choose_matched(struct lacpdu *lacpdu, struct port *port)
586 // validate lacpdu and port
587 if (lacpdu && port) {
588 // check if all parameters are alike
589 if (((ntohs(lacpdu->partner_port) == port->actor_port_number) &&
590 (ntohs(lacpdu->partner_port_priority) == port->actor_port_priority) &&
591 !MAC_ADDRESS_COMPARE(&(lacpdu->partner_system), &(port->actor_system)) &&
592 (ntohs(lacpdu->partner_system_priority) == port->actor_system_priority) &&
593 (ntohs(lacpdu->partner_key) == port->actor_oper_port_key) &&
594 ((lacpdu->partner_state & AD_STATE_AGGREGATION) == (port->actor_oper_port_state & AD_STATE_AGGREGATION))) ||
595 // or this is individual link(aggregation == FALSE)
596 ((lacpdu->actor_state & AD_STATE_AGGREGATION) == 0)
598 // update the state machine Matched variable
599 port->sm_vars |= AD_PORT_MATCHED;
600 } else {
601 port->sm_vars &= ~AD_PORT_MATCHED;
607 * __update_ntt - update a port's ntt variable from a received lacpdu
608 * @lacpdu: the lacpdu we've received
609 * @port: the port we're looking at
611 * Updates the value of the ntt variable, using parameter values from a newly
612 * received lacpdu. The parameter values for the partner carried in the
613 * received PDU are compared with the corresponding operational parameter
614 * values for the Actor. If one or more of the comparisons shows that the
615 * value(s) received in the PDU differ from the current operational values,
616 * then ntt is set to TRUE. Otherwise, ntt remains unchanged.
618 static void __update_ntt(struct lacpdu *lacpdu, struct port *port)
620 // validate lacpdu and port
621 if (lacpdu && port) {
622 // check if any parameter is different
623 if ((ntohs(lacpdu->partner_port) != port->actor_port_number) ||
624 (ntohs(lacpdu->partner_port_priority) != port->actor_port_priority) ||
625 MAC_ADDRESS_COMPARE(&(lacpdu->partner_system), &(port->actor_system)) ||
626 (ntohs(lacpdu->partner_system_priority) != port->actor_system_priority) ||
627 (ntohs(lacpdu->partner_key) != port->actor_oper_port_key) ||
628 ((lacpdu->partner_state & AD_STATE_LACP_ACTIVITY) != (port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY)) ||
629 ((lacpdu->partner_state & AD_STATE_LACP_TIMEOUT) != (port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT)) ||
630 ((lacpdu->partner_state & AD_STATE_SYNCHRONIZATION) != (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) ||
631 ((lacpdu->partner_state & AD_STATE_AGGREGATION) != (port->actor_oper_port_state & AD_STATE_AGGREGATION))
634 port->ntt = true;
/**
 * __attach_bond_to_agg
 * @port: the port we're looking at
 *
 * Handle the attaching of the port's control parser/multiplexer and the
 * aggregator. This function does nothing, since the parser/multiplexer of the
 * receive and the parser/multiplexer of the aggregator are already combined.
 */
static void __attach_bond_to_agg(struct port *port)
{
	/* the parameter is intentionally unused; this only keeps the compiler quiet */
	(void)port;
}
/**
 * __detach_bond_from_agg
 * @port: the port we're looking at
 *
 * Handle the detaching of the port's control parser/multiplexer from the
 * aggregator. This function does nothing, since the parser/multiplexer of the
 * receive and the parser/multiplexer of the aggregator are already combined.
 */
static void __detach_bond_from_agg(struct port *port)
{
	/* the parameter is intentionally unused; this only keeps the compiler quiet */
	(void)port;
}
670 * __agg_ports_are_ready - check if all ports in an aggregator are ready
671 * @aggregator: the aggregator we're looking at
674 static int __agg_ports_are_ready(struct aggregator *aggregator)
676 struct port *port;
677 int retval = 1;
679 if (aggregator) {
680 // scan all ports in this aggregator to verfy if they are all ready
681 for (port=aggregator->lag_ports; port; port=port->next_port_in_aggregator) {
682 if (!(port->sm_vars & AD_PORT_READY_N)) {
683 retval = 0;
684 break;
689 return retval;
693 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator
694 * @aggregator: the aggregator we're looking at
695 * @val: Should the ports' ready bit be set on or off
698 static void __set_agg_ports_ready(struct aggregator *aggregator, int val)
700 struct port *port;
702 for (port=aggregator->lag_ports; port; port=port->next_port_in_aggregator) {
703 if (val) {
704 port->sm_vars |= AD_PORT_READY;
705 } else {
706 port->sm_vars &= ~AD_PORT_READY;
712 * __get_agg_bandwidth - get the total bandwidth of an aggregator
713 * @aggregator: the aggregator we're looking at
716 static u32 __get_agg_bandwidth(struct aggregator *aggregator)
718 u32 bandwidth=0;
719 u32 basic_speed;
721 if (aggregator->num_of_ports) {
722 basic_speed = __get_link_speed(aggregator->lag_ports);
723 switch (basic_speed) {
724 case AD_LINK_SPEED_BITMASK_1MBPS:
725 bandwidth = aggregator->num_of_ports;
726 break;
727 case AD_LINK_SPEED_BITMASK_10MBPS:
728 bandwidth = aggregator->num_of_ports * 10;
729 break;
730 case AD_LINK_SPEED_BITMASK_100MBPS:
731 bandwidth = aggregator->num_of_ports * 100;
732 break;
733 case AD_LINK_SPEED_BITMASK_1000MBPS:
734 bandwidth = aggregator->num_of_ports * 1000;
735 break;
736 case AD_LINK_SPEED_BITMASK_10000MBPS:
737 bandwidth = aggregator->num_of_ports * 10000;
738 break;
739 default:
740 bandwidth=0; // to silent the compilor ....
743 return bandwidth;
747 * __get_active_agg - get the current active aggregator
748 * @aggregator: the aggregator we're looking at
751 static struct aggregator *__get_active_agg(struct aggregator *aggregator)
753 struct aggregator *retval = NULL;
755 for (; aggregator; aggregator = __get_next_agg(aggregator)) {
756 if (aggregator->is_active) {
757 retval = aggregator;
758 break;
762 return retval;
766 * __update_lacpdu_from_port - update a port's lacpdu fields
767 * @port: the port we're looking at
770 static inline void __update_lacpdu_from_port(struct port *port)
772 struct lacpdu *lacpdu = &port->lacpdu;
773 const struct port_params *partner = &port->partner_oper;
775 /* update current actual Actor parameters */
776 /* lacpdu->subtype initialized
777 * lacpdu->version_number initialized
778 * lacpdu->tlv_type_actor_info initialized
779 * lacpdu->actor_information_length initialized
782 lacpdu->actor_system_priority = htons(port->actor_system_priority);
783 lacpdu->actor_system = port->actor_system;
784 lacpdu->actor_key = htons(port->actor_oper_port_key);
785 lacpdu->actor_port_priority = htons(port->actor_port_priority);
786 lacpdu->actor_port = htons(port->actor_port_number);
787 lacpdu->actor_state = port->actor_oper_port_state;
789 /* lacpdu->reserved_3_1 initialized
790 * lacpdu->tlv_type_partner_info initialized
791 * lacpdu->partner_information_length initialized
794 lacpdu->partner_system_priority = htons(partner->system_priority);
795 lacpdu->partner_system = partner->system;
796 lacpdu->partner_key = htons(partner->key);
797 lacpdu->partner_port_priority = htons(partner->port_priority);
798 lacpdu->partner_port = htons(partner->port_number);
799 lacpdu->partner_state = partner->port_state;
801 /* lacpdu->reserved_3_2 initialized
802 * lacpdu->tlv_type_collector_info initialized
803 * lacpdu->collector_information_length initialized
804 * collector_max_delay initialized
805 * reserved_12[12] initialized
806 * tlv_type_terminator initialized
807 * terminator_length initialized
808 * reserved_50[50] initialized
812 //////////////////////////////////////////////////////////////////////////////////////
813 // ================= main 802.3ad protocol code ======================================
814 //////////////////////////////////////////////////////////////////////////////////////
817 * ad_lacpdu_send - send out a lacpdu packet on a given port
818 * @port: the port we're looking at
820 * Returns: 0 on success
821 * < 0 on error
823 static int ad_lacpdu_send(struct port *port)
825 struct slave *slave = port->slave;
826 struct sk_buff *skb;
827 struct lacpdu_header *lacpdu_header;
828 int length = sizeof(struct lacpdu_header);
830 skb = dev_alloc_skb(length);
831 if (!skb) {
832 return -ENOMEM;
835 skb->dev = slave->dev;
836 skb_reset_mac_header(skb);
837 skb->network_header = skb->mac_header + ETH_HLEN;
838 skb->protocol = PKT_TYPE_LACPDU;
839 skb->priority = TC_PRIO_CONTROL;
841 lacpdu_header = (struct lacpdu_header *)skb_put(skb, length);
843 memcpy(lacpdu_header->hdr.h_dest, lacpdu_mcast_addr, ETH_ALEN);
844 /* Note: source addres is set to be the member's PERMANENT address,
845 because we use it to identify loopback lacpdus in receive. */
846 memcpy(lacpdu_header->hdr.h_source, slave->perm_hwaddr, ETH_ALEN);
847 lacpdu_header->hdr.h_proto = PKT_TYPE_LACPDU;
849 lacpdu_header->lacpdu = port->lacpdu; // struct copy
851 dev_queue_xmit(skb);
853 return 0;
857 * ad_marker_send - send marker information/response on a given port
858 * @port: the port we're looking at
859 * @marker: marker data to send
861 * Returns: 0 on success
862 * < 0 on error
864 static int ad_marker_send(struct port *port, struct bond_marker *marker)
866 struct slave *slave = port->slave;
867 struct sk_buff *skb;
868 struct bond_marker_header *marker_header;
869 int length = sizeof(struct bond_marker_header);
871 skb = dev_alloc_skb(length + 16);
872 if (!skb) {
873 return -ENOMEM;
876 skb_reserve(skb, 16);
878 skb->dev = slave->dev;
879 skb_reset_mac_header(skb);
880 skb->network_header = skb->mac_header + ETH_HLEN;
881 skb->protocol = PKT_TYPE_LACPDU;
883 marker_header = (struct bond_marker_header *)skb_put(skb, length);
885 memcpy(marker_header->hdr.h_dest, lacpdu_mcast_addr, ETH_ALEN);
886 /* Note: source addres is set to be the member's PERMANENT address,
887 because we use it to identify loopback MARKERs in receive. */
888 memcpy(marker_header->hdr.h_source, slave->perm_hwaddr, ETH_ALEN);
889 marker_header->hdr.h_proto = PKT_TYPE_LACPDU;
891 marker_header->marker = *marker; // struct copy
893 dev_queue_xmit(skb);
895 return 0;
899 * ad_mux_machine - handle a port's mux state machine
900 * @port: the port we're looking at
903 static void ad_mux_machine(struct port *port)
905 mux_states_t last_state;
907 // keep current State Machine state to compare later if it was changed
908 last_state = port->sm_mux_state;
910 if (port->sm_vars & AD_PORT_BEGIN) {
911 port->sm_mux_state = AD_MUX_DETACHED; // next state
912 } else {
913 switch (port->sm_mux_state) {
914 case AD_MUX_DETACHED:
915 if ((port->sm_vars & AD_PORT_SELECTED) || (port->sm_vars & AD_PORT_STANDBY)) { // if SELECTED or STANDBY
916 port->sm_mux_state = AD_MUX_WAITING; // next state
918 break;
919 case AD_MUX_WAITING:
920 // if SELECTED == FALSE return to DETACH state
921 if (!(port->sm_vars & AD_PORT_SELECTED)) { // if UNSELECTED
922 port->sm_vars &= ~AD_PORT_READY_N;
923 // in order to withhold the Selection Logic to check all ports READY_N value
924 // every callback cycle to update ready variable, we check READY_N and update READY here
925 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
926 port->sm_mux_state = AD_MUX_DETACHED; // next state
927 break;
930 // check if the wait_while_timer expired
931 if (port->sm_mux_timer_counter && !(--port->sm_mux_timer_counter)) {
932 port->sm_vars |= AD_PORT_READY_N;
935 // in order to withhold the selection logic to check all ports READY_N value
936 // every callback cycle to update ready variable, we check READY_N and update READY here
937 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
939 // if the wait_while_timer expired, and the port is in READY state, move to ATTACHED state
940 if ((port->sm_vars & AD_PORT_READY) && !port->sm_mux_timer_counter) {
941 port->sm_mux_state = AD_MUX_ATTACHED; // next state
943 break;
944 case AD_MUX_ATTACHED:
945 // check also if agg_select_timer expired(so the edable port will take place only after this timer)
946 if ((port->sm_vars & AD_PORT_SELECTED) && (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) && !__check_agg_selection_timer(port)) {
947 port->sm_mux_state = AD_MUX_COLLECTING_DISTRIBUTING;// next state
948 } else if (!(port->sm_vars & AD_PORT_SELECTED) || (port->sm_vars & AD_PORT_STANDBY)) { // if UNSELECTED or STANDBY
949 port->sm_vars &= ~AD_PORT_READY_N;
950 // in order to withhold the selection logic to check all ports READY_N value
951 // every callback cycle to update ready variable, we check READY_N and update READY here
952 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
953 port->sm_mux_state = AD_MUX_DETACHED;// next state
955 break;
956 case AD_MUX_COLLECTING_DISTRIBUTING:
957 if (!(port->sm_vars & AD_PORT_SELECTED) || (port->sm_vars & AD_PORT_STANDBY) ||
958 !(port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION)
960 port->sm_mux_state = AD_MUX_ATTACHED;// next state
962 } else {
963 // if port state hasn't changed make
964 // sure that a collecting distributing
965 // port in an active aggregator is enabled
966 if (port->aggregator &&
967 port->aggregator->is_active &&
968 !__port_is_enabled(port)) {
970 __enable_port(port);
973 break;
974 default: //to silence the compiler
975 break;
979 // check if the state machine was changed
980 if (port->sm_mux_state != last_state) {
981 pr_debug("Mux Machine: Port=%d, Last State=%d, Curr State=%d\n", port->actor_port_number, last_state, port->sm_mux_state);
982 switch (port->sm_mux_state) {
983 case AD_MUX_DETACHED:
984 __detach_bond_from_agg(port);
985 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
986 ad_disable_collecting_distributing(port);
987 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
988 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
989 port->ntt = true;
990 break;
991 case AD_MUX_WAITING:
992 port->sm_mux_timer_counter = __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER, 0);
993 break;
994 case AD_MUX_ATTACHED:
995 __attach_bond_to_agg(port);
996 port->actor_oper_port_state |= AD_STATE_SYNCHRONIZATION;
997 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
998 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
999 ad_disable_collecting_distributing(port);
1000 port->ntt = true;
1001 break;
1002 case AD_MUX_COLLECTING_DISTRIBUTING:
1003 port->actor_oper_port_state |= AD_STATE_COLLECTING;
1004 port->actor_oper_port_state |= AD_STATE_DISTRIBUTING;
1005 ad_enable_collecting_distributing(port);
1006 port->ntt = true;
1007 break;
1008 default: //to silence the compiler
1009 break;
1015 * ad_rx_machine - handle a port's rx State Machine
1016 * @lacpdu: the lacpdu we've received
1017 * @port: the port we're looking at
1019 * If lacpdu arrived, stop previous timer (if exists) and set the next state as
1020 * CURRENT. If timer expired set the state machine in the proper state.
1021 * In other cases, this function checks if we need to switch to other state.
1023 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port)
1025 rx_states_t last_state;
1027 // Lock to prevent 2 instances of this function to run simultaneously(rx interrupt and periodic machine callback)
1028 __get_rx_machine_lock(port);
1030 // keep current State Machine state to compare later if it was changed
1031 last_state = port->sm_rx_state;
1033 // check if state machine should change state
1034 // first, check if port was reinitialized
1035 if (port->sm_vars & AD_PORT_BEGIN) {
1036 port->sm_rx_state = AD_RX_INITIALIZE; // next state
1038 // check if port is not enabled
1039 else if (!(port->sm_vars & AD_PORT_BEGIN) && !port->is_enabled && !(port->sm_vars & AD_PORT_MOVED)) {
1040 port->sm_rx_state = AD_RX_PORT_DISABLED; // next state
1042 // check if new lacpdu arrived
1043 else if (lacpdu && ((port->sm_rx_state == AD_RX_EXPIRED) || (port->sm_rx_state == AD_RX_DEFAULTED) || (port->sm_rx_state == AD_RX_CURRENT))) {
1044 port->sm_rx_timer_counter = 0; // zero timer
1045 port->sm_rx_state = AD_RX_CURRENT;
1046 } else {
1047 // if timer is on, and if it is expired
1048 if (port->sm_rx_timer_counter && !(--port->sm_rx_timer_counter)) {
1049 switch (port->sm_rx_state) {
1050 case AD_RX_EXPIRED:
1051 port->sm_rx_state = AD_RX_DEFAULTED; // next state
1052 break;
1053 case AD_RX_CURRENT:
1054 port->sm_rx_state = AD_RX_EXPIRED; // next state
1055 break;
1056 default: //to silence the compiler
1057 break;
1059 } else {
1060 // if no lacpdu arrived and no timer is on
1061 switch (port->sm_rx_state) {
1062 case AD_RX_PORT_DISABLED:
1063 if (port->sm_vars & AD_PORT_MOVED) {
1064 port->sm_rx_state = AD_RX_INITIALIZE; // next state
1065 } else if (port->is_enabled && (port->sm_vars & AD_PORT_LACP_ENABLED)) {
1066 port->sm_rx_state = AD_RX_EXPIRED; // next state
1067 } else if (port->is_enabled && ((port->sm_vars & AD_PORT_LACP_ENABLED) == 0)) {
1068 port->sm_rx_state = AD_RX_LACP_DISABLED; // next state
1070 break;
1071 default: //to silence the compiler
1072 break;
1078 // check if the State machine was changed or new lacpdu arrived
1079 if ((port->sm_rx_state != last_state) || (lacpdu)) {
1080 pr_debug("Rx Machine: Port=%d, Last State=%d, Curr State=%d\n", port->actor_port_number, last_state, port->sm_rx_state);
1081 switch (port->sm_rx_state) {
1082 case AD_RX_INITIALIZE:
1083 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_BITS)) {
1084 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1085 } else {
1086 port->sm_vars |= AD_PORT_LACP_ENABLED;
1088 port->sm_vars &= ~AD_PORT_SELECTED;
1089 __record_default(port);
1090 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1091 port->sm_vars &= ~AD_PORT_MOVED;
1092 port->sm_rx_state = AD_RX_PORT_DISABLED; // next state
1094 /*- Fall Through -*/
1096 case AD_RX_PORT_DISABLED:
1097 port->sm_vars &= ~AD_PORT_MATCHED;
1098 break;
1099 case AD_RX_LACP_DISABLED:
1100 port->sm_vars &= ~AD_PORT_SELECTED;
1101 __record_default(port);
1102 port->partner_oper.port_state &= ~AD_STATE_AGGREGATION;
1103 port->sm_vars |= AD_PORT_MATCHED;
1104 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1105 break;
1106 case AD_RX_EXPIRED:
1107 //Reset of the Synchronization flag. (Standard 43.4.12)
1108 //This reset cause to disable this port in the COLLECTING_DISTRIBUTING state of the
1109 //mux machine in case of EXPIRED even if LINK_DOWN didn't arrive for the port.
1110 port->partner_oper.port_state &= ~AD_STATE_SYNCHRONIZATION;
1111 port->sm_vars &= ~AD_PORT_MATCHED;
1112 port->partner_oper.port_state |=
1113 AD_STATE_LACP_ACTIVITY;
1114 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT));
1115 port->actor_oper_port_state |= AD_STATE_EXPIRED;
1116 break;
1117 case AD_RX_DEFAULTED:
1118 __update_default_selected(port);
1119 __record_default(port);
1120 port->sm_vars |= AD_PORT_MATCHED;
1121 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1122 break;
1123 case AD_RX_CURRENT:
1124 // detect loopback situation
1125 if (!MAC_ADDRESS_COMPARE(&(lacpdu->actor_system), &(port->actor_system))) {
1126 // INFO_RECEIVED_LOOPBACK_FRAMES
1127 pr_err(DRV_NAME ": %s: An illegal loopback occurred on "
1128 "adapter (%s). Check the configuration to verify that all "
1129 "Adapters are connected to 802.3ad compliant switch ports\n",
1130 port->slave->dev->master->name, port->slave->dev->name);
1131 __release_rx_machine_lock(port);
1132 return;
1134 __update_selected(lacpdu, port);
1135 __update_ntt(lacpdu, port);
1136 __record_pdu(lacpdu, port);
1137 __choose_matched(lacpdu, port);
1138 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT));
1139 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1140 // verify that if the aggregator is enabled, the port is enabled too.
1141 //(because if the link goes down for a short time, the 802.3ad will not
1142 // catch it, and the port will continue to be disabled)
1143 if (port->aggregator && port->aggregator->is_active && !__port_is_enabled(port)) {
1144 __enable_port(port);
1146 break;
1147 default: //to silence the compiler
1148 break;
1151 __release_rx_machine_lock(port);
1155 * ad_tx_machine - handle a port's tx state machine
1156 * @port: the port we're looking at
1159 static void ad_tx_machine(struct port *port)
1161 // check if tx timer expired, to verify that we do not send more than 3 packets per second
1162 if (port->sm_tx_timer_counter && !(--port->sm_tx_timer_counter)) {
1163 // check if there is something to send
1164 if (port->ntt && (port->sm_vars & AD_PORT_LACP_ENABLED)) {
1165 __update_lacpdu_from_port(port);
1167 if (ad_lacpdu_send(port) >= 0) {
1168 pr_debug("Sent LACPDU on port %d\n", port->actor_port_number);
1170 /* mark ntt as false, so it will not be sent again until
1171 demanded */
1172 port->ntt = false;
1175 // restart tx timer(to verify that we will not exceed AD_MAX_TX_IN_SECOND
1176 port->sm_tx_timer_counter=ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1181 * ad_periodic_machine - handle a port's periodic state machine
1182 * @port: the port we're looking at
1184 * Turn ntt flag on priodically to perform periodic transmission of lacpdu's.
1186 static void ad_periodic_machine(struct port *port)
1188 periodic_states_t last_state;
1190 // keep current state machine state to compare later if it was changed
1191 last_state = port->sm_periodic_state;
1193 // check if port was reinitialized
1194 if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) ||
1195 (!(port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & AD_STATE_LACP_ACTIVITY))
1197 port->sm_periodic_state = AD_NO_PERIODIC; // next state
1199 // check if state machine should change state
1200 else if (port->sm_periodic_timer_counter) {
1201 // check if periodic state machine expired
1202 if (!(--port->sm_periodic_timer_counter)) {
1203 // if expired then do tx
1204 port->sm_periodic_state = AD_PERIODIC_TX; // next state
1205 } else {
1206 // If not expired, check if there is some new timeout parameter from the partner state
1207 switch (port->sm_periodic_state) {
1208 case AD_FAST_PERIODIC:
1209 if (!(port->partner_oper.port_state & AD_STATE_LACP_TIMEOUT)) {
1210 port->sm_periodic_state = AD_SLOW_PERIODIC; // next state
1212 break;
1213 case AD_SLOW_PERIODIC:
1214 if ((port->partner_oper.port_state & AD_STATE_LACP_TIMEOUT)) {
1215 // stop current timer
1216 port->sm_periodic_timer_counter = 0;
1217 port->sm_periodic_state = AD_PERIODIC_TX; // next state
1219 break;
1220 default: //to silence the compiler
1221 break;
1224 } else {
1225 switch (port->sm_periodic_state) {
1226 case AD_NO_PERIODIC:
1227 port->sm_periodic_state = AD_FAST_PERIODIC; // next state
1228 break;
1229 case AD_PERIODIC_TX:
1230 if (!(port->partner_oper.port_state & AD_STATE_LACP_TIMEOUT)) {
1231 port->sm_periodic_state = AD_SLOW_PERIODIC; // next state
1232 } else {
1233 port->sm_periodic_state = AD_FAST_PERIODIC; // next state
1235 break;
1236 default: //to silence the compiler
1237 break;
1241 // check if the state machine was changed
1242 if (port->sm_periodic_state != last_state) {
1243 pr_debug("Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n", port->actor_port_number, last_state, port->sm_periodic_state);
1244 switch (port->sm_periodic_state) {
1245 case AD_NO_PERIODIC:
1246 port->sm_periodic_timer_counter = 0; // zero timer
1247 break;
1248 case AD_FAST_PERIODIC:
1249 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_FAST_PERIODIC_TIME))-1; // decrement 1 tick we lost in the PERIODIC_TX cycle
1250 break;
1251 case AD_SLOW_PERIODIC:
1252 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_SLOW_PERIODIC_TIME))-1; // decrement 1 tick we lost in the PERIODIC_TX cycle
1253 break;
1254 case AD_PERIODIC_TX:
1255 port->ntt = true;
1256 break;
1257 default: //to silence the compiler
1258 break;
1264 * ad_port_selection_logic - select aggregation groups
1265 * @port: the port we're looking at
1267 * Select aggregation groups, and assign each port for it's aggregetor. The
1268 * selection logic is called in the inititalization (after all the handshkes),
1269 * and after every lacpdu receive (if selected is off).
1271 static void ad_port_selection_logic(struct port *port)
1273 struct aggregator *aggregator, *free_aggregator = NULL, *temp_aggregator;
1274 struct port *last_port = NULL, *curr_port;
1275 int found = 0;
1277 // if the port is already Selected, do nothing
1278 if (port->sm_vars & AD_PORT_SELECTED) {
1279 return;
1282 // if the port is connected to other aggregator, detach it
1283 if (port->aggregator) {
1284 // detach the port from its former aggregator
1285 temp_aggregator=port->aggregator;
1286 for (curr_port=temp_aggregator->lag_ports; curr_port; last_port=curr_port, curr_port=curr_port->next_port_in_aggregator) {
1287 if (curr_port == port) {
1288 temp_aggregator->num_of_ports--;
1289 if (!last_port) {// if it is the first port attached to the aggregator
1290 temp_aggregator->lag_ports=port->next_port_in_aggregator;
1291 } else {// not the first port attached to the aggregator
1292 last_port->next_port_in_aggregator=port->next_port_in_aggregator;
1295 // clear the port's relations to this aggregator
1296 port->aggregator = NULL;
1297 port->next_port_in_aggregator=NULL;
1298 port->actor_port_aggregator_identifier=0;
1300 pr_debug("Port %d left LAG %d\n", port->actor_port_number, temp_aggregator->aggregator_identifier);
1301 // if the aggregator is empty, clear its parameters, and set it ready to be attached
1302 if (!temp_aggregator->lag_ports) {
1303 ad_clear_agg(temp_aggregator);
1305 break;
1308 if (!curr_port) { // meaning: the port was related to an aggregator but was not on the aggregator port list
1309 pr_warning(DRV_NAME ": %s: Warning: Port %d (on %s) "
1310 "was related to aggregator %d but was not "
1311 "on its port list\n",
1312 port->slave->dev->master->name,
1313 port->actor_port_number,
1314 port->slave->dev->name,
1315 port->aggregator->aggregator_identifier);
1318 // search on all aggregators for a suitable aggregator for this port
1319 for (aggregator = __get_first_agg(port); aggregator;
1320 aggregator = __get_next_agg(aggregator)) {
1322 // keep a free aggregator for later use(if needed)
1323 if (!aggregator->lag_ports) {
1324 if (!free_aggregator) {
1325 free_aggregator=aggregator;
1327 continue;
1329 // check if current aggregator suits us
1330 if (((aggregator->actor_oper_aggregator_key == port->actor_oper_port_key) && // if all parameters match AND
1331 !MAC_ADDRESS_COMPARE(&(aggregator->partner_system), &(port->partner_oper.system)) &&
1332 (aggregator->partner_system_priority == port->partner_oper.system_priority) &&
1333 (aggregator->partner_oper_aggregator_key == port->partner_oper.key)
1334 ) &&
1335 ((MAC_ADDRESS_COMPARE(&(port->partner_oper.system), &(null_mac_addr)) && // partner answers
1336 !aggregator->is_individual) // but is not individual OR
1339 // attach to the founded aggregator
1340 port->aggregator = aggregator;
1341 port->actor_port_aggregator_identifier=port->aggregator->aggregator_identifier;
1342 port->next_port_in_aggregator=aggregator->lag_ports;
1343 port->aggregator->num_of_ports++;
1344 aggregator->lag_ports=port;
1345 pr_debug("Port %d joined LAG %d(existing LAG)\n", port->actor_port_number, port->aggregator->aggregator_identifier);
1347 // mark this port as selected
1348 port->sm_vars |= AD_PORT_SELECTED;
1349 found = 1;
1350 break;
1354 // the port couldn't find an aggregator - attach it to a new aggregator
1355 if (!found) {
1356 if (free_aggregator) {
1357 // assign port a new aggregator
1358 port->aggregator = free_aggregator;
1359 port->actor_port_aggregator_identifier=port->aggregator->aggregator_identifier;
1361 // update the new aggregator's parameters
1362 // if port was responsed from the end-user
1363 if (port->actor_oper_port_key & AD_DUPLEX_KEY_BITS) {// if port is full duplex
1364 port->aggregator->is_individual = false;
1365 } else {
1366 port->aggregator->is_individual = true;
1369 port->aggregator->actor_admin_aggregator_key = port->actor_admin_port_key;
1370 port->aggregator->actor_oper_aggregator_key = port->actor_oper_port_key;
1371 port->aggregator->partner_system=port->partner_oper.system;
1372 port->aggregator->partner_system_priority = port->partner_oper.system_priority;
1373 port->aggregator->partner_oper_aggregator_key = port->partner_oper.key;
1374 port->aggregator->receive_state = 1;
1375 port->aggregator->transmit_state = 1;
1376 port->aggregator->lag_ports = port;
1377 port->aggregator->num_of_ports++;
1379 // mark this port as selected
1380 port->sm_vars |= AD_PORT_SELECTED;
1382 pr_debug("Port %d joined LAG %d(new LAG)\n", port->actor_port_number, port->aggregator->aggregator_identifier);
1383 } else {
1384 pr_err(DRV_NAME ": %s: Port %d (on %s) did not find "
1385 "a suitable aggregator\n",
1386 port->slave->dev->master->name,
1387 port->actor_port_number, port->slave->dev->name);
1390 // if all aggregator's ports are READY_N == TRUE, set ready=TRUE in all aggregator's ports
1391 // else set ready=FALSE in all aggregator's ports
1392 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
1394 aggregator = __get_first_agg(port);
1395 ad_agg_selection_logic(aggregator);
1399 * Decide if "agg" is a better choice for the new active aggregator that
1400 * the current best, according to the ad_select policy.
1402 static struct aggregator *ad_agg_selection_test(struct aggregator *best,
1403 struct aggregator *curr)
1406 * 0. If no best, select current.
1408 * 1. If the current agg is not individual, and the best is
1409 * individual, select current.
1411 * 2. If current agg is individual and the best is not, keep best.
1413 * 3. Therefore, current and best are both individual or both not
1414 * individual, so:
1416 * 3a. If current agg partner replied, and best agg partner did not,
1417 * select current.
1419 * 3b. If current agg partner did not reply and best agg partner
1420 * did reply, keep best.
1422 * 4. Therefore, current and best both have partner replies or
1423 * both do not, so perform selection policy:
1425 * BOND_AD_COUNT: Select by count of ports. If count is equal,
1426 * select by bandwidth.
1428 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth.
1430 if (!best)
1431 return curr;
1433 if (!curr->is_individual && best->is_individual)
1434 return curr;
1436 if (curr->is_individual && !best->is_individual)
1437 return best;
1439 if (__agg_has_partner(curr) && !__agg_has_partner(best))
1440 return curr;
1442 if (!__agg_has_partner(curr) && __agg_has_partner(best))
1443 return best;
1445 switch (__get_agg_selection_mode(curr->lag_ports)) {
1446 case BOND_AD_COUNT:
1447 if (curr->num_of_ports > best->num_of_ports)
1448 return curr;
1450 if (curr->num_of_ports < best->num_of_ports)
1451 return best;
1453 /*FALLTHROUGH*/
1454 case BOND_AD_STABLE:
1455 case BOND_AD_BANDWIDTH:
1456 if (__get_agg_bandwidth(curr) > __get_agg_bandwidth(best))
1457 return curr;
1459 break;
1461 default:
1462 pr_warning(DRV_NAME
1463 ": %s: Impossible agg select mode %d\n",
1464 curr->slave->dev->master->name,
1465 __get_agg_selection_mode(curr->lag_ports));
1466 break;
1469 return best;
1472 static int agg_device_up(const struct aggregator *agg)
1474 return (netif_running(agg->slave->dev) &&
1475 netif_carrier_ok(agg->slave->dev));
1479 * ad_agg_selection_logic - select an aggregation group for a team
1480 * @aggregator: the aggregator we're looking at
1482 * It is assumed that only one aggregator may be selected for a team.
1484 * The logic of this function is to select the aggregator according to
1485 * the ad_select policy:
1487 * BOND_AD_STABLE: select the aggregator with the most ports attached to
1488 * it, and to reselect the active aggregator only if the previous
1489 * aggregator has no more ports related to it.
1491 * BOND_AD_BANDWIDTH: select the aggregator with the highest total
1492 * bandwidth, and reselect whenever a link state change takes place or the
1493 * set of slaves in the bond changes.
1495 * BOND_AD_COUNT: select the aggregator with largest number of ports
1496 * (slaves), and reselect whenever a link state change takes place or the
1497 * set of slaves in the bond changes.
1499 * FIXME: this function MUST be called with the first agg in the bond, or
1500 * __get_active_agg() won't work correctly. This function should be better
1501 * called with the bond itself, and retrieve the first agg from it.
1503 static void ad_agg_selection_logic(struct aggregator *agg)
1505 struct aggregator *best, *active, *origin;
1506 struct port *port;
1508 origin = agg;
1509 active = __get_active_agg(agg);
1510 best = (active && agg_device_up(active)) ? active : NULL;
1512 do {
1513 agg->is_active = 0;
1515 if (agg->num_of_ports && agg_device_up(agg))
1516 best = ad_agg_selection_test(best, agg);
1518 } while ((agg = __get_next_agg(agg)));
1520 if (best &&
1521 __get_agg_selection_mode(best->lag_ports) == BOND_AD_STABLE) {
1523 * For the STABLE policy, don't replace the old active
1524 * aggregator if it's still active (it has an answering
1525 * partner) or if both the best and active don't have an
1526 * answering partner.
1528 if (active && active->lag_ports &&
1529 active->lag_ports->is_enabled &&
1530 (__agg_has_partner(active) ||
1531 (!__agg_has_partner(active) && !__agg_has_partner(best)))) {
1532 if (!(!active->actor_oper_aggregator_key &&
1533 best->actor_oper_aggregator_key)) {
1534 best = NULL;
1535 active->is_active = 1;
1540 if (best && (best == active)) {
1541 best = NULL;
1542 active->is_active = 1;
1545 // if there is new best aggregator, activate it
1546 if (best) {
1547 pr_debug("best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1548 best->aggregator_identifier, best->num_of_ports,
1549 best->actor_oper_aggregator_key,
1550 best->partner_oper_aggregator_key,
1551 best->is_individual, best->is_active);
1552 pr_debug("best ports %p slave %p %s\n",
1553 best->lag_ports, best->slave,
1554 best->slave ? best->slave->dev->name : "NULL");
1556 for (agg = __get_first_agg(best->lag_ports); agg;
1557 agg = __get_next_agg(agg)) {
1559 pr_debug("Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1560 agg->aggregator_identifier, agg->num_of_ports,
1561 agg->actor_oper_aggregator_key,
1562 agg->partner_oper_aggregator_key,
1563 agg->is_individual, agg->is_active);
1566 // check if any partner replys
1567 if (best->is_individual) {
1568 pr_warning(DRV_NAME ": %s: Warning: No 802.3ad"
1569 " response from the link partner for any"
1570 " adapters in the bond\n",
1571 best->slave->dev->master->name);
1574 best->is_active = 1;
1575 pr_debug("LAG %d chosen as the active LAG\n",
1576 best->aggregator_identifier);
1577 pr_debug("Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1578 best->aggregator_identifier, best->num_of_ports,
1579 best->actor_oper_aggregator_key,
1580 best->partner_oper_aggregator_key,
1581 best->is_individual, best->is_active);
1583 // disable the ports that were related to the former active_aggregator
1584 if (active) {
1585 for (port = active->lag_ports; port;
1586 port = port->next_port_in_aggregator) {
1587 __disable_port(port);
1593 * if the selected aggregator is of join individuals
1594 * (partner_system is NULL), enable their ports
1596 active = __get_active_agg(origin);
1598 if (active) {
1599 if (!__agg_has_partner(active)) {
1600 for (port = active->lag_ports; port;
1601 port = port->next_port_in_aggregator) {
1602 __enable_port(port);
1607 if (origin->slave) {
1608 struct bonding *bond;
1610 bond = bond_get_bond_by_slave(origin->slave);
1611 if (bond)
1612 bond_3ad_set_carrier(bond);
1617 * ad_clear_agg - clear a given aggregator's parameters
1618 * @aggregator: the aggregator we're looking at
1621 static void ad_clear_agg(struct aggregator *aggregator)
1623 if (aggregator) {
1624 aggregator->is_individual = false;
1625 aggregator->actor_admin_aggregator_key = 0;
1626 aggregator->actor_oper_aggregator_key = 0;
1627 aggregator->partner_system = null_mac_addr;
1628 aggregator->partner_system_priority = 0;
1629 aggregator->partner_oper_aggregator_key = 0;
1630 aggregator->receive_state = 0;
1631 aggregator->transmit_state = 0;
1632 aggregator->lag_ports = NULL;
1633 aggregator->is_active = 0;
1634 aggregator->num_of_ports = 0;
1635 pr_debug("LAG %d was cleared\n", aggregator->aggregator_identifier);
1640 * ad_initialize_agg - initialize a given aggregator's parameters
1641 * @aggregator: the aggregator we're looking at
1644 static void ad_initialize_agg(struct aggregator *aggregator)
1646 if (aggregator) {
1647 ad_clear_agg(aggregator);
1649 aggregator->aggregator_mac_address = null_mac_addr;
1650 aggregator->aggregator_identifier = 0;
1651 aggregator->slave = NULL;
1656 * ad_initialize_port - initialize a given port's parameters
1657 * @aggregator: the aggregator we're looking at
1658 * @lacp_fast: boolean. whether fast periodic should be used
1661 static void ad_initialize_port(struct port *port, int lacp_fast)
1663 static const struct port_params tmpl = {
1664 .system_priority = 0xffff,
1665 .key = 1,
1666 .port_number = 1,
1667 .port_priority = 0xff,
1668 .port_state = 1,
1670 static const struct lacpdu lacpdu = {
1671 .subtype = 0x01,
1672 .version_number = 0x01,
1673 .tlv_type_actor_info = 0x01,
1674 .actor_information_length = 0x14,
1675 .tlv_type_partner_info = 0x02,
1676 .partner_information_length = 0x14,
1677 .tlv_type_collector_info = 0x03,
1678 .collector_information_length = 0x10,
1679 .collector_max_delay = htons(AD_COLLECTOR_MAX_DELAY),
1682 if (port) {
1683 port->actor_port_number = 1;
1684 port->actor_port_priority = 0xff;
1685 port->actor_system = null_mac_addr;
1686 port->actor_system_priority = 0xffff;
1687 port->actor_port_aggregator_identifier = 0;
1688 port->ntt = false;
1689 port->actor_admin_port_key = 1;
1690 port->actor_oper_port_key = 1;
1691 port->actor_admin_port_state = AD_STATE_AGGREGATION | AD_STATE_LACP_ACTIVITY;
1692 port->actor_oper_port_state = AD_STATE_AGGREGATION | AD_STATE_LACP_ACTIVITY;
1694 if (lacp_fast) {
1695 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
1698 memcpy(&port->partner_admin, &tmpl, sizeof(tmpl));
1699 memcpy(&port->partner_oper, &tmpl, sizeof(tmpl));
1701 port->is_enabled = true;
1702 // ****** private parameters ******
1703 port->sm_vars = 0x3;
1704 port->sm_rx_state = 0;
1705 port->sm_rx_timer_counter = 0;
1706 port->sm_periodic_state = 0;
1707 port->sm_periodic_timer_counter = 0;
1708 port->sm_mux_state = 0;
1709 port->sm_mux_timer_counter = 0;
1710 port->sm_tx_state = 0;
1711 port->sm_tx_timer_counter = 0;
1712 port->slave = NULL;
1713 port->aggregator = NULL;
1714 port->next_port_in_aggregator = NULL;
1715 port->transaction_id = 0;
1717 memcpy(&port->lacpdu, &lacpdu, sizeof(lacpdu));
1722 * ad_enable_collecting_distributing - enable a port's transmit/receive
1723 * @port: the port we're looking at
1725 * Enable @port if it's in an active aggregator
1727 static void ad_enable_collecting_distributing(struct port *port)
1729 if (port->aggregator->is_active) {
1730 pr_debug("Enabling port %d(LAG %d)\n", port->actor_port_number, port->aggregator->aggregator_identifier);
1731 __enable_port(port);
1736 * ad_disable_collecting_distributing - disable a port's transmit/receive
1737 * @port: the port we're looking at
1740 static void ad_disable_collecting_distributing(struct port *port)
1742 if (port->aggregator && MAC_ADDRESS_COMPARE(&(port->aggregator->partner_system), &(null_mac_addr))) {
1743 pr_debug("Disabling port %d(LAG %d)\n", port->actor_port_number, port->aggregator->aggregator_identifier);
1744 __disable_port(port);
#if 0
/**
 * ad_marker_info_send - send a marker information frame
 * @port: the port we're looking at
 *
 * Builds a Marker Information PDU for @port and hands it to ad_marker_send().
 * Compiled out (#if 0): we decided not to implement send and handle response
 * for marker PDU's, in this stage, but only to respond to marker information.
 */
static void ad_marker_info_send(struct port *port)
{
	struct bond_marker marker;
	u16 index;

	// fill the marker PDU with the appropriate values
	marker.subtype = 0x02;
	marker.version_number = 0x01;
	marker.tlv_type = AD_MARKER_INFORMATION_SUBTYPE;
	marker.marker_length = 0x16;
	// requester_port goes out in network (big endian) byte order
	marker.requester_port = htons(port->actor_port_number);
	marker.requester_system = port->actor_system;
	// advance the transaction id first, then convert it to network byte
	// order; doing both inside one expression reads and modifies
	// transaction_id without sequencing
	port->transaction_id++;
	marker.requester_transaction_id = htonl(port->transaction_id);
	marker.pad = 0;
	marker.tlv_type_terminator = 0x00;
	marker.terminator_length = 0x00;
	for (index = 0; index < 90; index++) {
		marker.reserved_90[index] = 0;
	}

	// send the marker information
	if (ad_marker_send(port, &marker) >= 0) {
		pr_debug("Sent Marker Information on port %d\n", port->actor_port_number);
	}
}
#endif
1787 * ad_marker_info_received - handle receive of a Marker information frame
1788 * @marker_info: Marker info received
1789 * @port: the port we're looking at
1792 static void ad_marker_info_received(struct bond_marker *marker_info,
1793 struct port *port)
1795 struct bond_marker marker;
1797 // copy the received marker data to the response marker
1798 //marker = *marker_info;
1799 memcpy(&marker, marker_info, sizeof(struct bond_marker));
1800 // change the marker subtype to marker response
1801 marker.tlv_type=AD_MARKER_RESPONSE_SUBTYPE;
1802 // send the marker response
1804 if (ad_marker_send(port, &marker) >= 0) {
1805 pr_debug("Sent Marker Response on port %d\n", port->actor_port_number);
/**
 * ad_marker_response_received - handle receive of a marker response frame
 * @marker: marker PDU received
 * @port: the port we're looking at
 *
 * This function does nothing since we decided not to implement send and handle
 * response for marker PDU's, in this stage, but only to respond to marker
 * information.
 */
static void ad_marker_response_received(struct bond_marker *marker,
					struct port *port)
{
	/* both arguments are deliberately unused: feature not implemented */
	(void)marker;
	(void)port;
}
1826 //////////////////////////////////////////////////////////////////////////////////////
1827 // ================= AD exported functions to the main bonding code ==================
1828 //////////////////////////////////////////////////////////////////////////////////////
1830 // Check aggregators status in team every T seconds
1831 #define AD_AGGREGATOR_SELECTION_TIMER 8
1834 * bond_3ad_initiate_agg_selection(struct bonding *bond)
1836 * Set the aggregation selection timer, to initiate an agg selection in
1837 * the very near future. Called during first initialization, and during
1838 * any down to up transitions of the bond.
1840 void bond_3ad_initiate_agg_selection(struct bonding *bond, int timeout)
1842 BOND_AD_INFO(bond).agg_select_timer = timeout;
1843 BOND_AD_INFO(bond).agg_select_mode = bond->params.ad_select;
1846 static u16 aggregator_identifier;
1849 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures
1850 * @bond: bonding struct to work on
1851 * @tick_resolution: tick duration (millisecond resolution)
1852 * @lacp_fast: boolean. whether fast periodic should be used
1854 * Can be called only after the mac address of the bond is set.
1856 void bond_3ad_initialize(struct bonding *bond, u16 tick_resolution, int lacp_fast)
1858 // check that the bond is not initialized yet
1859 if (MAC_ADDRESS_COMPARE(&(BOND_AD_INFO(bond).system.sys_mac_addr),
1860 bond->dev->dev_addr)) {
1862 aggregator_identifier = 0;
1864 BOND_AD_INFO(bond).lacp_fast = lacp_fast;
1865 BOND_AD_INFO(bond).system.sys_priority = 0xFFFF;
1866 BOND_AD_INFO(bond).system.sys_mac_addr = *((struct mac_addr *)bond->dev->dev_addr);
1868 // initialize how many times this module is called in one second(should be about every 100ms)
1869 ad_ticks_per_sec = tick_resolution;
1871 bond_3ad_initiate_agg_selection(bond,
1872 AD_AGGREGATOR_SELECTION_TIMER *
1873 ad_ticks_per_sec);
1878 * bond_3ad_bind_slave - initialize a slave's port
1879 * @slave: slave struct to work on
1881 * Returns: 0 on success
1882 * < 0 on error
1884 int bond_3ad_bind_slave(struct slave *slave)
1886 struct bonding *bond = bond_get_bond_by_slave(slave);
1887 struct port *port;
1888 struct aggregator *aggregator;
1890 if (bond == NULL) {
1891 pr_err(DRV_NAME ": %s: The slave %s is not attached to "
1892 "its bond\n",
1893 slave->dev->master->name, slave->dev->name);
1894 return -1;
1897 //check that the slave has not been intialized yet.
1898 if (SLAVE_AD_INFO(slave).port.slave != slave) {
1900 // port initialization
1901 port = &(SLAVE_AD_INFO(slave).port);
1903 ad_initialize_port(port, BOND_AD_INFO(bond).lacp_fast);
1905 port->slave = slave;
1906 port->actor_port_number = SLAVE_AD_INFO(slave).id;
1907 // key is determined according to the link speed, duplex and user key(which is yet not supported)
1908 // ------------------------------------------------------------
1909 // Port key : | User key | Speed |Duplex|
1910 // ------------------------------------------------------------
1911 // 16 6 1 0
1912 port->actor_admin_port_key = 0; // initialize this parameter
1913 port->actor_admin_port_key |= __get_duplex(port);
1914 port->actor_admin_port_key |= (__get_link_speed(port) << 1);
1915 port->actor_oper_port_key = port->actor_admin_port_key;
1916 // if the port is not full duplex, then the port should be not lacp Enabled
1917 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_BITS)) {
1918 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1920 // actor system is the bond's system
1921 port->actor_system = BOND_AD_INFO(bond).system.sys_mac_addr;
1922 // tx timer(to verify that no more than MAX_TX_IN_SECOND lacpdu's are sent in one second)
1923 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1924 port->aggregator = NULL;
1925 port->next_port_in_aggregator = NULL;
1927 __disable_port(port);
1928 __initialize_port_locks(port);
1931 // aggregator initialization
1932 aggregator = &(SLAVE_AD_INFO(slave).aggregator);
1934 ad_initialize_agg(aggregator);
1936 aggregator->aggregator_mac_address = *((struct mac_addr *)bond->dev->dev_addr);
1937 aggregator->aggregator_identifier = (++aggregator_identifier);
1938 aggregator->slave = slave;
1939 aggregator->is_active = 0;
1940 aggregator->num_of_ports = 0;
1943 return 0;
1947 * bond_3ad_unbind_slave - deinitialize a slave's port
1948 * @slave: slave struct to work on
1950 * Search for the aggregator that is related to this port, remove the
1951 * aggregator and assign another aggregator for other port related to it
1952 * (if any), and remove the port.
// Tear down the 802.3ad state of @slave's port. In order, this function:
//   1. tells the partner the port is no longer aggregatable (sends a LACPDU),
//   2. if the slave's own aggregator still carries ports other than this one,
//      moves that aggregator's state onto a free aggregator,
//   3. unlinks the port from whichever aggregator's port list contains it,
//   4. marks the port uninitialized by clearing port->slave.
// Whenever an active aggregator is cleared on the way, the aggregator
// selection logic is re-run.
1954 void bond_3ad_unbind_slave(struct slave *slave)
1956 struct port *port, *prev_port, *temp_port;
1957 struct aggregator *aggregator, *new_aggregator, *temp_aggregator;
// set when an active aggregator is being removed and a new one must be selected
1958 int select_new_active_agg = 0;
1960 // find the aggregator related to this slave
1961 aggregator = &(SLAVE_AD_INFO(slave).aggregator);
1963 // find the port related to this slave
1964 port = &(SLAVE_AD_INFO(slave).port);
1966 // if port->slave is null, the whole port is not initialized
1967 if (!port->slave) {
1968 pr_warning(DRV_NAME ": Warning: %s: Trying to "
1969 "unbind an uninitialized port on %s\n",
1970 slave->dev->master->name, slave->dev->name);
1971 return;
1974 pr_debug("Unbinding Link Aggregation Group %d\n", aggregator->aggregator_identifier);
1976 /* Tell the partner that this port is not suitable for aggregation */
1977 port->actor_oper_port_state &= ~AD_STATE_AGGREGATION;
1978 __update_lacpdu_from_port(port);
1979 ad_lacpdu_send(port);
1981 // check if this aggregator is occupied
1982 if (aggregator->lag_ports) {
1983 // check whether ports other than this slave's port are attached to this
1984 // aggregator (its list head is another port, or the head has a successor);
1985 // only then is there a reason to search for a replacement aggregator
1986 if ((aggregator->lag_ports != port) || (aggregator->lag_ports->next_port_in_aggregator)) {
1987 // find new aggregator for the related port(s)
1988 new_aggregator = __get_first_agg(port);
1989 for (; new_aggregator; new_aggregator = __get_next_agg(new_aggregator)) {
1990 // if the new aggregator is empty, or it is connected to our port only
1991 if (!new_aggregator->lag_ports || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator)) {
1992 break;
1995 // if new aggregator found, copy the aggregator's parameters
1996 // and connect the related lag_ports to the new aggregator
// (the second half of this condition repeats the loop's break condition, so
// it holds whenever the loop ended with a non-NULL new_aggregator)
1997 if ((new_aggregator) && ((!new_aggregator->lag_ports) || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator))) {
1998 pr_debug("Some port(s) related to LAG %d - replaceing with LAG %d\n", aggregator->aggregator_identifier, new_aggregator->aggregator_identifier);
// the replacement currently holds only our port and is the active aggregator:
// its state is about to be overwritten, so a new selection is needed afterwards
2000 if ((new_aggregator->lag_ports == port) && new_aggregator->is_active) {
2001 pr_info(DRV_NAME ": %s: Removing an active aggregator\n",
2002 aggregator->slave->dev->master->name);
2003 // select new active aggregator
2004 select_new_active_agg = 1;
// copy the departing aggregator's parameters, port list and counters
2007 new_aggregator->is_individual = aggregator->is_individual;
2008 new_aggregator->actor_admin_aggregator_key = aggregator->actor_admin_aggregator_key;
2009 new_aggregator->actor_oper_aggregator_key = aggregator->actor_oper_aggregator_key;
2010 new_aggregator->partner_system = aggregator->partner_system;
2011 new_aggregator->partner_system_priority = aggregator->partner_system_priority;
2012 new_aggregator->partner_oper_aggregator_key = aggregator->partner_oper_aggregator_key;
2013 new_aggregator->receive_state = aggregator->receive_state;
2014 new_aggregator->transmit_state = aggregator->transmit_state;
2015 new_aggregator->lag_ports = aggregator->lag_ports;
2016 new_aggregator->is_active = aggregator->is_active;
2017 new_aggregator->num_of_ports = aggregator->num_of_ports;
2019 // update the information that is written on the ports about the aggregator
2020 for (temp_port=aggregator->lag_ports; temp_port; temp_port=temp_port->next_port_in_aggregator) {
2021 temp_port->aggregator=new_aggregator;
2022 temp_port->actor_port_aggregator_identifier = new_aggregator->aggregator_identifier;
2025 // clear the aggregator
2026 ad_clear_agg(aggregator);
2028 if (select_new_active_agg) {
2029 ad_agg_selection_logic(__get_first_agg(port));
2031 } else {
2032 pr_warning(DRV_NAME ": %s: Warning: unbinding aggregator, "
2033 "and could not find a new aggregator for its ports\n",
2034 slave->dev->master->name);
2036 } else { // in case that the only port related to this aggregator is the one we want to remove
// read is_active before clearing, since it is tested after ad_clear_agg()
2037 select_new_active_agg = aggregator->is_active;
2038 // clear the aggregator
2039 ad_clear_agg(aggregator);
2040 if (select_new_active_agg) {
2041 pr_info(DRV_NAME ": %s: Removing an active aggregator\n",
2042 slave->dev->master->name);
2043 // select new active aggregator
2044 ad_agg_selection_logic(__get_first_agg(port));
2049 pr_debug("Unbinding port %d\n", port->actor_port_number);
2050 // find the aggregator that this port is connected to
2051 temp_aggregator = __get_first_agg(port);
2052 for (; temp_aggregator; temp_aggregator = __get_next_agg(temp_aggregator)) {
// prev_port trails temp_port so the port can be unlinked from the singly linked list
2053 prev_port = NULL;
2054 // search the port in the aggregator's related ports
2055 for (temp_port=temp_aggregator->lag_ports; temp_port; prev_port=temp_port, temp_port=temp_port->next_port_in_aggregator) {
2056 if (temp_port == port) { // the aggregator found - detach the port from this aggregator
2057 if (prev_port) {
2058 prev_port->next_port_in_aggregator = temp_port->next_port_in_aggregator;
2059 } else {
// the port was the list head: advance the head instead
2060 temp_aggregator->lag_ports = temp_port->next_port_in_aggregator;
2062 temp_aggregator->num_of_ports--;
// the aggregator lost its last port
2063 if (temp_aggregator->num_of_ports==0) {
2064 select_new_active_agg = temp_aggregator->is_active;
2065 // clear the aggregator
2066 ad_clear_agg(temp_aggregator);
2067 if (select_new_active_agg) {
2068 pr_info(DRV_NAME ": %s: Removing an active aggregator\n",
2069 slave->dev->master->name);
2070 // select new active aggregator
2071 ad_agg_selection_logic(__get_first_agg(port));
2074 break;
// mark the port uninitialized; the other entry points test port->slave for this
2078 port->slave=NULL;
2082 * bond_3ad_state_machine_handler - handle state machines timeout
2083 * @bond: bonding struct to work on
2085 * The state machine handling concept in this module is to check every tick
2086 * which state machine should operate any function. The execution order is
2087 * round robin, so when we have an interaction between state machines, the
2088 * reply of one to each other might be delayed until next tick.
2090 * This function also complete the initialization when the agg_select_timer
2091 * times out, and it selects an aggregator for the ports that are yet not
2092 * related to any aggregator, and selects the active aggregator for a bond.
2094 void bond_3ad_state_machine_handler(struct work_struct *work)
2096 struct bonding *bond = container_of(work, struct bonding,
2097 ad_work.work);
2098 struct port *port;
2099 struct aggregator *aggregator;
2101 read_lock(&bond->lock);
2103 if (bond->kill_timers) {
2104 goto out;
2107 //check if there are any slaves
2108 if (bond->slave_cnt == 0) {
2109 goto re_arm;
2112 // check if agg_select_timer timer after initialize is timed out
2113 if (BOND_AD_INFO(bond).agg_select_timer && !(--BOND_AD_INFO(bond).agg_select_timer)) {
2114 // select the active aggregator for the bond
2115 if ((port = __get_first_port(bond))) {
2116 if (!port->slave) {
2117 pr_warning(DRV_NAME ": %s: Warning: bond's first port is "
2118 "uninitialized\n", bond->dev->name);
2119 goto re_arm;
2122 aggregator = __get_first_agg(port);
2123 ad_agg_selection_logic(aggregator);
2125 bond_3ad_set_carrier(bond);
2128 // for each port run the state machines
2129 for (port = __get_first_port(bond); port; port = __get_next_port(port)) {
2130 if (!port->slave) {
2131 pr_warning(DRV_NAME ": %s: Warning: Found an uninitialized "
2132 "port\n", bond->dev->name);
2133 goto re_arm;
2136 ad_rx_machine(NULL, port);
2137 ad_periodic_machine(port);
2138 ad_port_selection_logic(port);
2139 ad_mux_machine(port);
2140 ad_tx_machine(port);
2142 // turn off the BEGIN bit, since we already handled it
2143 if (port->sm_vars & AD_PORT_BEGIN) {
2144 port->sm_vars &= ~AD_PORT_BEGIN;
2148 re_arm:
2149 queue_delayed_work(bond->wq, &bond->ad_work, ad_delta_in_ticks);
2150 out:
2151 read_unlock(&bond->lock);
2155 * bond_3ad_rx_indication - handle a received frame
2156 * @lacpdu: received lacpdu
2157 * @slave: slave struct to work on
2158 * @length: length of the data received
2160 * It is assumed that frames that were sent on this NIC don't returned as new
2161 * received frames (loopback). Since only the payload is given to this
2162 * function, it check for loopback.
2164 static void bond_3ad_rx_indication(struct lacpdu *lacpdu, struct slave *slave, u16 length)
2166 struct port *port;
2168 if (length >= sizeof(struct lacpdu)) {
2170 port = &(SLAVE_AD_INFO(slave).port);
2172 if (!port->slave) {
2173 pr_warning(DRV_NAME ": %s: Warning: port of slave %s "
2174 "is uninitialized\n",
2175 slave->dev->name, slave->dev->master->name);
2176 return;
2179 switch (lacpdu->subtype) {
2180 case AD_TYPE_LACPDU:
2181 pr_debug("Received LACPDU on port %d\n", port->actor_port_number);
2182 ad_rx_machine(lacpdu, port);
2183 break;
2185 case AD_TYPE_MARKER:
2186 // No need to convert fields to Little Endian since we don't use the marker's fields.
2188 switch (((struct bond_marker *)lacpdu)->tlv_type) {
2189 case AD_MARKER_INFORMATION_SUBTYPE:
2190 pr_debug("Received Marker Information on port %d\n", port->actor_port_number);
2191 ad_marker_info_received((struct bond_marker *)lacpdu, port);
2192 break;
2194 case AD_MARKER_RESPONSE_SUBTYPE:
2195 pr_debug("Received Marker Response on port %d\n", port->actor_port_number);
2196 ad_marker_response_received((struct bond_marker *)lacpdu, port);
2197 break;
2199 default:
2200 pr_debug("Received an unknown Marker subtype on slot %d\n", port->actor_port_number);
2207 * bond_3ad_adapter_speed_changed - handle a slave's speed change indication
2208 * @slave: slave struct to work on
2210 * Handle reselection of aggregator (if needed) for this port.
2212 void bond_3ad_adapter_speed_changed(struct slave *slave)
2214 struct port *port;
2216 port = &(SLAVE_AD_INFO(slave).port);
2218 // if slave is null, the whole port is not initialized
2219 if (!port->slave) {
2220 pr_warning(DRV_NAME ": Warning: %s: speed "
2221 "changed for uninitialized port on %s\n",
2222 slave->dev->master->name, slave->dev->name);
2223 return;
2226 port->actor_admin_port_key &= ~AD_SPEED_KEY_BITS;
2227 port->actor_oper_port_key=port->actor_admin_port_key |= (__get_link_speed(port) << 1);
2228 pr_debug("Port %d changed speed\n", port->actor_port_number);
2229 // there is no need to reselect a new aggregator, just signal the
2230 // state machines to reinitialize
2231 port->sm_vars |= AD_PORT_BEGIN;
2235 * bond_3ad_adapter_duplex_changed - handle a slave's duplex change indication
2236 * @slave: slave struct to work on
2238 * Handle reselection of aggregator (if needed) for this port.
2240 void bond_3ad_adapter_duplex_changed(struct slave *slave)
2242 struct port *port;
2244 port=&(SLAVE_AD_INFO(slave).port);
2246 // if slave is null, the whole port is not initialized
2247 if (!port->slave) {
2248 pr_warning(DRV_NAME ": %s: Warning: duplex changed "
2249 "for uninitialized port on %s\n",
2250 slave->dev->master->name, slave->dev->name);
2251 return;
2254 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS;
2255 port->actor_oper_port_key=port->actor_admin_port_key |= __get_duplex(port);
2256 pr_debug("Port %d changed duplex\n", port->actor_port_number);
2257 // there is no need to reselect a new aggregator, just signal the
2258 // state machines to reinitialize
2259 port->sm_vars |= AD_PORT_BEGIN;
2263 * bond_3ad_handle_link_change - handle a slave's link status change indication
2264 * @slave: slave struct to work on
2265 * @status: whether the link is now up or down
2267 * Handle reselection of aggregator (if needed) for this port.
2269 void bond_3ad_handle_link_change(struct slave *slave, char link)
2271 struct port *port;
2273 port = &(SLAVE_AD_INFO(slave).port);
2275 // if slave is null, the whole port is not initialized
2276 if (!port->slave) {
2277 pr_warning(DRV_NAME ": Warning: %s: link status changed for "
2278 "uninitialized port on %s\n",
2279 slave->dev->master->name, slave->dev->name);
2280 return;
2283 // on link down we are zeroing duplex and speed since some of the adaptors(ce1000.lan) report full duplex/speed instead of N/A(duplex) / 0(speed)
2284 // on link up we are forcing recheck on the duplex and speed since some of he adaptors(ce1000.lan) report
2285 if (link == BOND_LINK_UP) {
2286 port->is_enabled = true;
2287 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS;
2288 port->actor_oper_port_key=port->actor_admin_port_key |= __get_duplex(port);
2289 port->actor_admin_port_key &= ~AD_SPEED_KEY_BITS;
2290 port->actor_oper_port_key=port->actor_admin_port_key |= (__get_link_speed(port) << 1);
2291 } else {
2292 /* link has failed */
2293 port->is_enabled = false;
2294 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS;
2295 port->actor_oper_port_key= (port->actor_admin_port_key &= ~AD_SPEED_KEY_BITS);
2297 //BOND_PRINT_DBG(("Port %d changed link status to %s", port->actor_port_number, ((link == BOND_LINK_UP)?"UP":"DOWN")));
2298 // there is no need to reselect a new aggregator, just signal the
2299 // state machines to reinitialize
2300 port->sm_vars |= AD_PORT_BEGIN;
2304 * set link state for bonding master: if we have an active
2305 * aggregator, we're up, if not, we're down. Presumes that we cannot
2306 * have an active aggregator if there are no slaves with link up.
2308 * This behavior complies with IEEE 802.3 section 43.3.9.
2310 * Called by bond_set_carrier(). Return zero if carrier state does not
2311 * change, nonzero if it does.
2313 int bond_3ad_set_carrier(struct bonding *bond)
2315 if (__get_active_agg(&(SLAVE_AD_INFO(bond->first_slave).aggregator))) {
2316 if (!netif_carrier_ok(bond->dev)) {
2317 netif_carrier_on(bond->dev);
2318 return 1;
2320 return 0;
2323 if (netif_carrier_ok(bond->dev)) {
2324 netif_carrier_off(bond->dev);
2325 return 1;
2327 return 0;
2331 * bond_3ad_get_active_agg_info - get information of the active aggregator
2332 * @bond: bonding struct to work on
2333 * @ad_info: ad_info struct to fill with the bond's info
2335 * Returns: 0 on success
2336 * < 0 on error
2338 int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info)
2340 struct aggregator *aggregator = NULL;
2341 struct port *port;
2343 for (port = __get_first_port(bond); port; port = __get_next_port(port)) {
2344 if (port->aggregator && port->aggregator->is_active) {
2345 aggregator = port->aggregator;
2346 break;
2350 if (aggregator) {
2351 ad_info->aggregator_id = aggregator->aggregator_identifier;
2352 ad_info->ports = aggregator->num_of_ports;
2353 ad_info->actor_key = aggregator->actor_oper_aggregator_key;
2354 ad_info->partner_key = aggregator->partner_oper_aggregator_key;
2355 memcpy(ad_info->partner_system, aggregator->partner_system.mac_addr_value, ETH_ALEN);
2356 return 0;
2359 return -1;
2362 int bond_3ad_xmit_xor(struct sk_buff *skb, struct net_device *dev)
2364 struct slave *slave, *start_at;
2365 struct bonding *bond = netdev_priv(dev);
2366 int slave_agg_no;
2367 int slaves_in_agg;
2368 int agg_id;
2369 int i;
2370 struct ad_info ad_info;
2371 int res = 1;
2373 /* make sure that the slaves list will
2374 * not change during tx
2376 read_lock(&bond->lock);
2378 if (!BOND_IS_OK(bond)) {
2379 goto out;
2382 if (bond_3ad_get_active_agg_info(bond, &ad_info)) {
2383 pr_debug(DRV_NAME ": %s: Error: "
2384 "bond_3ad_get_active_agg_info failed\n", dev->name);
2385 goto out;
2388 slaves_in_agg = ad_info.ports;
2389 agg_id = ad_info.aggregator_id;
2391 if (slaves_in_agg == 0) {
2392 /*the aggregator is empty*/
2393 pr_debug(DRV_NAME ": %s: Error: active aggregator is empty\n",
2394 dev->name);
2395 goto out;
2398 slave_agg_no = bond->xmit_hash_policy(skb, dev, slaves_in_agg);
2400 bond_for_each_slave(bond, slave, i) {
2401 struct aggregator *agg = SLAVE_AD_INFO(slave).port.aggregator;
2403 if (agg && (agg->aggregator_identifier == agg_id)) {
2404 slave_agg_no--;
2405 if (slave_agg_no < 0) {
2406 break;
2411 if (slave_agg_no >= 0) {
2412 pr_err(DRV_NAME ": %s: Error: Couldn't find a slave to tx on "
2413 "for aggregator ID %d\n", dev->name, agg_id);
2414 goto out;
2417 start_at = slave;
2419 bond_for_each_slave_from(bond, slave, i, start_at) {
2420 int slave_agg_id = 0;
2421 struct aggregator *agg = SLAVE_AD_INFO(slave).port.aggregator;
2423 if (agg) {
2424 slave_agg_id = agg->aggregator_identifier;
2427 if (SLAVE_IS_OK(slave) && agg && (slave_agg_id == agg_id)) {
2428 res = bond_dev_queue_xmit(bond, skb, slave->dev);
2429 break;
2433 out:
2434 if (res) {
2435 /* no suitable interface, frame not sent */
2436 dev_kfree_skb(skb);
2438 read_unlock(&bond->lock);
2439 return NETDEV_TX_OK;
2442 int bond_3ad_lacpdu_recv(struct sk_buff *skb, struct net_device *dev, struct packet_type* ptype, struct net_device *orig_dev)
2444 struct bonding *bond = netdev_priv(dev);
2445 struct slave *slave = NULL;
2446 int ret = NET_RX_DROP;
2448 if (dev_net(dev) != &init_net)
2449 goto out;
2451 if (!(dev->flags & IFF_MASTER))
2452 goto out;
2454 read_lock(&bond->lock);
2455 slave = bond_get_slave_by_dev((struct bonding *)netdev_priv(dev),
2456 orig_dev);
2457 if (!slave)
2458 goto out_unlock;
2460 bond_3ad_rx_indication((struct lacpdu *) skb->data, slave, skb->len);
2462 ret = NET_RX_SUCCESS;
2464 out_unlock:
2465 read_unlock(&bond->lock);
2466 out:
2467 dev_kfree_skb(skb);
2469 return ret;