]> git.proxmox.com Git - mirror_ubuntu-jammy-kernel.git/blob - drivers/net/bonding/bond_3ad.c
Merge branch 'bonding_rtnl'
[mirror_ubuntu-jammy-kernel.git] / drivers / net / bonding / bond_3ad.c
1 /*
2 * Copyright(c) 1999 - 2004 Intel Corporation. All rights reserved.
3 *
4 * This program is free software; you can redistribute it and/or modify it
5 * under the terms of the GNU General Public License as published by the Free
6 * Software Foundation; either version 2 of the License, or (at your option)
7 * any later version.
8 *
9 * This program is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
12 * more details.
13 *
14 * You should have received a copy of the GNU General Public License along with
15 * this program; if not, write to the Free Software Foundation, Inc., 59
16 * Temple Place - Suite 330, Boston, MA 02111-1307, USA.
17 *
18 * The full GNU General Public License is included in this distribution in the
19 * file called LICENSE.
20 *
21 */
22
23 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
24
25 #include <linux/skbuff.h>
26 #include <linux/if_ether.h>
27 #include <linux/netdevice.h>
28 #include <linux/spinlock.h>
29 #include <linux/ethtool.h>
30 #include <linux/etherdevice.h>
31 #include <linux/if_bonding.h>
32 #include <linux/pkt_sched.h>
33 #include <net/net_namespace.h>
34 #include "bonding.h"
35 #include "bond_3ad.h"
36
/* General definitions */
#define AD_SHORT_TIMEOUT		1
#define AD_LONG_TIMEOUT			0
#define AD_STANDBY			0x2
#define AD_MAX_TX_IN_SECOND		3
#define AD_COLLECTOR_MAX_DELAY		0

/* Timer definitions (43.4.4 in the 802.3ad standard).
 * All values are in seconds; __ad_timer_to_ticks() scales them by
 * ad_ticks_per_sec.
 */
#define AD_FAST_PERIODIC_TIME		1
#define AD_SLOW_PERIODIC_TIME		30
#define AD_SHORT_TIMEOUT_TIME		(3 * AD_FAST_PERIODIC_TIME)
#define AD_LONG_TIMEOUT_TIME		(3 * AD_SLOW_PERIODIC_TIME)
#define AD_CHURN_DETECTION_TIME		60
#define AD_AGGREGATE_WAIT_TIME		2
51
/* Port state definitions (43.4.2.2 in the 802.3ad standard).
 * One bit per flag, bit 0 first.
 */
#define AD_STATE_LACP_ACTIVITY		(1 << 0)
#define AD_STATE_LACP_TIMEOUT		(1 << 1)
#define AD_STATE_AGGREGATION		(1 << 2)
#define AD_STATE_SYNCHRONIZATION	(1 << 3)
#define AD_STATE_COLLECTING		(1 << 4)
#define AD_STATE_DISTRIBUTING		(1 << 5)
#define AD_STATE_DEFAULTED		(1 << 6)
#define AD_STATE_EXPIRED		(1 << 7)

/* Port Variables definitions used by the State Machines (43.4.7 in the
 * 802.3ad standard). These are the bits kept in port->sm_vars.
 */
#define AD_PORT_BEGIN			(1 << 0)
#define AD_PORT_LACP_ENABLED		(1 << 1)
#define AD_PORT_ACTOR_CHURN		(1 << 2)
#define AD_PORT_PARTNER_CHURN		(1 << 3)
#define AD_PORT_READY			(1 << 4)
#define AD_PORT_READY_N			(1 << 5)
#define AD_PORT_MATCHED			(1 << 6)
#define AD_PORT_STANDBY			(1 << 7)
#define AD_PORT_SELECTED		(1 << 8)
#define AD_PORT_MOVED			(1 << 9)
75
/* Port Key definitions
 * key is determined according to the link speed, duplex and
 * user key (which is yet not supported)
 *           ------------------------------------------------------------
 * Port key: | User key                   | Speed            | Duplex   |
 *           ------------------------------------------------------------
 *           16                           6                  1          0
 */
#define AD_DUPLEX_KEY_BITS		0x0001
#define AD_SPEED_KEY_BITS		0x003E
#define AD_USER_KEY_BITS		0xFFC0

/* Link speed encoding, one bit per supported speed */
#define AD_LINK_SPEED_BITMASK_1MBPS	(1 << 0)
#define AD_LINK_SPEED_BITMASK_10MBPS	(1 << 1)
#define AD_LINK_SPEED_BITMASK_100MBPS	(1 << 2)
#define AD_LINK_SPEED_BITMASK_1000MBPS	(1 << 3)
#define AD_LINK_SPEED_BITMASK_10000MBPS	(1 << 4)
/* Compare two MAC addresses given as pointers to any object whose first
 * bytes are the address. Both arguments are parenthesized before the cast
 * so that expression arguments (e.g. "base + 1") are cast as a whole.
 * Evaluates to the result of ether_addr_equal_64bits().
 */
#define MAC_ADDRESS_EQUAL(A, B)	\
	ether_addr_equal_64bits((const u8 *)(A), (const u8 *)(B))
97
98 static struct mac_addr null_mac_addr = { { 0, 0, 0, 0, 0, 0 } };
99 static u16 ad_ticks_per_sec;
100 static const int ad_delta_in_ticks = (AD_TIMER_INTERVAL * HZ) / 1000;
101
102 static const u8 lacpdu_mcast_addr[ETH_ALEN] = MULTICAST_LACPDU_ADDR;
103
/* ================= main 802.3ad protocol functions ================== */

/* frame transmission */
static int ad_lacpdu_send(struct port *port);
static int ad_marker_send(struct port *port, struct bond_marker *marker);

/* per-port state machines */
static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port);
static void ad_periodic_machine(struct port *port);
static void ad_mux_machine(struct port *port);
static void ad_tx_machine(struct port *port);

/* selection logic */
static void ad_port_selection_logic(struct port *port);
static void ad_agg_selection_logic(struct aggregator *aggregator);

/* initialization and teardown */
static void ad_clear_agg(struct aggregator *aggregator);
static void ad_initialize_agg(struct aggregator *aggregator);
static void ad_initialize_port(struct port *port, int lacp_fast);

/* collecting/distributing control */
static void ad_enable_collecting_distributing(struct port *port);
static void ad_disable_collecting_distributing(struct port *port);

/* marker protocol */
static void ad_marker_info_received(struct bond_marker *marker_info,
				    struct port *port);
static void ad_marker_response_received(struct bond_marker *marker,
					struct port *port);
122
123
124 /* ================= api to bonding and kernel code ================== */
125
126 /**
127 * __get_bond_by_port - get the port's bonding struct
128 * @port: the port we're looking at
129 *
130 * Return @port's bonding struct, or %NULL if it can't be found.
131 */
132 static inline struct bonding *__get_bond_by_port(struct port *port)
133 {
134 if (port->slave == NULL)
135 return NULL;
136
137 return bond_get_bond_by_slave(port->slave);
138 }
139
140 /**
141 * __get_first_agg - get the first aggregator in the bond
142 * @bond: the bond we're looking at
143 *
144 * Return the aggregator of the first slave in @bond, or %NULL if it can't be
145 * found.
146 * The caller must hold RCU or RTNL lock.
147 */
148 static inline struct aggregator *__get_first_agg(struct port *port)
149 {
150 struct bonding *bond = __get_bond_by_port(port);
151 struct slave *first_slave;
152 struct aggregator *agg;
153
154 /* If there's no bond for this port, or bond has no slaves */
155 if (bond == NULL)
156 return NULL;
157
158 rcu_read_lock();
159 first_slave = bond_first_slave_rcu(bond);
160 agg = first_slave ? &(SLAVE_AD_INFO(first_slave).aggregator) : NULL;
161 rcu_read_unlock();
162
163 return agg;
164 }
165
166 /**
167 * __agg_has_partner - see if we have a partner
168 * @agg: the agregator we're looking at
169 *
170 * Return nonzero if aggregator has a partner (denoted by a non-zero ether
171 * address for the partner). Return 0 if not.
172 */
173 static inline int __agg_has_partner(struct aggregator *agg)
174 {
175 return !is_zero_ether_addr(agg->partner_system.mac_addr_value);
176 }
177
178 /**
179 * __disable_port - disable the port's slave
180 * @port: the port we're looking at
181 */
182 static inline void __disable_port(struct port *port)
183 {
184 bond_set_slave_inactive_flags(port->slave, BOND_SLAVE_NOTIFY_LATER);
185 }
186
187 /**
188 * __enable_port - enable the port's slave, if it's up
189 * @port: the port we're looking at
190 */
191 static inline void __enable_port(struct port *port)
192 {
193 struct slave *slave = port->slave;
194
195 if ((slave->link == BOND_LINK_UP) && IS_UP(slave->dev))
196 bond_set_slave_active_flags(slave, BOND_SLAVE_NOTIFY_LATER);
197 }
198
199 /**
200 * __port_is_enabled - check if the port's slave is in active state
201 * @port: the port we're looking at
202 */
203 static inline int __port_is_enabled(struct port *port)
204 {
205 return bond_is_active_slave(port->slave);
206 }
207
208 /**
209 * __get_agg_selection_mode - get the aggregator selection mode
210 * @port: the port we're looking at
211 *
212 * Get the aggregator selection mode. Can be %STABLE, %BANDWIDTH or %COUNT.
213 */
214 static inline u32 __get_agg_selection_mode(struct port *port)
215 {
216 struct bonding *bond = __get_bond_by_port(port);
217
218 if (bond == NULL)
219 return BOND_AD_STABLE;
220
221 return bond->params.ad_select;
222 }
223
224 /**
225 * __check_agg_selection_timer - check if the selection timer has expired
226 * @port: the port we're looking at
227 */
228 static inline int __check_agg_selection_timer(struct port *port)
229 {
230 struct bonding *bond = __get_bond_by_port(port);
231
232 if (bond == NULL)
233 return 0;
234
235 return BOND_AD_INFO(bond).agg_select_timer ? 1 : 0;
236 }
237
238 /**
239 * __get_state_machine_lock - lock the port's state machines
240 * @port: the port we're looking at
241 */
242 static inline void __get_state_machine_lock(struct port *port)
243 {
244 spin_lock_bh(&(SLAVE_AD_INFO(port->slave).state_machine_lock));
245 }
246
247 /**
248 * __release_state_machine_lock - unlock the port's state machines
249 * @port: the port we're looking at
250 */
251 static inline void __release_state_machine_lock(struct port *port)
252 {
253 spin_unlock_bh(&(SLAVE_AD_INFO(port->slave).state_machine_lock));
254 }
255
256 /**
257 * __get_link_speed - get a port's speed
258 * @port: the port we're looking at
259 *
260 * Return @port's speed in 802.3ad bitmask format. i.e. one of:
261 * 0,
262 * %AD_LINK_SPEED_BITMASK_10MBPS,
263 * %AD_LINK_SPEED_BITMASK_100MBPS,
264 * %AD_LINK_SPEED_BITMASK_1000MBPS,
265 * %AD_LINK_SPEED_BITMASK_10000MBPS
266 */
267 static u16 __get_link_speed(struct port *port)
268 {
269 struct slave *slave = port->slave;
270 u16 speed;
271
272 /* this if covers only a special case: when the configuration starts
273 * with link down, it sets the speed to 0.
274 * This is done in spite of the fact that the e100 driver reports 0
275 * to be compatible with MVT in the future.
276 */
277 if (slave->link != BOND_LINK_UP)
278 speed = 0;
279 else {
280 switch (slave->speed) {
281 case SPEED_10:
282 speed = AD_LINK_SPEED_BITMASK_10MBPS;
283 break;
284
285 case SPEED_100:
286 speed = AD_LINK_SPEED_BITMASK_100MBPS;
287 break;
288
289 case SPEED_1000:
290 speed = AD_LINK_SPEED_BITMASK_1000MBPS;
291 break;
292
293 case SPEED_10000:
294 speed = AD_LINK_SPEED_BITMASK_10000MBPS;
295 break;
296
297 default:
298 /* unknown speed value from ethtool. shouldn't happen */
299 speed = 0;
300 break;
301 }
302 }
303
304 pr_debug("Port %d Received link speed %d update from adapter\n",
305 port->actor_port_number, speed);
306 return speed;
307 }
308
309 /**
310 * __get_duplex - get a port's duplex
311 * @port: the port we're looking at
312 *
313 * Return @port's duplex in 802.3ad bitmask format. i.e.:
314 * 0x01 if in full duplex
315 * 0x00 otherwise
316 */
317 static u8 __get_duplex(struct port *port)
318 {
319 struct slave *slave = port->slave;
320
321 u8 retval;
322
323 /* handling a special case: when the configuration starts with
324 * link down, it sets the duplex to 0.
325 */
326 if (slave->link != BOND_LINK_UP)
327 retval = 0x0;
328 else {
329 switch (slave->duplex) {
330 case DUPLEX_FULL:
331 retval = 0x1;
332 pr_debug("Port %d Received status full duplex update from adapter\n",
333 port->actor_port_number);
334 break;
335 case DUPLEX_HALF:
336 default:
337 retval = 0x0;
338 pr_debug("Port %d Received status NOT full duplex update from adapter\n",
339 port->actor_port_number);
340 break;
341 }
342 }
343 return retval;
344 }
345
346 /**
347 * __initialize_port_locks - initialize a port's STATE machine spinlock
348 * @port: the slave of the port we're looking at
349 */
350 static inline void __initialize_port_locks(struct slave *slave)
351 {
352 /* make sure it isn't called twice */
353 spin_lock_init(&(SLAVE_AD_INFO(slave).state_machine_lock));
354 }
355
356 /* Conversions */
357
358 /**
359 * __ad_timer_to_ticks - convert a given timer type to AD module ticks
360 * @timer_type: which timer to operate
361 * @par: timer parameter. see below
362 *
363 * If @timer_type is %current_while_timer, @par indicates long/short timer.
364 * If @timer_type is %periodic_timer, @par is one of %FAST_PERIODIC_TIME,
365 * %SLOW_PERIODIC_TIME.
366 */
367 static u16 __ad_timer_to_ticks(u16 timer_type, u16 par)
368 {
369 u16 retval = 0; /* to silence the compiler */
370
371 switch (timer_type) {
372 case AD_CURRENT_WHILE_TIMER: /* for rx machine usage */
373 if (par)
374 retval = (AD_SHORT_TIMEOUT_TIME*ad_ticks_per_sec);
375 else
376 retval = (AD_LONG_TIMEOUT_TIME*ad_ticks_per_sec);
377 break;
378 case AD_ACTOR_CHURN_TIMER: /* for local churn machine */
379 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
380 break;
381 case AD_PERIODIC_TIMER: /* for periodic machine */
382 retval = (par*ad_ticks_per_sec); /* long timeout */
383 break;
384 case AD_PARTNER_CHURN_TIMER: /* for remote churn machine */
385 retval = (AD_CHURN_DETECTION_TIME*ad_ticks_per_sec);
386 break;
387 case AD_WAIT_WHILE_TIMER: /* for selection machine */
388 retval = (AD_AGGREGATE_WAIT_TIME*ad_ticks_per_sec);
389 break;
390 }
391
392 return retval;
393 }
394
395
396 /* ================= ad_rx_machine helper functions ================== */
397
398 /**
399 * __choose_matched - update a port's matched variable from a received lacpdu
400 * @lacpdu: the lacpdu we've received
401 * @port: the port we're looking at
402 *
403 * Update the value of the matched variable, using parameter values from a
404 * newly received lacpdu. Parameter values for the partner carried in the
405 * received PDU are compared with the corresponding operational parameter
406 * values for the actor. Matched is set to TRUE if all of these parameters
407 * match and the PDU parameter partner_state.aggregation has the same value as
408 * actor_oper_port_state.aggregation and lacp will actively maintain the link
409 * in the aggregation. Matched is also set to TRUE if the value of
410 * actor_state.aggregation in the received PDU is set to FALSE, i.e., indicates
411 * an individual link and lacp will actively maintain the link. Otherwise,
412 * matched is set to FALSE. LACP is considered to be actively maintaining the
413 * link if either the PDU's actor_state.lacp_activity variable is TRUE or both
414 * the actor's actor_oper_port_state.lacp_activity and the PDU's
415 * partner_state.lacp_activity variables are TRUE.
416 *
417 * Note: the AD_PORT_MATCHED "variable" is not specified by 802.3ad; it is
418 * used here to implement the language from 802.3ad 43.4.9 that requires
419 * recordPDU to "match" the LACPDU parameters to the stored values.
420 */
421 static void __choose_matched(struct lacpdu *lacpdu, struct port *port)
422 {
423 /* check if all parameters are alike
424 * or this is individual link(aggregation == FALSE)
425 * then update the state machine Matched variable.
426 */
427 if (((ntohs(lacpdu->partner_port) == port->actor_port_number) &&
428 (ntohs(lacpdu->partner_port_priority) == port->actor_port_priority) &&
429 MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) &&
430 (ntohs(lacpdu->partner_system_priority) == port->actor_system_priority) &&
431 (ntohs(lacpdu->partner_key) == port->actor_oper_port_key) &&
432 ((lacpdu->partner_state & AD_STATE_AGGREGATION) == (port->actor_oper_port_state & AD_STATE_AGGREGATION))) ||
433 ((lacpdu->actor_state & AD_STATE_AGGREGATION) == 0)
434 ) {
435 port->sm_vars |= AD_PORT_MATCHED;
436 } else {
437 port->sm_vars &= ~AD_PORT_MATCHED;
438 }
439 }
440
441 /**
442 * __record_pdu - record parameters from a received lacpdu
443 * @lacpdu: the lacpdu we've received
444 * @port: the port we're looking at
445 *
446 * Record the parameter values for the Actor carried in a received lacpdu as
447 * the current partner operational parameter values and sets
448 * actor_oper_port_state.defaulted to FALSE.
449 */
450 static void __record_pdu(struct lacpdu *lacpdu, struct port *port)
451 {
452 if (lacpdu && port) {
453 struct port_params *partner = &port->partner_oper;
454
455 __choose_matched(lacpdu, port);
456 /* record the new parameter values for the partner
457 * operational
458 */
459 partner->port_number = ntohs(lacpdu->actor_port);
460 partner->port_priority = ntohs(lacpdu->actor_port_priority);
461 partner->system = lacpdu->actor_system;
462 partner->system_priority = ntohs(lacpdu->actor_system_priority);
463 partner->key = ntohs(lacpdu->actor_key);
464 partner->port_state = lacpdu->actor_state;
465
466 /* set actor_oper_port_state.defaulted to FALSE */
467 port->actor_oper_port_state &= ~AD_STATE_DEFAULTED;
468
469 /* set the partner sync. to on if the partner is sync,
470 * and the port is matched
471 */
472 if ((port->sm_vars & AD_PORT_MATCHED)
473 && (lacpdu->actor_state & AD_STATE_SYNCHRONIZATION))
474 partner->port_state |= AD_STATE_SYNCHRONIZATION;
475 else
476 partner->port_state &= ~AD_STATE_SYNCHRONIZATION;
477 }
478 }
479
480 /**
481 * __record_default - record default parameters
482 * @port: the port we're looking at
483 *
484 * This function records the default parameter values for the partner carried
485 * in the Partner Admin parameters as the current partner operational parameter
486 * values and sets actor_oper_port_state.defaulted to TRUE.
487 */
488 static void __record_default(struct port *port)
489 {
490 if (port) {
491 /* record the partner admin parameters */
492 memcpy(&port->partner_oper, &port->partner_admin,
493 sizeof(struct port_params));
494
495 /* set actor_oper_port_state.defaulted to true */
496 port->actor_oper_port_state |= AD_STATE_DEFAULTED;
497 }
498 }
499
500 /**
501 * __update_selected - update a port's Selected variable from a received lacpdu
502 * @lacpdu: the lacpdu we've received
503 * @port: the port we're looking at
504 *
505 * Update the value of the selected variable, using parameter values from a
506 * newly received lacpdu. The parameter values for the Actor carried in the
507 * received PDU are compared with the corresponding operational parameter
508 * values for the ports partner. If one or more of the comparisons shows that
509 * the value(s) received in the PDU differ from the current operational values,
510 * then selected is set to FALSE and actor_oper_port_state.synchronization is
511 * set to out_of_sync. Otherwise, selected remains unchanged.
512 */
513 static void __update_selected(struct lacpdu *lacpdu, struct port *port)
514 {
515 if (lacpdu && port) {
516 const struct port_params *partner = &port->partner_oper;
517
518 /* check if any parameter is different then
519 * update the state machine selected variable.
520 */
521 if (ntohs(lacpdu->actor_port) != partner->port_number ||
522 ntohs(lacpdu->actor_port_priority) != partner->port_priority ||
523 !MAC_ADDRESS_EQUAL(&lacpdu->actor_system, &partner->system) ||
524 ntohs(lacpdu->actor_system_priority) != partner->system_priority ||
525 ntohs(lacpdu->actor_key) != partner->key ||
526 (lacpdu->actor_state & AD_STATE_AGGREGATION) != (partner->port_state & AD_STATE_AGGREGATION)) {
527 port->sm_vars &= ~AD_PORT_SELECTED;
528 }
529 }
530 }
531
532 /**
533 * __update_default_selected - update a port's Selected variable from Partner
534 * @port: the port we're looking at
535 *
536 * This function updates the value of the selected variable, using the partner
537 * administrative parameter values. The administrative values are compared with
538 * the corresponding operational parameter values for the partner. If one or
539 * more of the comparisons shows that the administrative value(s) differ from
540 * the current operational values, then Selected is set to FALSE and
541 * actor_oper_port_state.synchronization is set to OUT_OF_SYNC. Otherwise,
542 * Selected remains unchanged.
543 */
544 static void __update_default_selected(struct port *port)
545 {
546 if (port) {
547 const struct port_params *admin = &port->partner_admin;
548 const struct port_params *oper = &port->partner_oper;
549
550 /* check if any parameter is different then
551 * update the state machine selected variable.
552 */
553 if (admin->port_number != oper->port_number ||
554 admin->port_priority != oper->port_priority ||
555 !MAC_ADDRESS_EQUAL(&admin->system, &oper->system) ||
556 admin->system_priority != oper->system_priority ||
557 admin->key != oper->key ||
558 (admin->port_state & AD_STATE_AGGREGATION)
559 != (oper->port_state & AD_STATE_AGGREGATION)) {
560 port->sm_vars &= ~AD_PORT_SELECTED;
561 }
562 }
563 }
564
565 /**
566 * __update_ntt - update a port's ntt variable from a received lacpdu
567 * @lacpdu: the lacpdu we've received
568 * @port: the port we're looking at
569 *
570 * Updates the value of the ntt variable, using parameter values from a newly
571 * received lacpdu. The parameter values for the partner carried in the
572 * received PDU are compared with the corresponding operational parameter
573 * values for the Actor. If one or more of the comparisons shows that the
574 * value(s) received in the PDU differ from the current operational values,
575 * then ntt is set to TRUE. Otherwise, ntt remains unchanged.
576 */
577 static void __update_ntt(struct lacpdu *lacpdu, struct port *port)
578 {
579 /* validate lacpdu and port */
580 if (lacpdu && port) {
581 /* check if any parameter is different then
582 * update the port->ntt.
583 */
584 if ((ntohs(lacpdu->partner_port) != port->actor_port_number) ||
585 (ntohs(lacpdu->partner_port_priority) != port->actor_port_priority) ||
586 !MAC_ADDRESS_EQUAL(&(lacpdu->partner_system), &(port->actor_system)) ||
587 (ntohs(lacpdu->partner_system_priority) != port->actor_system_priority) ||
588 (ntohs(lacpdu->partner_key) != port->actor_oper_port_key) ||
589 ((lacpdu->partner_state & AD_STATE_LACP_ACTIVITY) != (port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY)) ||
590 ((lacpdu->partner_state & AD_STATE_LACP_TIMEOUT) != (port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT)) ||
591 ((lacpdu->partner_state & AD_STATE_SYNCHRONIZATION) != (port->actor_oper_port_state & AD_STATE_SYNCHRONIZATION)) ||
592 ((lacpdu->partner_state & AD_STATE_AGGREGATION) != (port->actor_oper_port_state & AD_STATE_AGGREGATION))
593 ) {
594 port->ntt = true;
595 }
596 }
597 }
598
599 /**
600 * __agg_ports_are_ready - check if all ports in an aggregator are ready
601 * @aggregator: the aggregator we're looking at
602 *
603 */
604 static int __agg_ports_are_ready(struct aggregator *aggregator)
605 {
606 struct port *port;
607 int retval = 1;
608
609 if (aggregator) {
610 /* scan all ports in this aggregator to verfy if they are
611 * all ready.
612 */
613 for (port = aggregator->lag_ports;
614 port;
615 port = port->next_port_in_aggregator) {
616 if (!(port->sm_vars & AD_PORT_READY_N)) {
617 retval = 0;
618 break;
619 }
620 }
621 }
622
623 return retval;
624 }
625
626 /**
627 * __set_agg_ports_ready - set value of Ready bit in all ports of an aggregator
628 * @aggregator: the aggregator we're looking at
629 * @val: Should the ports' ready bit be set on or off
630 *
631 */
632 static void __set_agg_ports_ready(struct aggregator *aggregator, int val)
633 {
634 struct port *port;
635
636 for (port = aggregator->lag_ports; port;
637 port = port->next_port_in_aggregator) {
638 if (val)
639 port->sm_vars |= AD_PORT_READY;
640 else
641 port->sm_vars &= ~AD_PORT_READY;
642 }
643 }
644
645 /**
646 * __get_agg_bandwidth - get the total bandwidth of an aggregator
647 * @aggregator: the aggregator we're looking at
648 *
649 */
650 static u32 __get_agg_bandwidth(struct aggregator *aggregator)
651 {
652 u32 bandwidth = 0;
653
654 if (aggregator->num_of_ports) {
655 switch (__get_link_speed(aggregator->lag_ports)) {
656 case AD_LINK_SPEED_BITMASK_1MBPS:
657 bandwidth = aggregator->num_of_ports;
658 break;
659 case AD_LINK_SPEED_BITMASK_10MBPS:
660 bandwidth = aggregator->num_of_ports * 10;
661 break;
662 case AD_LINK_SPEED_BITMASK_100MBPS:
663 bandwidth = aggregator->num_of_ports * 100;
664 break;
665 case AD_LINK_SPEED_BITMASK_1000MBPS:
666 bandwidth = aggregator->num_of_ports * 1000;
667 break;
668 case AD_LINK_SPEED_BITMASK_10000MBPS:
669 bandwidth = aggregator->num_of_ports * 10000;
670 break;
671 default:
672 bandwidth = 0; /* to silence the compiler */
673 }
674 }
675 return bandwidth;
676 }
677
678 /**
679 * __get_active_agg - get the current active aggregator
680 * @aggregator: the aggregator we're looking at
681 *
682 * Caller must hold RCU lock.
683 */
684 static struct aggregator *__get_active_agg(struct aggregator *aggregator)
685 {
686 struct bonding *bond = aggregator->slave->bond;
687 struct list_head *iter;
688 struct slave *slave;
689
690 bond_for_each_slave_rcu(bond, slave, iter)
691 if (SLAVE_AD_INFO(slave).aggregator.is_active)
692 return &(SLAVE_AD_INFO(slave).aggregator);
693
694 return NULL;
695 }
696
697 /**
698 * __update_lacpdu_from_port - update a port's lacpdu fields
699 * @port: the port we're looking at
700 */
701 static inline void __update_lacpdu_from_port(struct port *port)
702 {
703 struct lacpdu *lacpdu = &port->lacpdu;
704 const struct port_params *partner = &port->partner_oper;
705
706 /* update current actual Actor parameters
707 * lacpdu->subtype initialized
708 * lacpdu->version_number initialized
709 * lacpdu->tlv_type_actor_info initialized
710 * lacpdu->actor_information_length initialized
711 */
712
713 lacpdu->actor_system_priority = htons(port->actor_system_priority);
714 lacpdu->actor_system = port->actor_system;
715 lacpdu->actor_key = htons(port->actor_oper_port_key);
716 lacpdu->actor_port_priority = htons(port->actor_port_priority);
717 lacpdu->actor_port = htons(port->actor_port_number);
718 lacpdu->actor_state = port->actor_oper_port_state;
719
720 /* lacpdu->reserved_3_1 initialized
721 * lacpdu->tlv_type_partner_info initialized
722 * lacpdu->partner_information_length initialized
723 */
724
725 lacpdu->partner_system_priority = htons(partner->system_priority);
726 lacpdu->partner_system = partner->system;
727 lacpdu->partner_key = htons(partner->key);
728 lacpdu->partner_port_priority = htons(partner->port_priority);
729 lacpdu->partner_port = htons(partner->port_number);
730 lacpdu->partner_state = partner->port_state;
731
732 /* lacpdu->reserved_3_2 initialized
733 * lacpdu->tlv_type_collector_info initialized
734 * lacpdu->collector_information_length initialized
735 * collector_max_delay initialized
736 * reserved_12[12] initialized
737 * tlv_type_terminator initialized
738 * terminator_length initialized
739 * reserved_50[50] initialized
740 */
741 }
742
743 /* ================= main 802.3ad protocol code ========================= */
744
745 /**
746 * ad_lacpdu_send - send out a lacpdu packet on a given port
747 * @port: the port we're looking at
748 *
749 * Returns: 0 on success
750 * < 0 on error
751 */
752 static int ad_lacpdu_send(struct port *port)
753 {
754 struct slave *slave = port->slave;
755 struct sk_buff *skb;
756 struct lacpdu_header *lacpdu_header;
757 int length = sizeof(struct lacpdu_header);
758
759 skb = dev_alloc_skb(length);
760 if (!skb)
761 return -ENOMEM;
762
763 skb->dev = slave->dev;
764 skb_reset_mac_header(skb);
765 skb->network_header = skb->mac_header + ETH_HLEN;
766 skb->protocol = PKT_TYPE_LACPDU;
767 skb->priority = TC_PRIO_CONTROL;
768
769 lacpdu_header = (struct lacpdu_header *)skb_put(skb, length);
770
771 memcpy(lacpdu_header->hdr.h_dest, lacpdu_mcast_addr, ETH_ALEN);
772 /* Note: source address is set to be the member's PERMANENT address,
773 * because we use it to identify loopback lacpdus in receive.
774 */
775 memcpy(lacpdu_header->hdr.h_source, slave->perm_hwaddr, ETH_ALEN);
776 lacpdu_header->hdr.h_proto = PKT_TYPE_LACPDU;
777
778 lacpdu_header->lacpdu = port->lacpdu;
779
780 dev_queue_xmit(skb);
781
782 return 0;
783 }
784
785 /**
786 * ad_marker_send - send marker information/response on a given port
787 * @port: the port we're looking at
788 * @marker: marker data to send
789 *
790 * Returns: 0 on success
791 * < 0 on error
792 */
793 static int ad_marker_send(struct port *port, struct bond_marker *marker)
794 {
795 struct slave *slave = port->slave;
796 struct sk_buff *skb;
797 struct bond_marker_header *marker_header;
798 int length = sizeof(struct bond_marker_header);
799
800 skb = dev_alloc_skb(length + 16);
801 if (!skb)
802 return -ENOMEM;
803
804 skb_reserve(skb, 16);
805
806 skb->dev = slave->dev;
807 skb_reset_mac_header(skb);
808 skb->network_header = skb->mac_header + ETH_HLEN;
809 skb->protocol = PKT_TYPE_LACPDU;
810
811 marker_header = (struct bond_marker_header *)skb_put(skb, length);
812
813 memcpy(marker_header->hdr.h_dest, lacpdu_mcast_addr, ETH_ALEN);
814 /* Note: source address is set to be the member's PERMANENT address,
815 * because we use it to identify loopback MARKERs in receive.
816 */
817 memcpy(marker_header->hdr.h_source, slave->perm_hwaddr, ETH_ALEN);
818 marker_header->hdr.h_proto = PKT_TYPE_LACPDU;
819
820 marker_header->marker = *marker;
821
822 dev_queue_xmit(skb);
823
824 return 0;
825 }
826
827 /**
828 * ad_mux_machine - handle a port's mux state machine
829 * @port: the port we're looking at
830 */
831 static void ad_mux_machine(struct port *port)
832 {
833 mux_states_t last_state;
834
835 /* keep current State Machine state to compare later if it was
836 * changed
837 */
838 last_state = port->sm_mux_state;
839
840 if (port->sm_vars & AD_PORT_BEGIN) {
841 port->sm_mux_state = AD_MUX_DETACHED;
842 } else {
843 switch (port->sm_mux_state) {
844 case AD_MUX_DETACHED:
845 if ((port->sm_vars & AD_PORT_SELECTED)
846 || (port->sm_vars & AD_PORT_STANDBY))
847 /* if SELECTED or STANDBY */
848 port->sm_mux_state = AD_MUX_WAITING;
849 break;
850 case AD_MUX_WAITING:
851 /* if SELECTED == FALSE return to DETACH state */
852 if (!(port->sm_vars & AD_PORT_SELECTED)) {
853 port->sm_vars &= ~AD_PORT_READY_N;
854 /* in order to withhold the Selection Logic to
855 * check all ports READY_N value every callback
856 * cycle to update ready variable, we check
857 * READY_N and update READY here
858 */
859 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
860 port->sm_mux_state = AD_MUX_DETACHED;
861 break;
862 }
863
864 /* check if the wait_while_timer expired */
865 if (port->sm_mux_timer_counter
866 && !(--port->sm_mux_timer_counter))
867 port->sm_vars |= AD_PORT_READY_N;
868
869 /* in order to withhold the selection logic to check
870 * all ports READY_N value every callback cycle to
871 * update ready variable, we check READY_N and update
872 * READY here
873 */
874 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
875
876 /* if the wait_while_timer expired, and the port is
877 * in READY state, move to ATTACHED state
878 */
879 if ((port->sm_vars & AD_PORT_READY)
880 && !port->sm_mux_timer_counter)
881 port->sm_mux_state = AD_MUX_ATTACHED;
882 break;
883 case AD_MUX_ATTACHED:
884 /* check also if agg_select_timer expired (so the
885 * edable port will take place only after this timer)
886 */
887 if ((port->sm_vars & AD_PORT_SELECTED) &&
888 (port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION) &&
889 !__check_agg_selection_timer(port)) {
890 port->sm_mux_state = AD_MUX_COLLECTING_DISTRIBUTING;
891 } else if (!(port->sm_vars & AD_PORT_SELECTED) ||
892 (port->sm_vars & AD_PORT_STANDBY)) {
893 /* if UNSELECTED or STANDBY */
894 port->sm_vars &= ~AD_PORT_READY_N;
895 /* in order to withhold the selection logic to
896 * check all ports READY_N value every callback
897 * cycle to update ready variable, we check
898 * READY_N and update READY here
899 */
900 __set_agg_ports_ready(port->aggregator, __agg_ports_are_ready(port->aggregator));
901 port->sm_mux_state = AD_MUX_DETACHED;
902 }
903 break;
904 case AD_MUX_COLLECTING_DISTRIBUTING:
905 if (!(port->sm_vars & AD_PORT_SELECTED) ||
906 (port->sm_vars & AD_PORT_STANDBY) ||
907 !(port->partner_oper.port_state & AD_STATE_SYNCHRONIZATION)) {
908 port->sm_mux_state = AD_MUX_ATTACHED;
909 } else {
910 /* if port state hasn't changed make
911 * sure that a collecting distributing
912 * port in an active aggregator is enabled
913 */
914 if (port->aggregator &&
915 port->aggregator->is_active &&
916 !__port_is_enabled(port)) {
917
918 __enable_port(port);
919 }
920 }
921 break;
922 default:
923 break;
924 }
925 }
926
927 /* check if the state machine was changed */
928 if (port->sm_mux_state != last_state) {
929 pr_debug("Mux Machine: Port=%d, Last State=%d, Curr State=%d\n",
930 port->actor_port_number, last_state,
931 port->sm_mux_state);
932 switch (port->sm_mux_state) {
933 case AD_MUX_DETACHED:
934 port->actor_oper_port_state &= ~AD_STATE_SYNCHRONIZATION;
935 ad_disable_collecting_distributing(port);
936 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
937 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
938 port->ntt = true;
939 break;
940 case AD_MUX_WAITING:
941 port->sm_mux_timer_counter = __ad_timer_to_ticks(AD_WAIT_WHILE_TIMER, 0);
942 break;
943 case AD_MUX_ATTACHED:
944 port->actor_oper_port_state |= AD_STATE_SYNCHRONIZATION;
945 port->actor_oper_port_state &= ~AD_STATE_COLLECTING;
946 port->actor_oper_port_state &= ~AD_STATE_DISTRIBUTING;
947 ad_disable_collecting_distributing(port);
948 port->ntt = true;
949 break;
950 case AD_MUX_COLLECTING_DISTRIBUTING:
951 port->actor_oper_port_state |= AD_STATE_COLLECTING;
952 port->actor_oper_port_state |= AD_STATE_DISTRIBUTING;
953 ad_enable_collecting_distributing(port);
954 port->ntt = true;
955 break;
956 default:
957 break;
958 }
959 }
960 }
961
962 /**
963 * ad_rx_machine - handle a port's rx State Machine
964 * @lacpdu: the lacpdu we've received
965 * @port: the port we're looking at
966 *
967 * If lacpdu arrived, stop previous timer (if exists) and set the next state as
968 * CURRENT. If timer expired set the state machine in the proper state.
969 * In other cases, this function checks if we need to switch to other state.
970 */
971 static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port)
972 {
973 rx_states_t last_state;
974
975 /* keep current State Machine state to compare later if it was
976 * changed
977 */
978 last_state = port->sm_rx_state;
979
980 /* check if state machine should change state */
981
982 /* first, check if port was reinitialized */
983 if (port->sm_vars & AD_PORT_BEGIN)
984 port->sm_rx_state = AD_RX_INITIALIZE;
985 /* check if port is not enabled */
986 else if (!(port->sm_vars & AD_PORT_BEGIN)
987 && !port->is_enabled && !(port->sm_vars & AD_PORT_MOVED))
988 port->sm_rx_state = AD_RX_PORT_DISABLED;
989 /* check if new lacpdu arrived */
990 else if (lacpdu && ((port->sm_rx_state == AD_RX_EXPIRED) ||
991 (port->sm_rx_state == AD_RX_DEFAULTED) ||
992 (port->sm_rx_state == AD_RX_CURRENT))) {
993 port->sm_rx_timer_counter = 0;
994 port->sm_rx_state = AD_RX_CURRENT;
995 } else {
996 /* if timer is on, and if it is expired */
997 if (port->sm_rx_timer_counter &&
998 !(--port->sm_rx_timer_counter)) {
999 switch (port->sm_rx_state) {
1000 case AD_RX_EXPIRED:
1001 port->sm_rx_state = AD_RX_DEFAULTED;
1002 break;
1003 case AD_RX_CURRENT:
1004 port->sm_rx_state = AD_RX_EXPIRED;
1005 break;
1006 default:
1007 break;
1008 }
1009 } else {
1010 /* if no lacpdu arrived and no timer is on */
1011 switch (port->sm_rx_state) {
1012 case AD_RX_PORT_DISABLED:
1013 if (port->sm_vars & AD_PORT_MOVED)
1014 port->sm_rx_state = AD_RX_INITIALIZE;
1015 else if (port->is_enabled
1016 && (port->sm_vars
1017 & AD_PORT_LACP_ENABLED))
1018 port->sm_rx_state = AD_RX_EXPIRED;
1019 else if (port->is_enabled
1020 && ((port->sm_vars
1021 & AD_PORT_LACP_ENABLED) == 0))
1022 port->sm_rx_state = AD_RX_LACP_DISABLED;
1023 break;
1024 default:
1025 break;
1026
1027 }
1028 }
1029 }
1030
1031 /* check if the State machine was changed or new lacpdu arrived */
1032 if ((port->sm_rx_state != last_state) || (lacpdu)) {
1033 pr_debug("Rx Machine: Port=%d, Last State=%d, Curr State=%d\n",
1034 port->actor_port_number, last_state,
1035 port->sm_rx_state);
1036 switch (port->sm_rx_state) {
1037 case AD_RX_INITIALIZE:
1038 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_BITS))
1039 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1040 else
1041 port->sm_vars |= AD_PORT_LACP_ENABLED;
1042 port->sm_vars &= ~AD_PORT_SELECTED;
1043 __record_default(port);
1044 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1045 port->sm_vars &= ~AD_PORT_MOVED;
1046 port->sm_rx_state = AD_RX_PORT_DISABLED;
1047
1048 /* Fall Through */
1049 case AD_RX_PORT_DISABLED:
1050 port->sm_vars &= ~AD_PORT_MATCHED;
1051 break;
1052 case AD_RX_LACP_DISABLED:
1053 port->sm_vars &= ~AD_PORT_SELECTED;
1054 __record_default(port);
1055 port->partner_oper.port_state &= ~AD_STATE_AGGREGATION;
1056 port->sm_vars |= AD_PORT_MATCHED;
1057 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1058 break;
1059 case AD_RX_EXPIRED:
1060 /* Reset of the Synchronization flag (Standard 43.4.12)
1061 * This reset cause to disable this port in the
1062 * COLLECTING_DISTRIBUTING state of the mux machine in
1063 * case of EXPIRED even if LINK_DOWN didn't arrive for
1064 * the port.
1065 */
1066 port->partner_oper.port_state &= ~AD_STATE_SYNCHRONIZATION;
1067 port->sm_vars &= ~AD_PORT_MATCHED;
1068 port->partner_oper.port_state |= AD_STATE_LACP_ACTIVITY;
1069 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT));
1070 port->actor_oper_port_state |= AD_STATE_EXPIRED;
1071 break;
1072 case AD_RX_DEFAULTED:
1073 __update_default_selected(port);
1074 __record_default(port);
1075 port->sm_vars |= AD_PORT_MATCHED;
1076 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1077 break;
1078 case AD_RX_CURRENT:
1079 /* detect loopback situation */
1080 if (MAC_ADDRESS_EQUAL(&(lacpdu->actor_system),
1081 &(port->actor_system))) {
1082 pr_err("%s: An illegal loopback occurred on adapter (%s).\nCheck the configuration to verify that all adapters are connected to 802.3ad compliant switch ports\n",
1083 port->slave->bond->dev->name,
1084 port->slave->dev->name);
1085 return;
1086 }
1087 __update_selected(lacpdu, port);
1088 __update_ntt(lacpdu, port);
1089 __record_pdu(lacpdu, port);
1090 port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(port->actor_oper_port_state & AD_STATE_LACP_TIMEOUT));
1091 port->actor_oper_port_state &= ~AD_STATE_EXPIRED;
1092 break;
1093 default:
1094 break;
1095 }
1096 }
1097 }
1098
1099 /**
1100 * ad_tx_machine - handle a port's tx state machine
1101 * @port: the port we're looking at
1102 */
1103 static void ad_tx_machine(struct port *port)
1104 {
1105 /* check if tx timer expired, to verify that we do not send more than
1106 * 3 packets per second
1107 */
1108 if (port->sm_tx_timer_counter && !(--port->sm_tx_timer_counter)) {
1109 /* check if there is something to send */
1110 if (port->ntt && (port->sm_vars & AD_PORT_LACP_ENABLED)) {
1111 __update_lacpdu_from_port(port);
1112
1113 if (ad_lacpdu_send(port) >= 0) {
1114 pr_debug("Sent LACPDU on port %d\n",
1115 port->actor_port_number);
1116
1117 /* mark ntt as false, so it will not be sent
1118 * again until demanded
1119 */
1120 port->ntt = false;
1121 }
1122 }
1123 /* restart tx timer(to verify that we will not exceed
1124 * AD_MAX_TX_IN_SECOND
1125 */
1126 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1127 }
1128 }
1129
1130 /**
1131 * ad_periodic_machine - handle a port's periodic state machine
1132 * @port: the port we're looking at
1133 *
1134 * Turn ntt flag on priodically to perform periodic transmission of lacpdu's.
1135 */
1136 static void ad_periodic_machine(struct port *port)
1137 {
1138 periodic_states_t last_state;
1139
1140 /* keep current state machine state to compare later if it was changed */
1141 last_state = port->sm_periodic_state;
1142
1143 /* check if port was reinitialized */
1144 if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) ||
1145 (!(port->actor_oper_port_state & AD_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & AD_STATE_LACP_ACTIVITY))
1146 ) {
1147 port->sm_periodic_state = AD_NO_PERIODIC;
1148 }
1149 /* check if state machine should change state */
1150 else if (port->sm_periodic_timer_counter) {
1151 /* check if periodic state machine expired */
1152 if (!(--port->sm_periodic_timer_counter)) {
1153 /* if expired then do tx */
1154 port->sm_periodic_state = AD_PERIODIC_TX;
1155 } else {
1156 /* If not expired, check if there is some new timeout
1157 * parameter from the partner state
1158 */
1159 switch (port->sm_periodic_state) {
1160 case AD_FAST_PERIODIC:
1161 if (!(port->partner_oper.port_state
1162 & AD_STATE_LACP_TIMEOUT))
1163 port->sm_periodic_state = AD_SLOW_PERIODIC;
1164 break;
1165 case AD_SLOW_PERIODIC:
1166 if ((port->partner_oper.port_state & AD_STATE_LACP_TIMEOUT)) {
1167 port->sm_periodic_timer_counter = 0;
1168 port->sm_periodic_state = AD_PERIODIC_TX;
1169 }
1170 break;
1171 default:
1172 break;
1173 }
1174 }
1175 } else {
1176 switch (port->sm_periodic_state) {
1177 case AD_NO_PERIODIC:
1178 port->sm_periodic_state = AD_FAST_PERIODIC;
1179 break;
1180 case AD_PERIODIC_TX:
1181 if (!(port->partner_oper.port_state &
1182 AD_STATE_LACP_TIMEOUT))
1183 port->sm_periodic_state = AD_SLOW_PERIODIC;
1184 else
1185 port->sm_periodic_state = AD_FAST_PERIODIC;
1186 break;
1187 default:
1188 break;
1189 }
1190 }
1191
1192 /* check if the state machine was changed */
1193 if (port->sm_periodic_state != last_state) {
1194 pr_debug("Periodic Machine: Port=%d, Last State=%d, Curr State=%d\n",
1195 port->actor_port_number, last_state,
1196 port->sm_periodic_state);
1197 switch (port->sm_periodic_state) {
1198 case AD_NO_PERIODIC:
1199 port->sm_periodic_timer_counter = 0;
1200 break;
1201 case AD_FAST_PERIODIC:
1202 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1203 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_FAST_PERIODIC_TIME))-1;
1204 break;
1205 case AD_SLOW_PERIODIC:
1206 /* decrement 1 tick we lost in the PERIODIC_TX cycle */
1207 port->sm_periodic_timer_counter = __ad_timer_to_ticks(AD_PERIODIC_TIMER, (u16)(AD_SLOW_PERIODIC_TIME))-1;
1208 break;
1209 case AD_PERIODIC_TX:
1210 port->ntt = true;
1211 break;
1212 default:
1213 break;
1214 }
1215 }
1216 }
1217
1218 /**
1219 * ad_port_selection_logic - select aggregation groups
1220 * @port: the port we're looking at
1221 *
1222 * Select aggregation groups, and assign each port for it's aggregetor. The
1223 * selection logic is called in the inititalization (after all the handshkes),
1224 * and after every lacpdu receive (if selected is off).
1225 */
1226 static void ad_port_selection_logic(struct port *port)
1227 {
1228 struct aggregator *aggregator, *free_aggregator = NULL, *temp_aggregator;
1229 struct port *last_port = NULL, *curr_port;
1230 struct list_head *iter;
1231 struct bonding *bond;
1232 struct slave *slave;
1233 int found = 0;
1234
1235 /* if the port is already Selected, do nothing */
1236 if (port->sm_vars & AD_PORT_SELECTED)
1237 return;
1238
1239 bond = __get_bond_by_port(port);
1240
1241 /* if the port is connected to other aggregator, detach it */
1242 if (port->aggregator) {
1243 /* detach the port from its former aggregator */
1244 temp_aggregator = port->aggregator;
1245 for (curr_port = temp_aggregator->lag_ports; curr_port;
1246 last_port = curr_port,
1247 curr_port = curr_port->next_port_in_aggregator) {
1248 if (curr_port == port) {
1249 temp_aggregator->num_of_ports--;
1250 /* if it is the first port attached to the
1251 * aggregator
1252 */
1253 if (!last_port) {
1254 temp_aggregator->lag_ports =
1255 port->next_port_in_aggregator;
1256 } else {
1257 /* not the first port attached to the
1258 * aggregator
1259 */
1260 last_port->next_port_in_aggregator =
1261 port->next_port_in_aggregator;
1262 }
1263
1264 /* clear the port's relations to this
1265 * aggregator
1266 */
1267 port->aggregator = NULL;
1268 port->next_port_in_aggregator = NULL;
1269 port->actor_port_aggregator_identifier = 0;
1270
1271 pr_debug("Port %d left LAG %d\n",
1272 port->actor_port_number,
1273 temp_aggregator->aggregator_identifier);
1274 /* if the aggregator is empty, clear its
1275 * parameters, and set it ready to be attached
1276 */
1277 if (!temp_aggregator->lag_ports)
1278 ad_clear_agg(temp_aggregator);
1279 break;
1280 }
1281 }
1282 if (!curr_port) {
1283 /* meaning: the port was related to an aggregator
1284 * but was not on the aggregator port list
1285 */
1286 pr_warn("%s: Warning: Port %d (on %s) was related to aggregator %d but was not on its port list\n",
1287 port->slave->bond->dev->name,
1288 port->actor_port_number,
1289 port->slave->dev->name,
1290 port->aggregator->aggregator_identifier);
1291 }
1292 }
1293 /* search on all aggregators for a suitable aggregator for this port */
1294 bond_for_each_slave(bond, slave, iter) {
1295 aggregator = &(SLAVE_AD_INFO(slave).aggregator);
1296
1297 /* keep a free aggregator for later use(if needed) */
1298 if (!aggregator->lag_ports) {
1299 if (!free_aggregator)
1300 free_aggregator = aggregator;
1301 continue;
1302 }
1303 /* check if current aggregator suits us */
1304 if (((aggregator->actor_oper_aggregator_key == port->actor_oper_port_key) && /* if all parameters match AND */
1305 MAC_ADDRESS_EQUAL(&(aggregator->partner_system), &(port->partner_oper.system)) &&
1306 (aggregator->partner_system_priority == port->partner_oper.system_priority) &&
1307 (aggregator->partner_oper_aggregator_key == port->partner_oper.key)
1308 ) &&
1309 ((!MAC_ADDRESS_EQUAL(&(port->partner_oper.system), &(null_mac_addr)) && /* partner answers */
1310 !aggregator->is_individual) /* but is not individual OR */
1311 )
1312 ) {
1313 /* attach to the founded aggregator */
1314 port->aggregator = aggregator;
1315 port->actor_port_aggregator_identifier =
1316 port->aggregator->aggregator_identifier;
1317 port->next_port_in_aggregator = aggregator->lag_ports;
1318 port->aggregator->num_of_ports++;
1319 aggregator->lag_ports = port;
1320 pr_debug("Port %d joined LAG %d(existing LAG)\n",
1321 port->actor_port_number,
1322 port->aggregator->aggregator_identifier);
1323
1324 /* mark this port as selected */
1325 port->sm_vars |= AD_PORT_SELECTED;
1326 found = 1;
1327 break;
1328 }
1329 }
1330
1331 /* the port couldn't find an aggregator - attach it to a new
1332 * aggregator
1333 */
1334 if (!found) {
1335 if (free_aggregator) {
1336 /* assign port a new aggregator */
1337 port->aggregator = free_aggregator;
1338 port->actor_port_aggregator_identifier =
1339 port->aggregator->aggregator_identifier;
1340
1341 /* update the new aggregator's parameters
1342 * if port was responsed from the end-user
1343 */
1344 if (port->actor_oper_port_key & AD_DUPLEX_KEY_BITS)
1345 /* if port is full duplex */
1346 port->aggregator->is_individual = false;
1347 else
1348 port->aggregator->is_individual = true;
1349
1350 port->aggregator->actor_admin_aggregator_key = port->actor_admin_port_key;
1351 port->aggregator->actor_oper_aggregator_key = port->actor_oper_port_key;
1352 port->aggregator->partner_system =
1353 port->partner_oper.system;
1354 port->aggregator->partner_system_priority =
1355 port->partner_oper.system_priority;
1356 port->aggregator->partner_oper_aggregator_key = port->partner_oper.key;
1357 port->aggregator->receive_state = 1;
1358 port->aggregator->transmit_state = 1;
1359 port->aggregator->lag_ports = port;
1360 port->aggregator->num_of_ports++;
1361
1362 /* mark this port as selected */
1363 port->sm_vars |= AD_PORT_SELECTED;
1364
1365 pr_debug("Port %d joined LAG %d(new LAG)\n",
1366 port->actor_port_number,
1367 port->aggregator->aggregator_identifier);
1368 } else {
1369 pr_err("%s: Port %d (on %s) did not find a suitable aggregator\n",
1370 port->slave->bond->dev->name,
1371 port->actor_port_number, port->slave->dev->name);
1372 }
1373 }
1374 /* if all aggregator's ports are READY_N == TRUE, set ready=TRUE
1375 * in all aggregator's ports, else set ready=FALSE in all
1376 * aggregator's ports
1377 */
1378 __set_agg_ports_ready(port->aggregator,
1379 __agg_ports_are_ready(port->aggregator));
1380
1381 aggregator = __get_first_agg(port);
1382 ad_agg_selection_logic(aggregator);
1383 }
1384
1385 /* Decide if "agg" is a better choice for the new active aggregator that
1386 * the current best, according to the ad_select policy.
1387 */
1388 static struct aggregator *ad_agg_selection_test(struct aggregator *best,
1389 struct aggregator *curr)
1390 {
1391 /* 0. If no best, select current.
1392 *
1393 * 1. If the current agg is not individual, and the best is
1394 * individual, select current.
1395 *
1396 * 2. If current agg is individual and the best is not, keep best.
1397 *
1398 * 3. Therefore, current and best are both individual or both not
1399 * individual, so:
1400 *
1401 * 3a. If current agg partner replied, and best agg partner did not,
1402 * select current.
1403 *
1404 * 3b. If current agg partner did not reply and best agg partner
1405 * did reply, keep best.
1406 *
1407 * 4. Therefore, current and best both have partner replies or
1408 * both do not, so perform selection policy:
1409 *
1410 * BOND_AD_COUNT: Select by count of ports. If count is equal,
1411 * select by bandwidth.
1412 *
1413 * BOND_AD_STABLE, BOND_AD_BANDWIDTH: Select by bandwidth.
1414 */
1415 if (!best)
1416 return curr;
1417
1418 if (!curr->is_individual && best->is_individual)
1419 return curr;
1420
1421 if (curr->is_individual && !best->is_individual)
1422 return best;
1423
1424 if (__agg_has_partner(curr) && !__agg_has_partner(best))
1425 return curr;
1426
1427 if (!__agg_has_partner(curr) && __agg_has_partner(best))
1428 return best;
1429
1430 switch (__get_agg_selection_mode(curr->lag_ports)) {
1431 case BOND_AD_COUNT:
1432 if (curr->num_of_ports > best->num_of_ports)
1433 return curr;
1434
1435 if (curr->num_of_ports < best->num_of_ports)
1436 return best;
1437
1438 /*FALLTHROUGH*/
1439 case BOND_AD_STABLE:
1440 case BOND_AD_BANDWIDTH:
1441 if (__get_agg_bandwidth(curr) > __get_agg_bandwidth(best))
1442 return curr;
1443
1444 break;
1445
1446 default:
1447 pr_warn("%s: Impossible agg select mode %d\n",
1448 curr->slave->bond->dev->name,
1449 __get_agg_selection_mode(curr->lag_ports));
1450 break;
1451 }
1452
1453 return best;
1454 }
1455
1456 static int agg_device_up(const struct aggregator *agg)
1457 {
1458 struct port *port = agg->lag_ports;
1459
1460 if (!port)
1461 return 0;
1462
1463 return netif_running(port->slave->dev) &&
1464 netif_carrier_ok(port->slave->dev);
1465 }
1466
1467 /**
1468 * ad_agg_selection_logic - select an aggregation group for a team
1469 * @aggregator: the aggregator we're looking at
1470 *
1471 * It is assumed that only one aggregator may be selected for a team.
1472 *
1473 * The logic of this function is to select the aggregator according to
1474 * the ad_select policy:
1475 *
1476 * BOND_AD_STABLE: select the aggregator with the most ports attached to
1477 * it, and to reselect the active aggregator only if the previous
1478 * aggregator has no more ports related to it.
1479 *
1480 * BOND_AD_BANDWIDTH: select the aggregator with the highest total
1481 * bandwidth, and reselect whenever a link state change takes place or the
1482 * set of slaves in the bond changes.
1483 *
1484 * BOND_AD_COUNT: select the aggregator with largest number of ports
1485 * (slaves), and reselect whenever a link state change takes place or the
1486 * set of slaves in the bond changes.
1487 *
1488 * FIXME: this function MUST be called with the first agg in the bond, or
1489 * __get_active_agg() won't work correctly. This function should be better
1490 * called with the bond itself, and retrieve the first agg from it.
1491 */
1492 static void ad_agg_selection_logic(struct aggregator *agg)
1493 {
1494 struct aggregator *best, *active, *origin;
1495 struct bonding *bond = agg->slave->bond;
1496 struct list_head *iter;
1497 struct slave *slave;
1498 struct port *port;
1499
1500 rcu_read_lock();
1501 origin = agg;
1502 active = __get_active_agg(agg);
1503 best = (active && agg_device_up(active)) ? active : NULL;
1504
1505 bond_for_each_slave_rcu(bond, slave, iter) {
1506 agg = &(SLAVE_AD_INFO(slave).aggregator);
1507
1508 agg->is_active = 0;
1509
1510 if (agg->num_of_ports && agg_device_up(agg))
1511 best = ad_agg_selection_test(best, agg);
1512 }
1513
1514 if (best &&
1515 __get_agg_selection_mode(best->lag_ports) == BOND_AD_STABLE) {
1516 /* For the STABLE policy, don't replace the old active
1517 * aggregator if it's still active (it has an answering
1518 * partner) or if both the best and active don't have an
1519 * answering partner.
1520 */
1521 if (active && active->lag_ports &&
1522 active->lag_ports->is_enabled &&
1523 (__agg_has_partner(active) ||
1524 (!__agg_has_partner(active) &&
1525 !__agg_has_partner(best)))) {
1526 if (!(!active->actor_oper_aggregator_key &&
1527 best->actor_oper_aggregator_key)) {
1528 best = NULL;
1529 active->is_active = 1;
1530 }
1531 }
1532 }
1533
1534 if (best && (best == active)) {
1535 best = NULL;
1536 active->is_active = 1;
1537 }
1538
1539 /* if there is new best aggregator, activate it */
1540 if (best) {
1541 pr_debug("best Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1542 best->aggregator_identifier, best->num_of_ports,
1543 best->actor_oper_aggregator_key,
1544 best->partner_oper_aggregator_key,
1545 best->is_individual, best->is_active);
1546 pr_debug("best ports %p slave %p %s\n",
1547 best->lag_ports, best->slave,
1548 best->slave ? best->slave->dev->name : "NULL");
1549
1550 bond_for_each_slave_rcu(bond, slave, iter) {
1551 agg = &(SLAVE_AD_INFO(slave).aggregator);
1552
1553 pr_debug("Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1554 agg->aggregator_identifier, agg->num_of_ports,
1555 agg->actor_oper_aggregator_key,
1556 agg->partner_oper_aggregator_key,
1557 agg->is_individual, agg->is_active);
1558 }
1559
1560 /* check if any partner replys */
1561 if (best->is_individual) {
1562 pr_warn("%s: Warning: No 802.3ad response from the link partner for any adapters in the bond\n",
1563 best->slave ?
1564 best->slave->bond->dev->name : "NULL");
1565 }
1566
1567 best->is_active = 1;
1568 pr_debug("LAG %d chosen as the active LAG\n",
1569 best->aggregator_identifier);
1570 pr_debug("Agg=%d; P=%d; a k=%d; p k=%d; Ind=%d; Act=%d\n",
1571 best->aggregator_identifier, best->num_of_ports,
1572 best->actor_oper_aggregator_key,
1573 best->partner_oper_aggregator_key,
1574 best->is_individual, best->is_active);
1575
1576 /* disable the ports that were related to the former
1577 * active_aggregator
1578 */
1579 if (active) {
1580 for (port = active->lag_ports; port;
1581 port = port->next_port_in_aggregator) {
1582 __disable_port(port);
1583 }
1584 }
1585 }
1586
1587 /* if the selected aggregator is of join individuals
1588 * (partner_system is NULL), enable their ports
1589 */
1590 active = __get_active_agg(origin);
1591
1592 if (active) {
1593 if (!__agg_has_partner(active)) {
1594 for (port = active->lag_ports; port;
1595 port = port->next_port_in_aggregator) {
1596 __enable_port(port);
1597 }
1598 }
1599 }
1600
1601 rcu_read_unlock();
1602
1603 bond_3ad_set_carrier(bond);
1604 }
1605
1606 /**
1607 * ad_clear_agg - clear a given aggregator's parameters
1608 * @aggregator: the aggregator we're looking at
1609 */
1610 static void ad_clear_agg(struct aggregator *aggregator)
1611 {
1612 if (aggregator) {
1613 aggregator->is_individual = false;
1614 aggregator->actor_admin_aggregator_key = 0;
1615 aggregator->actor_oper_aggregator_key = 0;
1616 aggregator->partner_system = null_mac_addr;
1617 aggregator->partner_system_priority = 0;
1618 aggregator->partner_oper_aggregator_key = 0;
1619 aggregator->receive_state = 0;
1620 aggregator->transmit_state = 0;
1621 aggregator->lag_ports = NULL;
1622 aggregator->is_active = 0;
1623 aggregator->num_of_ports = 0;
1624 pr_debug("LAG %d was cleared\n",
1625 aggregator->aggregator_identifier);
1626 }
1627 }
1628
1629 /**
1630 * ad_initialize_agg - initialize a given aggregator's parameters
1631 * @aggregator: the aggregator we're looking at
1632 */
1633 static void ad_initialize_agg(struct aggregator *aggregator)
1634 {
1635 if (aggregator) {
1636 ad_clear_agg(aggregator);
1637
1638 aggregator->aggregator_mac_address = null_mac_addr;
1639 aggregator->aggregator_identifier = 0;
1640 aggregator->slave = NULL;
1641 }
1642 }
1643
1644 /**
1645 * ad_initialize_port - initialize a given port's parameters
1646 * @aggregator: the aggregator we're looking at
1647 * @lacp_fast: boolean. whether fast periodic should be used
1648 */
1649 static void ad_initialize_port(struct port *port, int lacp_fast)
1650 {
1651 static const struct port_params tmpl = {
1652 .system_priority = 0xffff,
1653 .key = 1,
1654 .port_number = 1,
1655 .port_priority = 0xff,
1656 .port_state = 1,
1657 };
1658 static const struct lacpdu lacpdu = {
1659 .subtype = 0x01,
1660 .version_number = 0x01,
1661 .tlv_type_actor_info = 0x01,
1662 .actor_information_length = 0x14,
1663 .tlv_type_partner_info = 0x02,
1664 .partner_information_length = 0x14,
1665 .tlv_type_collector_info = 0x03,
1666 .collector_information_length = 0x10,
1667 .collector_max_delay = htons(AD_COLLECTOR_MAX_DELAY),
1668 };
1669
1670 if (port) {
1671 port->actor_port_number = 1;
1672 port->actor_port_priority = 0xff;
1673 port->actor_system = null_mac_addr;
1674 port->actor_system_priority = 0xffff;
1675 port->actor_port_aggregator_identifier = 0;
1676 port->ntt = false;
1677 port->actor_admin_port_key = 1;
1678 port->actor_oper_port_key = 1;
1679 port->actor_admin_port_state = AD_STATE_AGGREGATION |
1680 AD_STATE_LACP_ACTIVITY;
1681 port->actor_oper_port_state = AD_STATE_AGGREGATION |
1682 AD_STATE_LACP_ACTIVITY;
1683
1684 if (lacp_fast)
1685 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
1686
1687 memcpy(&port->partner_admin, &tmpl, sizeof(tmpl));
1688 memcpy(&port->partner_oper, &tmpl, sizeof(tmpl));
1689
1690 port->is_enabled = true;
1691 /* private parameters */
1692 port->sm_vars = 0x3;
1693 port->sm_rx_state = 0;
1694 port->sm_rx_timer_counter = 0;
1695 port->sm_periodic_state = 0;
1696 port->sm_periodic_timer_counter = 0;
1697 port->sm_mux_state = 0;
1698 port->sm_mux_timer_counter = 0;
1699 port->sm_tx_state = 0;
1700 port->sm_tx_timer_counter = 0;
1701 port->slave = NULL;
1702 port->aggregator = NULL;
1703 port->next_port_in_aggregator = NULL;
1704 port->transaction_id = 0;
1705
1706 memcpy(&port->lacpdu, &lacpdu, sizeof(lacpdu));
1707 }
1708 }
1709
1710 /**
1711 * ad_enable_collecting_distributing - enable a port's transmit/receive
1712 * @port: the port we're looking at
1713 *
1714 * Enable @port if it's in an active aggregator
1715 */
1716 static void ad_enable_collecting_distributing(struct port *port)
1717 {
1718 if (port->aggregator->is_active) {
1719 pr_debug("Enabling port %d(LAG %d)\n",
1720 port->actor_port_number,
1721 port->aggregator->aggregator_identifier);
1722 __enable_port(port);
1723 }
1724 }
1725
1726 /**
1727 * ad_disable_collecting_distributing - disable a port's transmit/receive
1728 * @port: the port we're looking at
1729 */
1730 static void ad_disable_collecting_distributing(struct port *port)
1731 {
1732 if (port->aggregator &&
1733 !MAC_ADDRESS_EQUAL(&(port->aggregator->partner_system),
1734 &(null_mac_addr))) {
1735 pr_debug("Disabling port %d(LAG %d)\n",
1736 port->actor_port_number,
1737 port->aggregator->aggregator_identifier);
1738 __disable_port(port);
1739 }
1740 }
1741
1742 /**
1743 * ad_marker_info_received - handle receive of a Marker information frame
1744 * @marker_info: Marker info received
1745 * @port: the port we're looking at
1746 */
1747 static void ad_marker_info_received(struct bond_marker *marker_info,
1748 struct port *port)
1749 {
1750 struct bond_marker marker;
1751
1752 /* copy the received marker data to the response marker */
1753 memcpy(&marker, marker_info, sizeof(struct bond_marker));
1754 /* change the marker subtype to marker response */
1755 marker.tlv_type = AD_MARKER_RESPONSE_SUBTYPE;
1756
1757 /* send the marker response */
1758 if (ad_marker_send(port, &marker) >= 0) {
1759 pr_debug("Sent Marker Response on port %d\n",
1760 port->actor_port_number);
1761 }
1762 }
1763
/**
 * ad_marker_response_received - handle receive of a marker response frame
 * @marker: marker PDU received (unused)
 * @port: the port we're looking at (unused)
 *
 * Intentionally a no-op: sending Marker PDUs and handling their responses
 * is not implemented at this stage, only responding to Marker information.
 */
static void ad_marker_response_received(struct bond_marker *marker,
					struct port *port)
{
	/* both parameters are deliberately unused */
	(void)marker;
	(void)port;
	/* DO NOTHING, SINCE WE DECIDED NOT TO IMPLEMENT THIS FEATURE FOR NOW */
}
1780
1781 /* ========= AD exported functions to the main bonding code ========= */
1782
/* Aggregator selection timer, in seconds (scaled by ad_ticks_per_sec when the timer is armed) */
1784 #define AD_AGGREGATOR_SELECTION_TIMER 8
1785
1786 /**
1787 * bond_3ad_initiate_agg_selection - initate aggregator selection
1788 * @bond: bonding struct
1789 *
1790 * Set the aggregation selection timer, to initiate an agg selection in
1791 * the very near future. Called during first initialization, and during
1792 * any down to up transitions of the bond.
1793 */
1794 void bond_3ad_initiate_agg_selection(struct bonding *bond, int timeout)
1795 {
1796 BOND_AD_INFO(bond).agg_select_timer = timeout;
1797 }
1798
1799 /**
1800 * bond_3ad_initialize - initialize a bond's 802.3ad parameters and structures
1801 * @bond: bonding struct to work on
1802 * @tick_resolution: tick duration (millisecond resolution)
1803 *
1804 * Can be called only after the mac address of the bond is set.
1805 */
1806 void bond_3ad_initialize(struct bonding *bond, u16 tick_resolution)
1807 {
1808 /* check that the bond is not initialized yet */
1809 if (!MAC_ADDRESS_EQUAL(&(BOND_AD_INFO(bond).system.sys_mac_addr),
1810 bond->dev->dev_addr)) {
1811
1812 BOND_AD_INFO(bond).aggregator_identifier = 0;
1813
1814 BOND_AD_INFO(bond).system.sys_priority = 0xFFFF;
1815 BOND_AD_INFO(bond).system.sys_mac_addr = *((struct mac_addr *)bond->dev->dev_addr);
1816
1817 /* initialize how many times this module is called in one
1818 * second (should be about every 100ms)
1819 */
1820 ad_ticks_per_sec = tick_resolution;
1821
1822 bond_3ad_initiate_agg_selection(bond,
1823 AD_AGGREGATOR_SELECTION_TIMER *
1824 ad_ticks_per_sec);
1825 }
1826 }
1827
1828 /**
1829 * bond_3ad_bind_slave - initialize a slave's port
1830 * @slave: slave struct to work on
1831 *
1832 * Returns: 0 on success
1833 * < 0 on error
1834 */
1835 void bond_3ad_bind_slave(struct slave *slave)
1836 {
1837 struct bonding *bond = bond_get_bond_by_slave(slave);
1838 struct port *port;
1839 struct aggregator *aggregator;
1840
1841 /* check that the slave has not been initialized yet. */
1842 if (SLAVE_AD_INFO(slave).port.slave != slave) {
1843
1844 /* port initialization */
1845 port = &(SLAVE_AD_INFO(slave).port);
1846
1847 ad_initialize_port(port, bond->params.lacp_fast);
1848
1849 __initialize_port_locks(slave);
1850 port->slave = slave;
1851 port->actor_port_number = SLAVE_AD_INFO(slave).id;
1852 /* key is determined according to the link speed, duplex and user key(which
1853 * is yet not supported)
1854 */
1855 port->actor_admin_port_key = 0;
1856 port->actor_admin_port_key |= __get_duplex(port);
1857 port->actor_admin_port_key |= (__get_link_speed(port) << 1);
1858 port->actor_oper_port_key = port->actor_admin_port_key;
1859 /* if the port is not full duplex, then the port should be not
1860 * lacp Enabled
1861 */
1862 if (!(port->actor_oper_port_key & AD_DUPLEX_KEY_BITS))
1863 port->sm_vars &= ~AD_PORT_LACP_ENABLED;
1864 /* actor system is the bond's system */
1865 port->actor_system = BOND_AD_INFO(bond).system.sys_mac_addr;
1866 /* tx timer(to verify that no more than MAX_TX_IN_SECOND
1867 * lacpdu's are sent in one second)
1868 */
1869 port->sm_tx_timer_counter = ad_ticks_per_sec/AD_MAX_TX_IN_SECOND;
1870 port->aggregator = NULL;
1871 port->next_port_in_aggregator = NULL;
1872
1873 __disable_port(port);
1874
1875 /* aggregator initialization */
1876 aggregator = &(SLAVE_AD_INFO(slave).aggregator);
1877
1878 ad_initialize_agg(aggregator);
1879
1880 aggregator->aggregator_mac_address = *((struct mac_addr *)bond->dev->dev_addr);
1881 aggregator->aggregator_identifier = ++BOND_AD_INFO(bond).aggregator_identifier;
1882 aggregator->slave = slave;
1883 aggregator->is_active = 0;
1884 aggregator->num_of_ports = 0;
1885 }
1886 }
1887
1888 /**
1889 * bond_3ad_unbind_slave - deinitialize a slave's port
1890 * @slave: slave struct to work on
1891 *
1892 * Search for the aggregator that is related to this port, remove the
1893 * aggregator and assign another aggregator for other port related to it
1894 * (if any), and remove the port.
1895 */
1896 void bond_3ad_unbind_slave(struct slave *slave)
1897 {
1898 struct port *port, *prev_port, *temp_port;
1899 struct aggregator *aggregator, *new_aggregator, *temp_aggregator;
1900 int select_new_active_agg = 0;
1901 struct bonding *bond = slave->bond;
1902 struct slave *slave_iter;
1903 struct list_head *iter;
1904
1905 aggregator = &(SLAVE_AD_INFO(slave).aggregator);
1906 port = &(SLAVE_AD_INFO(slave).port);
1907
1908 /* if slave is null, the whole port is not initialized */
1909 if (!port->slave) {
1910 pr_warn("Warning: %s: Trying to unbind an uninitialized port on %s\n",
1911 slave->bond->dev->name, slave->dev->name);
1912 return;
1913 }
1914
1915 pr_debug("Unbinding Link Aggregation Group %d\n",
1916 aggregator->aggregator_identifier);
1917
1918 /* Tell the partner that this port is not suitable for aggregation */
1919 port->actor_oper_port_state &= ~AD_STATE_AGGREGATION;
1920 __update_lacpdu_from_port(port);
1921 ad_lacpdu_send(port);
1922
1923 /* check if this aggregator is occupied */
1924 if (aggregator->lag_ports) {
1925 /* check if there are other ports related to this aggregator
1926 * except the port related to this slave(thats ensure us that
1927 * there is a reason to search for new aggregator, and that we
1928 * will find one
1929 */
1930 if ((aggregator->lag_ports != port) ||
1931 (aggregator->lag_ports->next_port_in_aggregator)) {
1932 /* find new aggregator for the related port(s) */
1933 bond_for_each_slave(bond, slave_iter, iter) {
1934 new_aggregator = &(SLAVE_AD_INFO(slave_iter).aggregator);
1935 /* if the new aggregator is empty, or it is
1936 * connected to our port only
1937 */
1938 if (!new_aggregator->lag_ports ||
1939 ((new_aggregator->lag_ports == port) &&
1940 !new_aggregator->lag_ports->next_port_in_aggregator))
1941 break;
1942 }
1943 if (!slave_iter)
1944 new_aggregator = NULL;
1945
1946 /* if new aggregator found, copy the aggregator's
1947 * parameters and connect the related lag_ports to the
1948 * new aggregator
1949 */
1950 if ((new_aggregator) && ((!new_aggregator->lag_ports) || ((new_aggregator->lag_ports == port) && !new_aggregator->lag_ports->next_port_in_aggregator))) {
1951 pr_debug("Some port(s) related to LAG %d - replaceing with LAG %d\n",
1952 aggregator->aggregator_identifier,
1953 new_aggregator->aggregator_identifier);
1954
1955 if ((new_aggregator->lag_ports == port) &&
1956 new_aggregator->is_active) {
1957 pr_info("%s: Removing an active aggregator\n",
1958 aggregator->slave->bond->dev->name);
1959 select_new_active_agg = 1;
1960 }
1961
1962 new_aggregator->is_individual = aggregator->is_individual;
1963 new_aggregator->actor_admin_aggregator_key = aggregator->actor_admin_aggregator_key;
1964 new_aggregator->actor_oper_aggregator_key = aggregator->actor_oper_aggregator_key;
1965 new_aggregator->partner_system = aggregator->partner_system;
1966 new_aggregator->partner_system_priority = aggregator->partner_system_priority;
1967 new_aggregator->partner_oper_aggregator_key = aggregator->partner_oper_aggregator_key;
1968 new_aggregator->receive_state = aggregator->receive_state;
1969 new_aggregator->transmit_state = aggregator->transmit_state;
1970 new_aggregator->lag_ports = aggregator->lag_ports;
1971 new_aggregator->is_active = aggregator->is_active;
1972 new_aggregator->num_of_ports = aggregator->num_of_ports;
1973
1974 /* update the information that is written on
1975 * the ports about the aggregator
1976 */
1977 for (temp_port = aggregator->lag_ports; temp_port;
1978 temp_port = temp_port->next_port_in_aggregator) {
1979 temp_port->aggregator = new_aggregator;
1980 temp_port->actor_port_aggregator_identifier = new_aggregator->aggregator_identifier;
1981 }
1982
1983 ad_clear_agg(aggregator);
1984
1985 if (select_new_active_agg)
1986 ad_agg_selection_logic(__get_first_agg(port));
1987 } else {
1988 pr_warn("%s: Warning: unbinding aggregator, and could not find a new aggregator for its ports\n",
1989 slave->bond->dev->name);
1990 }
1991 } else {
1992 /* in case that the only port related to this
1993 * aggregator is the one we want to remove
1994 */
1995 select_new_active_agg = aggregator->is_active;
1996 ad_clear_agg(aggregator);
1997 if (select_new_active_agg) {
1998 pr_info("%s: Removing an active aggregator\n",
1999 slave->bond->dev->name);
2000 /* select new active aggregator */
2001 temp_aggregator = __get_first_agg(port);
2002 if (temp_aggregator)
2003 ad_agg_selection_logic(temp_aggregator);
2004 }
2005 }
2006 }
2007
2008 pr_debug("Unbinding port %d\n", port->actor_port_number);
2009
2010 /* find the aggregator that this port is connected to */
2011 bond_for_each_slave(bond, slave_iter, iter) {
2012 temp_aggregator = &(SLAVE_AD_INFO(slave_iter).aggregator);
2013 prev_port = NULL;
2014 /* search the port in the aggregator's related ports */
2015 for (temp_port = temp_aggregator->lag_ports; temp_port;
2016 prev_port = temp_port,
2017 temp_port = temp_port->next_port_in_aggregator) {
2018 if (temp_port == port) {
2019 /* the aggregator found - detach the port from
2020 * this aggregator
2021 */
2022 if (prev_port)
2023 prev_port->next_port_in_aggregator = temp_port->next_port_in_aggregator;
2024 else
2025 temp_aggregator->lag_ports = temp_port->next_port_in_aggregator;
2026 temp_aggregator->num_of_ports--;
2027 if (temp_aggregator->num_of_ports == 0) {
2028 select_new_active_agg = temp_aggregator->is_active;
2029 ad_clear_agg(temp_aggregator);
2030 if (select_new_active_agg) {
2031 pr_info("%s: Removing an active aggregator\n",
2032 slave->bond->dev->name);
2033 /* select new active aggregator */
2034 ad_agg_selection_logic(__get_first_agg(port));
2035 }
2036 }
2037 break;
2038 }
2039 }
2040 }
2041 port->slave = NULL;
2042 }
2043
2044 /**
2045 * bond_3ad_state_machine_handler - handle state machines timeout
2046 * @bond: bonding struct to work on
2047 *
2048 * The state machine handling concept in this module is to check every tick
2049 * which state machine should operate any function. The execution order is
2050 * round robin, so when we have an interaction between state machines, the
2051 * reply of one to each other might be delayed until next tick.
2052 *
2053 * This function also complete the initialization when the agg_select_timer
2054 * times out, and it selects an aggregator for the ports that are yet not
2055 * related to any aggregator, and selects the active aggregator for a bond.
2056 */
2057 void bond_3ad_state_machine_handler(struct work_struct *work)
2058 {
2059 struct bonding *bond = container_of(work, struct bonding,
2060 ad_work.work);
2061 struct aggregator *aggregator;
2062 struct list_head *iter;
2063 struct slave *slave;
2064 struct port *port;
2065 bool should_notify_rtnl = BOND_SLAVE_NOTIFY_LATER;
2066
2067 read_lock(&bond->lock);
2068 rcu_read_lock();
2069
2070 /* check if there are any slaves */
2071 if (!bond_has_slaves(bond))
2072 goto re_arm;
2073
2074 /* check if agg_select_timer timer after initialize is timed out */
2075 if (BOND_AD_INFO(bond).agg_select_timer &&
2076 !(--BOND_AD_INFO(bond).agg_select_timer)) {
2077 slave = bond_first_slave_rcu(bond);
2078 port = slave ? &(SLAVE_AD_INFO(slave).port) : NULL;
2079
2080 /* select the active aggregator for the bond */
2081 if (port) {
2082 if (!port->slave) {
2083 pr_warn("%s: Warning: bond's first port is uninitialized\n",
2084 bond->dev->name);
2085 goto re_arm;
2086 }
2087
2088 aggregator = __get_first_agg(port);
2089 ad_agg_selection_logic(aggregator);
2090 }
2091 bond_3ad_set_carrier(bond);
2092 }
2093
2094 /* for each port run the state machines */
2095 bond_for_each_slave_rcu(bond, slave, iter) {
2096 port = &(SLAVE_AD_INFO(slave).port);
2097 if (!port->slave) {
2098 pr_warn("%s: Warning: Found an uninitialized port\n",
2099 bond->dev->name);
2100 goto re_arm;
2101 }
2102
2103 /* Lock around state machines to protect data accessed
2104 * by all (e.g., port->sm_vars). ad_rx_machine may run
2105 * concurrently due to incoming LACPDU.
2106 */
2107 __get_state_machine_lock(port);
2108
2109 ad_rx_machine(NULL, port);
2110 ad_periodic_machine(port);
2111 ad_port_selection_logic(port);
2112 ad_mux_machine(port);
2113 ad_tx_machine(port);
2114
2115 /* turn off the BEGIN bit, since we already handled it */
2116 if (port->sm_vars & AD_PORT_BEGIN)
2117 port->sm_vars &= ~AD_PORT_BEGIN;
2118
2119 __release_state_machine_lock(port);
2120 }
2121
2122 re_arm:
2123 bond_for_each_slave_rcu(bond, slave, iter) {
2124 if (slave->should_notify) {
2125 should_notify_rtnl = BOND_SLAVE_NOTIFY_NOW;
2126 break;
2127 }
2128 }
2129 rcu_read_unlock();
2130 read_unlock(&bond->lock);
2131
2132 if (should_notify_rtnl && rtnl_trylock()) {
2133 bond_slave_state_notify(bond);
2134 rtnl_unlock();
2135 }
2136 queue_delayed_work(bond->wq, &bond->ad_work, ad_delta_in_ticks);
2137 }
2138
2139 /**
2140 * bond_3ad_rx_indication - handle a received frame
2141 * @lacpdu: received lacpdu
2142 * @slave: slave struct to work on
2143 * @length: length of the data received
2144 *
2145 * It is assumed that frames that were sent on this NIC don't returned as new
2146 * received frames (loopback). Since only the payload is given to this
2147 * function, it check for loopback.
2148 */
2149 static int bond_3ad_rx_indication(struct lacpdu *lacpdu, struct slave *slave,
2150 u16 length)
2151 {
2152 struct port *port;
2153 int ret = RX_HANDLER_ANOTHER;
2154
2155 if (length >= sizeof(struct lacpdu)) {
2156
2157 port = &(SLAVE_AD_INFO(slave).port);
2158
2159 if (!port->slave) {
2160 pr_warn("%s: Warning: port of slave %s is uninitialized\n",
2161 slave->dev->name, slave->bond->dev->name);
2162 return ret;
2163 }
2164
2165 switch (lacpdu->subtype) {
2166 case AD_TYPE_LACPDU:
2167 ret = RX_HANDLER_CONSUMED;
2168 pr_debug("Received LACPDU on port %d\n",
2169 port->actor_port_number);
2170 /* Protect against concurrent state machines */
2171 __get_state_machine_lock(port);
2172 ad_rx_machine(lacpdu, port);
2173 __release_state_machine_lock(port);
2174 break;
2175
2176 case AD_TYPE_MARKER:
2177 ret = RX_HANDLER_CONSUMED;
2178 /* No need to convert fields to Little Endian since we
2179 * don't use the marker's fields.
2180 */
2181
2182 switch (((struct bond_marker *)lacpdu)->tlv_type) {
2183 case AD_MARKER_INFORMATION_SUBTYPE:
2184 pr_debug("Received Marker Information on port %d\n",
2185 port->actor_port_number);
2186 ad_marker_info_received((struct bond_marker *)lacpdu, port);
2187 break;
2188
2189 case AD_MARKER_RESPONSE_SUBTYPE:
2190 pr_debug("Received Marker Response on port %d\n",
2191 port->actor_port_number);
2192 ad_marker_response_received((struct bond_marker *)lacpdu, port);
2193 break;
2194
2195 default:
2196 pr_debug("Received an unknown Marker subtype on slot %d\n",
2197 port->actor_port_number);
2198 }
2199 }
2200 }
2201 return ret;
2202 }
2203
2204 /**
2205 * bond_3ad_adapter_speed_changed - handle a slave's speed change indication
2206 * @slave: slave struct to work on
2207 *
2208 * Handle reselection of aggregator (if needed) for this port.
2209 */
2210 void bond_3ad_adapter_speed_changed(struct slave *slave)
2211 {
2212 struct port *port;
2213
2214 port = &(SLAVE_AD_INFO(slave).port);
2215
2216 /* if slave is null, the whole port is not initialized */
2217 if (!port->slave) {
2218 pr_warn("Warning: %s: speed changed for uninitialized port on %s\n",
2219 slave->bond->dev->name, slave->dev->name);
2220 return;
2221 }
2222
2223 __get_state_machine_lock(port);
2224
2225 port->actor_admin_port_key &= ~AD_SPEED_KEY_BITS;
2226 port->actor_oper_port_key = port->actor_admin_port_key |=
2227 (__get_link_speed(port) << 1);
2228 pr_debug("Port %d changed speed\n", port->actor_port_number);
2229 /* there is no need to reselect a new aggregator, just signal the
2230 * state machines to reinitialize
2231 */
2232 port->sm_vars |= AD_PORT_BEGIN;
2233
2234 __release_state_machine_lock(port);
2235 }
2236
2237 /**
2238 * bond_3ad_adapter_duplex_changed - handle a slave's duplex change indication
2239 * @slave: slave struct to work on
2240 *
2241 * Handle reselection of aggregator (if needed) for this port.
2242 */
2243 void bond_3ad_adapter_duplex_changed(struct slave *slave)
2244 {
2245 struct port *port;
2246
2247 port = &(SLAVE_AD_INFO(slave).port);
2248
2249 /* if slave is null, the whole port is not initialized */
2250 if (!port->slave) {
2251 pr_warn("%s: Warning: duplex changed for uninitialized port on %s\n",
2252 slave->bond->dev->name, slave->dev->name);
2253 return;
2254 }
2255
2256 __get_state_machine_lock(port);
2257
2258 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS;
2259 port->actor_oper_port_key = port->actor_admin_port_key |=
2260 __get_duplex(port);
2261 pr_debug("Port %d changed duplex\n", port->actor_port_number);
2262 /* there is no need to reselect a new aggregator, just signal the
2263 * state machines to reinitialize
2264 */
2265 port->sm_vars |= AD_PORT_BEGIN;
2266
2267 __release_state_machine_lock(port);
2268 }
2269
2270 /**
2271 * bond_3ad_handle_link_change - handle a slave's link status change indication
2272 * @slave: slave struct to work on
2273 * @status: whether the link is now up or down
2274 *
2275 * Handle reselection of aggregator (if needed) for this port.
2276 */
2277 void bond_3ad_handle_link_change(struct slave *slave, char link)
2278 {
2279 struct port *port;
2280
2281 port = &(SLAVE_AD_INFO(slave).port);
2282
2283 /* if slave is null, the whole port is not initialized */
2284 if (!port->slave) {
2285 pr_warn("Warning: %s: link status changed for uninitialized port on %s\n",
2286 slave->bond->dev->name, slave->dev->name);
2287 return;
2288 }
2289
2290 __get_state_machine_lock(port);
2291 /* on link down we are zeroing duplex and speed since
2292 * some of the adaptors(ce1000.lan) report full duplex/speed
2293 * instead of N/A(duplex) / 0(speed).
2294 *
2295 * on link up we are forcing recheck on the duplex and speed since
2296 * some of he adaptors(ce1000.lan) report.
2297 */
2298 if (link == BOND_LINK_UP) {
2299 port->is_enabled = true;
2300 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS;
2301 port->actor_oper_port_key = port->actor_admin_port_key |=
2302 __get_duplex(port);
2303 port->actor_admin_port_key &= ~AD_SPEED_KEY_BITS;
2304 port->actor_oper_port_key = port->actor_admin_port_key |=
2305 (__get_link_speed(port) << 1);
2306 } else {
2307 /* link has failed */
2308 port->is_enabled = false;
2309 port->actor_admin_port_key &= ~AD_DUPLEX_KEY_BITS;
2310 port->actor_oper_port_key = (port->actor_admin_port_key &=
2311 ~AD_SPEED_KEY_BITS);
2312 }
2313 pr_debug("Port %d changed link status to %s",
2314 port->actor_port_number,
2315 (link == BOND_LINK_UP) ? "UP" : "DOWN");
2316 /* there is no need to reselect a new aggregator, just signal the
2317 * state machines to reinitialize
2318 */
2319 port->sm_vars |= AD_PORT_BEGIN;
2320
2321 __release_state_machine_lock(port);
2322 }
2323
2324 /**
2325 * bond_3ad_set_carrier - set link state for bonding master
2326 * @bond - bonding structure
2327 *
2328 * if we have an active aggregator, we're up, if not, we're down.
2329 * Presumes that we cannot have an active aggregator if there are
2330 * no slaves with link up.
2331 *
2332 * This behavior complies with IEEE 802.3 section 43.3.9.
2333 *
2334 * Called by bond_set_carrier(). Return zero if carrier state does not
2335 * change, nonzero if it does.
2336 */
2337 int bond_3ad_set_carrier(struct bonding *bond)
2338 {
2339 struct aggregator *active;
2340 struct slave *first_slave;
2341 int ret = 1;
2342
2343 rcu_read_lock();
2344 first_slave = bond_first_slave_rcu(bond);
2345 if (!first_slave) {
2346 ret = 0;
2347 goto out;
2348 }
2349 active = __get_active_agg(&(SLAVE_AD_INFO(first_slave).aggregator));
2350 if (active) {
2351 /* are enough slaves available to consider link up? */
2352 if (active->num_of_ports < bond->params.min_links) {
2353 if (netif_carrier_ok(bond->dev)) {
2354 netif_carrier_off(bond->dev);
2355 goto out;
2356 }
2357 } else if (!netif_carrier_ok(bond->dev)) {
2358 netif_carrier_on(bond->dev);
2359 goto out;
2360 }
2361 } else if (netif_carrier_ok(bond->dev)) {
2362 netif_carrier_off(bond->dev);
2363 }
2364 out:
2365 rcu_read_unlock();
2366 return ret;
2367 }
2368
2369 /**
2370 * __bond_3ad_get_active_agg_info - get information of the active aggregator
2371 * @bond: bonding struct to work on
2372 * @ad_info: ad_info struct to fill with the bond's info
2373 *
2374 * Returns: 0 on success
2375 * < 0 on error
2376 */
2377 int __bond_3ad_get_active_agg_info(struct bonding *bond,
2378 struct ad_info *ad_info)
2379 {
2380 struct aggregator *aggregator = NULL;
2381 struct list_head *iter;
2382 struct slave *slave;
2383 struct port *port;
2384
2385 bond_for_each_slave_rcu(bond, slave, iter) {
2386 port = &(SLAVE_AD_INFO(slave).port);
2387 if (port->aggregator && port->aggregator->is_active) {
2388 aggregator = port->aggregator;
2389 break;
2390 }
2391 }
2392
2393 if (aggregator) {
2394 ad_info->aggregator_id = aggregator->aggregator_identifier;
2395 ad_info->ports = aggregator->num_of_ports;
2396 ad_info->actor_key = aggregator->actor_oper_aggregator_key;
2397 ad_info->partner_key = aggregator->partner_oper_aggregator_key;
2398 memcpy(ad_info->partner_system,
2399 aggregator->partner_system.mac_addr_value, ETH_ALEN);
2400 return 0;
2401 }
2402
2403 return -1;
2404 }
2405
/* Wrapper that runs __bond_3ad_get_active_agg_info() inside an RCU
 * read-side critical section and passes its result through unchanged.
 */
int bond_3ad_get_active_agg_info(struct bonding *bond, struct ad_info *ad_info)
{
	int err;

	rcu_read_lock();
	err = __bond_3ad_get_active_agg_info(bond, ad_info);
	rcu_read_unlock();

	return err;
}
2417
2418 int bond_3ad_xmit_xor(struct sk_buff *skb, struct net_device *dev)
2419 {
2420 struct bonding *bond = netdev_priv(dev);
2421 struct slave *slave, *first_ok_slave;
2422 struct aggregator *agg;
2423 struct ad_info ad_info;
2424 struct list_head *iter;
2425 int slaves_in_agg;
2426 int slave_agg_no;
2427 int agg_id;
2428
2429 if (__bond_3ad_get_active_agg_info(bond, &ad_info)) {
2430 pr_debug("%s: Error: __bond_3ad_get_active_agg_info failed\n",
2431 dev->name);
2432 goto err_free;
2433 }
2434
2435 slaves_in_agg = ad_info.ports;
2436 agg_id = ad_info.aggregator_id;
2437
2438 if (slaves_in_agg == 0) {
2439 pr_debug("%s: Error: active aggregator is empty\n", dev->name);
2440 goto err_free;
2441 }
2442
2443 slave_agg_no = bond_xmit_hash(bond, skb, slaves_in_agg);
2444 first_ok_slave = NULL;
2445
2446 bond_for_each_slave_rcu(bond, slave, iter) {
2447 agg = SLAVE_AD_INFO(slave).port.aggregator;
2448 if (!agg || agg->aggregator_identifier != agg_id)
2449 continue;
2450
2451 if (slave_agg_no >= 0) {
2452 if (!first_ok_slave && SLAVE_IS_OK(slave))
2453 first_ok_slave = slave;
2454 slave_agg_no--;
2455 continue;
2456 }
2457
2458 if (SLAVE_IS_OK(slave)) {
2459 bond_dev_queue_xmit(bond, skb, slave->dev);
2460 goto out;
2461 }
2462 }
2463
2464 if (slave_agg_no >= 0) {
2465 pr_err("%s: Error: Couldn't find a slave to tx on for aggregator ID %d\n",
2466 dev->name, agg_id);
2467 goto err_free;
2468 }
2469
2470 /* we couldn't find any suitable slave after the agg_no, so use the
2471 * first suitable found, if found.
2472 */
2473 if (first_ok_slave)
2474 bond_dev_queue_xmit(bond, skb, first_ok_slave->dev);
2475 else
2476 goto err_free;
2477
2478 out:
2479 return NETDEV_TX_OK;
2480 err_free:
2481 /* no suitable interface, frame not sent */
2482 kfree_skb(skb);
2483 goto out;
2484 }
2485
2486 int bond_3ad_lacpdu_recv(const struct sk_buff *skb, struct bonding *bond,
2487 struct slave *slave)
2488 {
2489 int ret = RX_HANDLER_ANOTHER;
2490 struct lacpdu *lacpdu, _lacpdu;
2491
2492 if (skb->protocol != PKT_TYPE_LACPDU)
2493 return ret;
2494
2495 lacpdu = skb_header_pointer(skb, 0, sizeof(_lacpdu), &_lacpdu);
2496 if (!lacpdu)
2497 return ret;
2498
2499 read_lock(&bond->lock);
2500 ret = bond_3ad_rx_indication(lacpdu, slave, skb->len);
2501 read_unlock(&bond->lock);
2502 return ret;
2503 }
2504
2505 /**
2506 * bond_3ad_update_lacp_rate - change the lacp rate
2507 * @bond - bonding struct
2508 *
2509 * When modify lacp_rate parameter via sysfs,
2510 * update actor_oper_port_state of each port.
2511 *
2512 * Hold slave->state_machine_lock,
2513 * so we can modify port->actor_oper_port_state,
2514 * no matter bond is up or down.
2515 */
2516 void bond_3ad_update_lacp_rate(struct bonding *bond)
2517 {
2518 struct port *port = NULL;
2519 struct list_head *iter;
2520 struct slave *slave;
2521 int lacp_fast;
2522
2523 lacp_fast = bond->params.lacp_fast;
2524 bond_for_each_slave(bond, slave, iter) {
2525 port = &(SLAVE_AD_INFO(slave).port);
2526 __get_state_machine_lock(port);
2527 if (lacp_fast)
2528 port->actor_oper_port_state |= AD_STATE_LACP_TIMEOUT;
2529 else
2530 port->actor_oper_port_state &= ~AD_STATE_LACP_TIMEOUT;
2531 __release_state_machine_lock(port);
2532 }
2533 }