lists.openwall.net   lists  /  announce  owl-users  owl-dev  john-users  john-dev  passwdqc-users  yescrypt  popa3d-users  /  oss-security  kernel-hardening  musl  sabotage  tlsify  passwords  /  crypt-dev  xvendor  /  Bugtraq  Full-Disclosure  linux-kernel  linux-netdev  linux-ext4  linux-hardening  linux-cve-announce  PHC 
Open Source and information security mailing list archives
 
Hash Suite: Windows password security audit tool. GUI, reports in PDF.
[<prev] [next>] [<thread-prev] [thread-next>] [day] [month] [year] [list]
Message-ID: <367f9bbb-537b-4828-b8c8-cfc9d8ca8c2c@blackwall.org>
Date: Fri, 25 Jul 2025 11:49:00 +0300
From: Nikolay Aleksandrov <razor@...ckwall.org>
To: Hangbin Liu <liuhangbin@...il.com>, netdev@...r.kernel.org
Cc: Jay Vosburgh <jv@...sburgh.net>, Andrew Lunn <andrew+netdev@...n.ch>,
 "David S. Miller" <davem@...emloft.net>, Eric Dumazet <edumazet@...gle.com>,
 Jakub Kicinski <kuba@...nel.org>, Paolo Abeni <pabeni@...hat.com>,
 Simon Horman <horms@...nel.org>, Shuah Khan <shuah@...nel.org>,
 Jonathan Corbet <corbet@....net>, Petr Machata <petrm@...dia.com>,
 Amit Cohen <amcohen@...dia.com>, Vladimir Oltean <vladimir.oltean@....com>,
 Alessandro Zanni <alessandro.zanni87@...il.com>, linux-doc@...r.kernel.org,
 linux-kselftest@...r.kernel.org, linux-kernel@...r.kernel.org
Subject: Re: [PATCH net 1/2] bonding: send LACPDUs periodically in passive
 mode after receiving partner's LACPDU

On 7/25/25 09:28, Hangbin Liu wrote:
> When `lacp_active` is set to `off`, the bond operates in passive mode, meaning
> it only "speaks when spoken to." However, the current kernel implementation
> only sends an LACPDU in response when the partner's state changes.
> 
> As a result, once LACP negotiation succeeds, the actor stops sending LACPDUs
> until the partner times out and sends an "expired" LACPDU. This causes
> continuous LACP state flapping.
> 
> According to IEEE 802.1AX-2014, 6.4.13 Periodic Transmission machine, the
> values of Partner_Oper_Port_State.LACP_Activity and
> Actor_Oper_Port_State.LACP_Activity determine whether periodic transmissions
> take place. If either or both parameters are set to Active LACP, then periodic
> transmissions occur; if both are set to Passive LACP, then periodic
> transmissions do not occur.
> 
> To comply with this, we remove the `!bond->params.lacp_active` check in
> `ad_periodic_machine()`. Instead, we initialize the actor's port's
> `LACP_STATE_LACP_ACTIVITY` state based on `lacp_active` setting.
> 
> Additionally, we avoid setting the partner's state to
> `LACP_STATE_LACP_ACTIVITY` in the EXPIRED state, since we should not assume
> the partner is active by default.
> 
> This ensures that in passive mode, the bond starts sending periodic LACPDUs
> after receiving one from the partner, and avoids flapping due to inactivity.
> 
> Fixes: 1da177e4c3f4 ("Linux-2.6.12-rc2")

Shouldn't the Fixes tag be the lacp_active commit id?
E.g. 3a755cd8b7c6 ("bonding: add new option lacp_active")

> Signed-off-by: Hangbin Liu <liuhangbin@...il.com>
> ---
>  drivers/net/bonding/bond_3ad.c     | 72 ++++++++++++++++++++++--------
>  drivers/net/bonding/bond_options.c |  1 +
>  include/net/bond_3ad.h             |  1 +
>  3 files changed, 56 insertions(+), 18 deletions(-)
> 
> diff --git a/drivers/net/bonding/bond_3ad.c b/drivers/net/bonding/bond_3ad.c
> index 2fca8e84ab10..aa64b397bb19 100644
> --- a/drivers/net/bonding/bond_3ad.c
> +++ b/drivers/net/bonding/bond_3ad.c
> @@ -95,13 +95,13 @@ static int ad_marker_send(struct port *port, struct bond_marker *marker);
>  static void ad_mux_machine(struct port *port, bool *update_slave_arr);
>  static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port);
>  static void ad_tx_machine(struct port *port);
> -static void ad_periodic_machine(struct port *port, struct bond_params *bond_params);
> +static void ad_periodic_machine(struct port *port);
>  static void ad_port_selection_logic(struct port *port, bool *update_slave_arr);
>  static void ad_agg_selection_logic(struct aggregator *aggregator,
>  				   bool *update_slave_arr);
>  static void ad_clear_agg(struct aggregator *aggregator);
>  static void ad_initialize_agg(struct aggregator *aggregator);
> -static void ad_initialize_port(struct port *port, int lacp_fast);
> +static void ad_initialize_port(struct port *port, struct bond_params *bond_params);
>  static void ad_enable_collecting(struct port *port);
>  static void ad_disable_distributing(struct port *port,
>  				    bool *update_slave_arr);
> @@ -1307,10 +1307,16 @@ static void ad_rx_machine(struct lacpdu *lacpdu, struct port *port)
>  			 * case of EXPIRED even if LINK_DOWN didn't arrive for
>  			 * the port.
>  			 */
> -			port->partner_oper.port_state &= ~LACP_STATE_SYNCHRONIZATION;
>  			port->sm_vars &= ~AD_PORT_MATCHED;
> +			/* Based on IEEE 802.1AX-2014, Figure 6-18 - Receive
> +			 * machine state diagram, the state should be
> +			 * Partner_Oper_Port_State.Synchronization = FALSE;
> +			 * Partner_Oper_Port_State.LACP_Timeout = Short Timeout;
> +			 * start current_while_timer(Short Timeout);
> +			 * Actor_Oper_Port_State.Expired = TRUE;
> +			 */
> +			port->partner_oper.port_state &= ~LACP_STATE_SYNCHRONIZATION;
>  			port->partner_oper.port_state |= LACP_STATE_LACP_TIMEOUT;
> -			port->partner_oper.port_state |= LACP_STATE_LACP_ACTIVITY;
>  			port->sm_rx_timer_counter = __ad_timer_to_ticks(AD_CURRENT_WHILE_TIMER, (u16)(AD_SHORT_TIMEOUT));
>  			port->actor_oper_port_state |= LACP_STATE_EXPIRED;
>  			port->sm_vars |= AD_PORT_CHURNED;
> @@ -1417,11 +1423,10 @@ static void ad_tx_machine(struct port *port)
>  /**
>   * ad_periodic_machine - handle a port's periodic state machine
>   * @port: the port we're looking at
> - * @bond_params: bond parameters we will use
>   *
>   * Turn ntt flag on priodically to perform periodic transmission of lacpdu's.
>   */
> -static void ad_periodic_machine(struct port *port, struct bond_params *bond_params)
> +static void ad_periodic_machine(struct port *port)
>  {
>  	periodic_states_t last_state;
>  
> @@ -1430,8 +1435,7 @@ static void ad_periodic_machine(struct port *port, struct bond_params *bond_para
>  
>  	/* check if port was reinitialized */
>  	if (((port->sm_vars & AD_PORT_BEGIN) || !(port->sm_vars & AD_PORT_LACP_ENABLED) || !port->is_enabled) ||
> -	    (!(port->actor_oper_port_state & LACP_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & LACP_STATE_LACP_ACTIVITY)) ||
> -	    !bond_params->lacp_active) {
> +	    (!(port->actor_oper_port_state & LACP_STATE_LACP_ACTIVITY) && !(port->partner_oper.port_state & LACP_STATE_LACP_ACTIVITY))) {
>  		port->sm_periodic_state = AD_NO_PERIODIC;
>  	}
>  	/* check if state machine should change state */
> @@ -1955,16 +1959,16 @@ static void ad_initialize_agg(struct aggregator *aggregator)
>  /**
>   * ad_initialize_port - initialize a given port's parameters
>   * @port: the port we're looking at
> - * @lacp_fast: boolean. whether fast periodic should be used
> + * @bond_params: bond parameters we will use
>   */
> -static void ad_initialize_port(struct port *port, int lacp_fast)
> +static void ad_initialize_port(struct port *port, struct bond_params *bond_params)
>  {
>  	static const struct port_params tmpl = {
>  		.system_priority = 0xffff,
>  		.key             = 1,
>  		.port_number     = 1,
>  		.port_priority   = 0xff,
> -		.port_state      = 1,
> +		.port_state      = 0,

1 == LACP_STATE_LACP_ACTIVITY :)
Just noting that this lets LACP_STATE_LACP_ACTIVITY be set based on lacp_active.

>  	};
>  	static const struct lacpdu lacpdu = {
>  		.subtype		= 0x01,
> @@ -1982,12 +1986,14 @@ static void ad_initialize_port(struct port *port, int lacp_fast)
>  		port->actor_port_priority = 0xff;
>  		port->actor_port_aggregator_identifier = 0;
>  		port->ntt = false;
> -		port->actor_admin_port_state = LACP_STATE_AGGREGATION |
> -					       LACP_STATE_LACP_ACTIVITY;
> -		port->actor_oper_port_state  = LACP_STATE_AGGREGATION |
> -					       LACP_STATE_LACP_ACTIVITY;
> +		port->actor_admin_port_state = LACP_STATE_AGGREGATION;
> +		port->actor_oper_port_state  = LACP_STATE_AGGREGATION;
> +		if (bond_params->lacp_active) {
> +			port->actor_admin_port_state |= LACP_STATE_LACP_ACTIVITY;
> +			port->actor_oper_port_state  |= LACP_STATE_LACP_ACTIVITY;
> +		}
>  
> -		if (lacp_fast)
> +		if (bond_params->lacp_fast)
>  			port->actor_oper_port_state |= LACP_STATE_LACP_TIMEOUT;
>  
>  		memcpy(&port->partner_admin, &tmpl, sizeof(tmpl));
> @@ -2201,7 +2207,7 @@ void bond_3ad_bind_slave(struct slave *slave)
>  		/* port initialization */
>  		port = &(SLAVE_AD_INFO(slave)->port);
>  
> -		ad_initialize_port(port, bond->params.lacp_fast);
> +		ad_initialize_port(port, &bond->params);
>  
>  		port->slave = slave;
>  		port->actor_port_number = SLAVE_AD_INFO(slave)->id;
> @@ -2513,7 +2519,7 @@ void bond_3ad_state_machine_handler(struct work_struct *work)
>  		}
>  
>  		ad_rx_machine(NULL, port);
> -		ad_periodic_machine(port, &bond->params);
> +		ad_periodic_machine(port);
>  		ad_port_selection_logic(port, &update_slave_arr);
>  		ad_mux_machine(port, &update_slave_arr);
>  		ad_tx_machine(port);
> @@ -2883,6 +2889,36 @@ void bond_3ad_update_lacp_rate(struct bonding *bond)
>  	spin_unlock_bh(&bond->mode_lock);
>  }
>  
> +/**
> + * bond_3ad_update_lacp_active - change the lacp active
> + * @bond: bonding struct
> + *
> + * When modify lacp_active parameter via sysfs,
> + * update actor_oper_port_state of each port.

It could also be netlink, right? I'd just say something like:
Update actor_oper_port_state when lacp_active is modified.

> + *
> + * Hold bond->mode_lock,
> + * so we can modify port->actor_oper_port_state,
> + * no matter bond is up or down.

nit: this last part about bond up/down is unnecessary

> + */
> +void bond_3ad_update_lacp_active(struct bonding *bond)
> +{
> +	struct port *port = NULL;
> +	struct list_head *iter;
> +	struct slave *slave;
> +	int lacp_active;
> +
> +	lacp_active = bond->params.lacp_active;
> +	spin_lock_bh(&bond->mode_lock);
> +	bond_for_each_slave(bond, slave, iter) {
> +		port = &(SLAVE_AD_INFO(slave)->port);
> +		if (lacp_active)
> +			port->actor_oper_port_state |= LACP_STATE_LACP_ACTIVITY;
> +		else
> +			port->actor_oper_port_state &= ~LACP_STATE_LACP_ACTIVITY;
> +	}
> +	spin_unlock_bh(&bond->mode_lock);
> +}
> +
>  size_t bond_3ad_stats_size(void)
>  {
>  	return nla_total_size_64bit(sizeof(u64)) + /* BOND_3AD_STAT_LACPDU_RX */
> diff --git a/drivers/net/bonding/bond_options.c b/drivers/net/bonding/bond_options.c
> index 1d639a3be6ba..3b6f815c55ff 100644
> --- a/drivers/net/bonding/bond_options.c
> +++ b/drivers/net/bonding/bond_options.c
> @@ -1660,6 +1660,7 @@ static int bond_option_lacp_active_set(struct bonding *bond,
>  	netdev_dbg(bond->dev, "Setting LACP active to %s (%llu)\n",
>  		   newval->string, newval->value);
>  	bond->params.lacp_active = newval->value;
> +	bond_3ad_update_lacp_active(bond);

To me it looks like this fix needs to be in a separate patch.

>  
>  	return 0;
>  }
> diff --git a/include/net/bond_3ad.h b/include/net/bond_3ad.h
> index 2053cd8e788a..dba369a2cf27 100644
> --- a/include/net/bond_3ad.h
> +++ b/include/net/bond_3ad.h
> @@ -307,6 +307,7 @@ int bond_3ad_lacpdu_recv(const struct sk_buff *skb, struct bonding *bond,
>  			 struct slave *slave);
>  int bond_3ad_set_carrier(struct bonding *bond);
>  void bond_3ad_update_lacp_rate(struct bonding *bond);
> +void bond_3ad_update_lacp_active(struct bonding *bond);
>  void bond_3ad_update_ad_actor_settings(struct bonding *bond);
>  int bond_3ad_stats_fill(struct sk_buff *skb, struct bond_3ad_stats *stats);
>  size_t bond_3ad_stats_size(void);


Powered by blists - more mailing lists

Powered by Openwall GNU/*/Linux Powered by OpenVZ