On Mon, Mar 02, 2026 at 06:39:57AM +0100, Linus Lüssing wrote:
> We later want to use the multicast lock when setting the bridge
> interface up or down, to be able to atomically both check all conditions
> to toggle the multicast active state and to subsequently toggle it.
> While most variables we check / contexts we check from are serialized
> (toggled variables through netlink/sysfs) the timer_pending() check is
> not and might run in parallel.
> 
> However so far we are not allowed to spinlock __br_multicast_stop() as
> its call to timer_delete_sync() might sleep. Therefore replacing the
> sleeping variant with the non-sleeping timer_shutdown(). It is sufficient
> to only wait for any timer callback to finish when we are freeing the
> multicast context.
> 
> While the disadvantage of using a non-syncing variant might lead us to
> race and still execute its timer callback just after timer_shutdown() was
> called timer_shutdown() also has the following additional advantage(s):
> It for one thing clears the callback function pointer and by that avoids
> rearming. For another a missing function pointer allows us to detect
> early in the timer callback if we, this timer, were just canceled.
> 
> In other words, this also allows us to make sure that once
> timer_shutdown() was called while we do potentially enter its timer
> callback briefly we never run the main task of this timer. Similar to
> what a timer_delete_sync() would have avoided, too. Except we are not
> waiting/sleeping/syncing in br_multicast_stop() but instead (in rare cases)
> briefly busy-wait/sync a bit later when grabbing the multicast spinlock
> in the timer callback.
> 
> This new check also makes the netif_running() check redundant/obsolete
> in these contexts.
> 
> Signed-off-by: Linus Lüssing <[email protected]>
> ---
>  net/bridge/br_multicast.c | 128 +++++++++++++++++++++++++++-----------
>  net/bridge/br_private.h   |   5 ++
>  net/bridge/br_vlan.c      |   5 ++
>  3 files changed, 100 insertions(+), 38 deletions(-)
> 
> diff --git a/net/bridge/br_multicast.c b/net/bridge/br_multicast.c
> index 881d866d687a..b90f0e149c40 100644
> --- a/net/bridge/br_multicast.c
> +++ b/net/bridge/br_multicast.c
> @@ -1663,6 +1663,14 @@ static void br_multicast_router_expired(struct 
> net_bridge_mcast_port *pmctx,
>       spin_unlock(&br->multicast_lock);
>  }
>  
> +static bool br_multicast_is_stopping(struct net_bridge *br,
> +                                  struct timer_list *timer)

both should be const

> +{
> +     lockdep_assert_held_once(&br->multicast_lock);
> +
> +     return !timer->function;
> +}
> +
>  static void br_ip4_multicast_router_expired(struct timer_list *t)
>  {
>       struct net_bridge_mcast_port *pmctx = timer_container_of(pmctx, t,
> @@ -1698,7 +1706,8 @@ static void br_multicast_local_router_expired(struct 
> net_bridge_mcast *brmctx,
>                                             struct timer_list *timer)
>  {
>       spin_lock(&brmctx->br->multicast_lock);
> -     if (brmctx->multicast_router == MDB_RTR_TYPE_DISABLED ||
> +     if (br_multicast_is_stopping(brmctx->br, timer) ||
> +         brmctx->multicast_router == MDB_RTR_TYPE_DISABLED ||
>           brmctx->multicast_router == MDB_RTR_TYPE_PERM ||
>           br_ip4_multicast_is_router(brmctx) ||
>           br_ip6_multicast_is_router(brmctx))
> @@ -1728,10 +1737,11 @@ static void 
> br_ip6_multicast_local_router_expired(struct timer_list *t)
>  #endif
>  
>  static void br_multicast_querier_expired(struct net_bridge_mcast *brmctx,
> -                                      struct bridge_mcast_own_query *query)
> +                                      struct bridge_mcast_own_query *query,
> +                                      struct timer_list *timer)
>  {
>       spin_lock(&brmctx->br->multicast_lock);
> -     if (!netif_running(brmctx->br->dev) ||
> +     if (br_multicast_is_stopping(brmctx->br, timer) ||
>           br_multicast_ctx_vlan_global_disabled(brmctx) ||
>           !br_opt_get(brmctx->br, BROPT_MULTICAST_ENABLED))
>               goto out;
> @@ -1747,7 +1757,7 @@ static void br_ip4_multicast_querier_expired(struct 
> timer_list *t)
>       struct net_bridge_mcast *brmctx = timer_container_of(brmctx, t,
>                                                            
> ip4_other_query.timer);
>  
> -     br_multicast_querier_expired(brmctx, &brmctx->ip4_own_query);
> +     br_multicast_querier_expired(brmctx, &brmctx->ip4_own_query, t);
>  }
>  
>  #if IS_ENABLED(CONFIG_IPV6)
> @@ -1756,7 +1766,7 @@ static void br_ip6_multicast_querier_expired(struct 
> timer_list *t)
>       struct net_bridge_mcast *brmctx = timer_container_of(brmctx, t,
>                                                            
> ip6_other_query.timer);
>  
> -     br_multicast_querier_expired(brmctx, &brmctx->ip6_own_query);
> +     br_multicast_querier_expired(brmctx, &brmctx->ip6_own_query, t);
>  }
>  #endif
>  
> @@ -4040,10 +4050,12 @@ int br_multicast_rcv(struct net_bridge_mcast **brmctx,
>  }
>  
>  static void br_multicast_query_expired(struct net_bridge_mcast *brmctx,
> -                                    struct bridge_mcast_own_query *query)
> +                                    struct bridge_mcast_own_query *query,
> +                                    struct timer_list *timer)
>  {
>       spin_lock(&brmctx->br->multicast_lock);
> -     if (br_multicast_ctx_vlan_disabled(brmctx))
> +     if (br_multicast_is_stopping(brmctx->br, timer) ||
> +         br_multicast_ctx_vlan_disabled(brmctx))
>               goto out;
>  
>       if (query->startup_sent < brmctx->multicast_startup_query_count)
> @@ -4059,7 +4071,7 @@ static void br_ip4_multicast_query_expired(struct 
> timer_list *t)
>       struct net_bridge_mcast *brmctx = timer_container_of(brmctx, t,
>                                                            
> ip4_own_query.timer);
>  
> -     br_multicast_query_expired(brmctx, &brmctx->ip4_own_query);
> +     br_multicast_query_expired(brmctx, &brmctx->ip4_own_query, t);
>  }
>  
>  #if IS_ENABLED(CONFIG_IPV6)
> @@ -4068,7 +4080,7 @@ static void br_ip6_multicast_query_expired(struct 
> timer_list *t)
>       struct net_bridge_mcast *brmctx = timer_container_of(brmctx, t,
>                                                            
> ip6_own_query.timer);
>  
> -     br_multicast_query_expired(brmctx, &brmctx->ip6_own_query);
> +     br_multicast_query_expired(brmctx, &brmctx->ip6_own_query, t);
>  }
>  #endif
>  
> @@ -4111,29 +4123,30 @@ void br_multicast_ctx_init(struct net_bridge *br,
>       seqcount_spinlock_init(&brmctx->ip6_querier.seq, &br->multicast_lock);
>  #endif
>  
> -     timer_setup(&brmctx->ip4_mc_router_timer,
> -                 br_ip4_multicast_local_router_expired, 0);
> -     timer_setup(&brmctx->ip4_other_query.timer,
> -                 br_ip4_multicast_querier_expired, 0);
> -     timer_setup(&brmctx->ip4_other_query.delay_timer,
> -                 br_multicast_query_delay_expired, 0);
> -     timer_setup(&brmctx->ip4_own_query.timer,
> -                 br_ip4_multicast_query_expired, 0);
> +     timer_setup(&brmctx->ip4_mc_router_timer, NULL, 0);
> +     timer_setup(&brmctx->ip4_other_query.timer, NULL, 0);
> +     timer_setup(&brmctx->ip4_other_query.delay_timer, NULL, 0);
> +     timer_setup(&brmctx->ip4_own_query.timer, NULL, 0);
>  #if IS_ENABLED(CONFIG_IPV6)
> -     timer_setup(&brmctx->ip6_mc_router_timer,
> -                 br_ip6_multicast_local_router_expired, 0);
> -     timer_setup(&brmctx->ip6_other_query.timer,
> -                 br_ip6_multicast_querier_expired, 0);
> -     timer_setup(&brmctx->ip6_other_query.delay_timer,
> -                 br_multicast_query_delay_expired, 0);
> -     timer_setup(&brmctx->ip6_own_query.timer,
> -                 br_ip6_multicast_query_expired, 0);
> +     timer_setup(&brmctx->ip6_mc_router_timer, NULL, 0);
> +     timer_setup(&brmctx->ip6_other_query.timer, NULL, 0);
> +     timer_setup(&brmctx->ip6_other_query.delay_timer, NULL, 0);
> +     timer_setup(&brmctx->ip6_own_query.timer, NULL, 0);
>  #endif
>  }
>  
>  void br_multicast_ctx_deinit(struct net_bridge_mcast *brmctx)
>  {
> -     __br_multicast_stop(brmctx);
> +     timer_shutdown_sync(&brmctx->ip4_mc_router_timer);
> +     timer_shutdown_sync(&brmctx->ip4_other_query.timer);
> +     timer_shutdown_sync(&brmctx->ip4_other_query.delay_timer);
> +     timer_shutdown_sync(&brmctx->ip4_own_query.timer);
> +#if IS_ENABLED(CONFIG_IPV6)
> +     timer_shutdown_sync(&brmctx->ip6_mc_router_timer);
> +     timer_shutdown_sync(&brmctx->ip6_other_query.timer);
> +     timer_shutdown_sync(&brmctx->ip6_other_query.delay_timer);
> +     timer_shutdown_sync(&brmctx->ip6_own_query.timer);
> +#endif
>  }
>  
>  void br_multicast_init(struct net_bridge *br)
> @@ -4213,9 +4226,27 @@ void br_multicast_leave_snoopers(struct net_bridge *br)
>       br_ip6_multicast_leave_snoopers(br);
>  }
>  
> +void br_multicast_reset_timer_cbs(struct net_bridge_mcast *brmctx)
> +{
> +     lockdep_assert_held_once(&brmctx->br->multicast_lock);
> +
> +     brmctx->ip4_mc_router_timer.function = 
> br_ip4_multicast_local_router_expired;
> +     brmctx->ip4_other_query.timer.function = 
> br_ip4_multicast_querier_expired;
> +     brmctx->ip4_other_query.delay_timer.function = 
> br_multicast_query_delay_expired;
> +     brmctx->ip4_own_query.timer.function = br_ip4_multicast_query_expired;
> +#if IS_ENABLED(CONFIG_IPV6)
> +     brmctx->ip6_mc_router_timer.function = 
> br_ip6_multicast_local_router_expired;
> +     brmctx->ip6_other_query.timer.function = 
> br_ip6_multicast_querier_expired;
> +     brmctx->ip6_other_query.delay_timer.function = 
> br_multicast_query_delay_expired;
> +     brmctx->ip6_own_query.timer.function = br_ip6_multicast_query_expired;
> +#endif
> +}
> +
>  static void __br_multicast_open_query(struct net_bridge *br,
>                                     struct bridge_mcast_own_query *query)
>  {
> +     lockdep_assert_held_once(&br->multicast_lock);
> +
>       query->startup_sent = 0;
>  
>       if (!br_opt_get(br, BROPT_MULTICAST_ENABLED))
> @@ -4226,13 +4257,15 @@ static void __br_multicast_open_query(struct 
> net_bridge *br,
>  
>  static void __br_multicast_open(struct net_bridge_mcast *brmctx)
>  {
> +     br_multicast_reset_timer_cbs(brmctx);
> +
>       __br_multicast_open_query(brmctx->br, &brmctx->ip4_own_query);
>  #if IS_ENABLED(CONFIG_IPV6)
>       __br_multicast_open_query(brmctx->br, &brmctx->ip6_own_query);
>  #endif
>  }
>  
> -void br_multicast_open(struct net_bridge *br)
> +static void br_multicast_open_locked(struct net_bridge *br)
>  {
>       ASSERT_RTNL();
>  
> @@ -4256,17 +4289,26 @@ void br_multicast_open(struct net_bridge *br)
>       }
>  }
>  
> +void br_multicast_open(struct net_bridge *br)
> +{
> +     spin_lock_bh(&br->multicast_lock);
> +     br_multicast_open_locked(br);
> +     spin_unlock_bh(&br->multicast_lock);
> +}
> +
>  static void __br_multicast_stop(struct net_bridge_mcast *brmctx)
>  {
> -     timer_delete_sync(&brmctx->ip4_mc_router_timer);
> -     timer_delete_sync(&brmctx->ip4_other_query.timer);
> -     timer_delete_sync(&brmctx->ip4_other_query.delay_timer);
> -     timer_delete_sync(&brmctx->ip4_own_query.timer);
> +     lockdep_assert_held_once(&brmctx->br->multicast_lock);
> +
> +     timer_shutdown(&brmctx->ip4_mc_router_timer);
> +     timer_shutdown(&brmctx->ip4_other_query.timer);
> +     timer_shutdown(&brmctx->ip4_other_query.delay_timer);
> +     timer_shutdown(&brmctx->ip4_own_query.timer);
>  #if IS_ENABLED(CONFIG_IPV6)
> -     timer_delete_sync(&brmctx->ip6_mc_router_timer);
> -     timer_delete_sync(&brmctx->ip6_other_query.timer);
> -     timer_delete_sync(&brmctx->ip6_other_query.delay_timer);
> -     timer_delete_sync(&brmctx->ip6_own_query.timer);
> +     timer_shutdown(&brmctx->ip6_mc_router_timer);
> +     timer_shutdown(&brmctx->ip6_other_query.timer);
> +     timer_shutdown(&brmctx->ip6_other_query.delay_timer);
> +     timer_shutdown(&brmctx->ip6_own_query.timer);
>  #endif
>  }
>  
> @@ -4317,12 +4359,12 @@ void br_multicast_toggle_one_vlan(struct 
> net_bridge_vlan *vlan, bool on)
>  
>               spin_lock_bh(&br->multicast_lock);
>               vlan->priv_flags ^= BR_VLFLAG_MCAST_ENABLED;
> -             spin_unlock_bh(&br->multicast_lock);
>  
>               if (on)
>                       __br_multicast_open(&vlan->br_mcast_ctx);
>               else
>                       __br_multicast_stop(&vlan->br_mcast_ctx);
> +             spin_unlock_bh(&br->multicast_lock);
>       } else {
>               struct net_bridge_mcast *brmctx;
>  
> @@ -4380,6 +4422,7 @@ int br_multicast_toggle_vlan_snooping(struct net_bridge 
> *br, bool on,
>       if (!vg)
>               return 0;
>  
> +     spin_lock_bh(&br->multicast_lock);
>       br_opt_toggle(br, BROPT_MCAST_VLAN_SNOOPING_ENABLED, on);
>  
>       /* disable/enable non-vlan mcast contexts based on vlan snooping */
> @@ -4387,6 +4430,8 @@ int br_multicast_toggle_vlan_snooping(struct net_bridge 
> *br, bool on,
>               __br_multicast_stop(&br->multicast_ctx);
>       else
>               __br_multicast_open(&br->multicast_ctx);
> +     spin_unlock_bh(&br->multicast_lock);
> +
>       list_for_each_entry(p, &br->port_list, list) {
>               if (on)
>                       br_multicast_disable_port_ctx(&p->multicast_ctx);
> @@ -4416,7 +4461,7 @@ bool br_multicast_toggle_global_vlan(struct 
> net_bridge_vlan *vlan, bool on)
>       return true;
>  }
>  
> -void br_multicast_stop(struct net_bridge *br)
> +static void br_multicast_stop_locked(struct net_bridge *br)
>  {
>       ASSERT_RTNL();
>  
> @@ -4440,6 +4485,13 @@ void br_multicast_stop(struct net_bridge *br)
>       }
>  }
>  
> +void br_multicast_stop(struct net_bridge *br)
> +{
> +     spin_lock_bh(&br->multicast_lock);
> +     br_multicast_stop_locked(br);
> +     spin_unlock_bh(&br->multicast_lock);
> +}
> +
>  void br_multicast_dev_del(struct net_bridge *br)
>  {
>       struct net_bridge_mdb_entry *mp;
> @@ -4675,7 +4727,7 @@ int br_multicast_toggle(struct net_bridge *br, unsigned 
> long val,
>       if (!netif_running(br->dev))
>               goto unlock;
>  
> -     br_multicast_open(br);
> +     br_multicast_open_locked(br);
>       list_for_each_entry(port, &br->port_list, list)
>               __br_multicast_enable_port_ctx(&port->multicast_ctx);
>  
> diff --git a/net/bridge/br_private.h b/net/bridge/br_private.h
> index 4ab6a1f58116..a181a27aa559 100644
> --- a/net/bridge/br_private.h
> +++ b/net/bridge/br_private.h
> @@ -976,6 +976,7 @@ void br_multicast_disable_port(struct net_bridge_port 
> *port);
>  void br_multicast_init(struct net_bridge *br);
>  void br_multicast_join_snoopers(struct net_bridge *br);
>  void br_multicast_leave_snoopers(struct net_bridge *br);
> +void br_multicast_reset_timer_cbs(struct net_bridge_mcast *brmctx);
>  void br_multicast_open(struct net_bridge *br);
>  void br_multicast_stop(struct net_bridge *br);
>  void br_multicast_dev_del(struct net_bridge *br);
> @@ -1416,6 +1417,10 @@ static inline void br_multicast_leave_snoopers(struct 
> net_bridge *br)
>  {
>  }
>  
> +static inline void br_multicast_reset_timer_cbs(struct net_bridge_mcast 
> *brmctx)
> +{
> +}
> +
>  static inline void br_multicast_open(struct net_bridge *br)
>  {
>  }
> diff --git a/net/bridge/br_vlan.c b/net/bridge/br_vlan.c
> index 326933b455b3..3facb4eda306 100644
> --- a/net/bridge/br_vlan.c
> +++ b/net/bridge/br_vlan.c
> @@ -325,7 +325,12 @@ static int __vlan_add(struct net_bridge_vlan *v, u16 
> flags,
>                       if (err && err != -EOPNOTSUPP)
>                               goto out;
>               }
> +

extra new line

>               br_multicast_ctx_init(br, v, &v->br_mcast_ctx);
> +
> +             spin_lock_bh(&br->multicast_lock);
> +             br_multicast_reset_timer_cbs(&v->br_mcast_ctx);
> +             spin_unlock_bh(&br->multicast_lock);

Have you tested this without bridge IGMP_SNOOPING defined?
I don't think it will compile.

Also, please avoid spilling multicast lock outside of mcast code. In fact
why don't you move this in br_multicast_ctx_init?

>               v->priv_flags |= BR_VLFLAG_GLOBAL_MCAST_ENABLED;
>       }
>  
> -- 
> 2.51.0
> 

Reply via email to