git.ipfire.org Git - thirdparty/linux.git/commitdiff
net/mlx5: Fix deadlock between devlink lock and esw->wq
authorCosmin Ratiu <cratiu@nvidia.com>
Thu, 5 Mar 2026 08:10:19 +0000 (10:10 +0200)
committerJakub Kicinski <kuba@kernel.org>
Sat, 7 Mar 2026 01:24:28 +0000 (17:24 -0800)
esw->work_queue executes esw_functions_changed_event_handler ->
esw_vfs_changed_event_handler and acquires the devlink lock.

.eswitch_mode_set (acquires devlink lock in devlink_nl_pre_doit) ->
mlx5_devlink_eswitch_mode_set -> mlx5_eswitch_disable_locked ->
mlx5_eswitch_event_handler_unregister -> flush_workqueue deadlocks
when esw_vfs_changed_event_handler executes.

Fix that by no longer flushing the work to avoid the deadlock, and using
a generation counter to keep track of work relevance. This avoids an old
handler manipulating an esw that has undergone one or more mode changes:
- the counter is incremented in mlx5_eswitch_event_handler_unregister.
- the counter is read and passed to the ephemeral mlx5_host_work struct.
- the work handler takes the devlink lock and bails out if the current
  generation is different from the one it was scheduled to operate on.
- mlx5_eswitch_cleanup does the final draining before destroying the wq.

No longer flushing the workqueue has the side effect of maybe no longer
cancelling pending vport_change_handler work items, but that's ok since
those are disabled elsewhere:
- mlx5_eswitch_disable_locked disables the vport eq notifier.
- mlx5_esw_vport_disable disarms the HW EQ notification and marks
  vport->enabled under state_lock to false to prevent pending vport
  handler from doing anything.
- mlx5_eswitch_cleanup destroys the workqueue and makes sure all events
  are disabled/finished.

Fixes: f1bc646c9a06 ("net/mlx5: Use devl_ API in mlx5_esw_offloads_devlink_port_register")
Signed-off-by: Cosmin Ratiu <cratiu@nvidia.com>
Reviewed-by: Moshe Shemesh <moshe@nvidia.com>
Reviewed-by: Dragos Tatulea <dtatulea@nvidia.com>
Reviewed-by: Simon Horman <horms@kernel.org>
Signed-off-by: Tariq Toukan <tariqt@nvidia.com>
Link: https://patch.msgid.link/20260305081019.1811100-1-tariqt@nvidia.com
Signed-off-by: Jakub Kicinski <kuba@kernel.org>
drivers/net/ethernet/mellanox/mlx5/core/eswitch.c
drivers/net/ethernet/mellanox/mlx5/core/eswitch.h
drivers/net/ethernet/mellanox/mlx5/core/eswitch_offloads.c

index d3af87a94a187fd3a4d99e6ed5f2cfcf4690c5b2..123c96716a544de0ea7ac1716043409abb228da7 100644 (file)
@@ -1072,10 +1072,11 @@ static void mlx5_eswitch_event_handler_register(struct mlx5_eswitch *esw)
 
 static void mlx5_eswitch_event_handler_unregister(struct mlx5_eswitch *esw)
 {
-       if (esw->mode == MLX5_ESWITCH_OFFLOADS && mlx5_eswitch_is_funcs_handler(esw->dev))
+       if (esw->mode == MLX5_ESWITCH_OFFLOADS &&
+           mlx5_eswitch_is_funcs_handler(esw->dev)) {
                mlx5_eq_notifier_unregister(esw->dev, &esw->esw_funcs.nb);
-
-       flush_workqueue(esw->work_queue);
+               atomic_inc(&esw->esw_funcs.generation);
+       }
 }
 
 static void mlx5_eswitch_clear_vf_vports_info(struct mlx5_eswitch *esw)
index 6841caef02d10874390dd48d49e07a18c3041227..c2563bee74dfe9ff13ec739103c37bb12681403c 100644 (file)
@@ -335,10 +335,12 @@ struct esw_mc_addr { /* SRIOV only */
 struct mlx5_host_work {
        struct work_struct      work;
        struct mlx5_eswitch     *esw;
+       int                     work_gen;
 };
 
 struct mlx5_esw_functions {
        struct mlx5_nb          nb;
+       atomic_t                generation;
        bool                    host_funcs_disabled;
        u16                     num_vfs;
        u16                     num_ec_vfs;
index 1366f6e489bd2d2f35269d67378a07d27829fc17..8c5e48d001be039855bcb87b2f38a5d6e4994d75 100644 (file)
@@ -3582,22 +3582,28 @@ static void esw_offloads_steering_cleanup(struct mlx5_eswitch *esw)
 }
 
 static void
-esw_vfs_changed_event_handler(struct mlx5_eswitch *esw, const u32 *out)
+esw_vfs_changed_event_handler(struct mlx5_eswitch *esw, int work_gen,
+                             const u32 *out)
 {
        struct devlink *devlink;
        bool host_pf_disabled;
        u16 new_num_vfs;
 
+       devlink = priv_to_devlink(esw->dev);
+       devl_lock(devlink);
+
+       /* Stale work from one or more mode changes ago. Bail out. */
+       if (work_gen != atomic_read(&esw->esw_funcs.generation))
+               goto unlock;
+
        new_num_vfs = MLX5_GET(query_esw_functions_out, out,
                               host_params_context.host_num_of_vfs);
        host_pf_disabled = MLX5_GET(query_esw_functions_out, out,
                                    host_params_context.host_pf_disabled);
 
        if (new_num_vfs == esw->esw_funcs.num_vfs || host_pf_disabled)
-               return;
+               goto unlock;
 
-       devlink = priv_to_devlink(esw->dev);
-       devl_lock(devlink);
        /* Number of VFs can only change from "0 to x" or "x to 0". */
        if (esw->esw_funcs.num_vfs > 0) {
                mlx5_eswitch_unload_vf_vports(esw, esw->esw_funcs.num_vfs);
@@ -3612,6 +3618,7 @@ esw_vfs_changed_event_handler(struct mlx5_eswitch *esw, const u32 *out)
                }
        }
        esw->esw_funcs.num_vfs = new_num_vfs;
+unlock:
        devl_unlock(devlink);
 }
 
@@ -3628,7 +3635,7 @@ static void esw_functions_changed_event_handler(struct work_struct *work)
        if (IS_ERR(out))
                goto out;
 
-       esw_vfs_changed_event_handler(esw, out);
+       esw_vfs_changed_event_handler(esw, host_work->work_gen, out);
        kvfree(out);
 out:
        kfree(host_work);
@@ -3648,6 +3655,7 @@ int mlx5_esw_funcs_changed_handler(struct notifier_block *nb, unsigned long type
        esw = container_of(esw_funcs, struct mlx5_eswitch, esw_funcs);
 
        host_work->esw = esw;
+       host_work->work_gen = atomic_read(&esw_funcs->generation);
 
        INIT_WORK(&host_work->work, esw_functions_changed_event_handler);
        queue_work(esw->work_queue, &host_work->work);