rhashtable: drop ht->mutex in rhashtable_free_and_destroy()

author Mikhail Gavrilov <mikhail.v.gavrilov@gmail.com>

Wed, 22 Apr 2026 21:33:49 +0000 (02:33 +0500)

committer Herbert Xu <herbert@gondor.apana.org.au>

Tue, 5 May 2026 08:12:06 +0000 (16:12 +0800)
author Mikhail Gavrilov <mikhail.v.gavrilov@gmail.com>
Wed, 22 Apr 2026 21:33:49 +0000 (02:33 +0500)
committer Herbert Xu <herbert@gondor.apana.org.au>
Tue, 5 May 2026 08:12:06 +0000 (16:12 +0800)
diff --git a/lib/rhashtable.c b/lib/rhashtable.c
index 7a67ef5b67b666afdd638394f895d7732fb5e62e..426d4e381f136482b25f12058e09521b1f694277 100644
--- a/lib/rhashtable.c
+++ b/lib/rhashtable.c
@@ -1166,6 +1166,11 @@ static void rhashtable_free_one(struct rhashtable *ht, struct rhash_head *obj,
   * This function will eventually sleep to wait for an async resize
   * to complete. The caller is responsible that no further write operations
   * occurs in parallel.
+ *
+ * After cancel_work_sync() has returned, the deferred rehash worker is
+ * quiesced and, per the contract above, no other concurrent access to the
+ * rhashtable is possible. The tables are therefore owned exclusively by
+ * this function and can be walked without ht->mutex held.
   */
  void rhashtable_free_and_destroy(struct rhashtable *ht,
                                  void (*free_fn)(void *ptr, void *arg),
@@ -1177,8 +1182,15 @@ void rhashtable_free_and_destroy(struct rhashtable *ht,
         irq_work_sync(&ht->run_irq_work);
         cancel_work_sync(&ht->run_work);
  
-       mutex_lock(&ht->mutex);
-       tbl = rht_dereference(ht->tbl, ht);
+       /*
+        * Do NOT take ht->mutex here. The rehash worker establishes
+        * ht->mutex -> fs_reclaim via GFP_KERNEL bucket allocation under
+        * the mutex; callers on the reclaim path (e.g. simple_xattr_ht_free()
+        * from evict() under the dcache shrinker for shmem/kernfs/pidfs
+        * inodes) would otherwise close a circular dependency
+        * fs_reclaim -> ht->mutex.
+        */
+       tbl = rcu_dereference_raw(ht->tbl);
  restart:
         if (free_fn) {
                 for (i = 0; i < tbl->size; i++) {
@@ -1187,22 +1199,21 @@ restart:
                         cond_resched();
                         for (pos = rht_ptr_exclusive(rht_bucket(tbl, i)),
                              next = !rht_is_a_nulls(pos) ?
-                                       rht_dereference(pos->next, ht) : NULL;
+                                       rcu_dereference_raw(pos->next) : NULL;
                              !rht_is_a_nulls(pos);
                              pos = next,
                              next = !rht_is_a_nulls(pos) ?
-                                       rht_dereference(pos->next, ht) : NULL)
+                                       rcu_dereference_raw(pos->next) : NULL)
                                 rhashtable_free_one(ht, pos, free_fn, arg);
                 }
         }
  
-       next_tbl = rht_dereference(tbl->future_tbl, ht);
+       next_tbl = rcu_dereference_raw(tbl->future_tbl);
         bucket_table_free(tbl);
         if (next_tbl) {
                 tbl = next_tbl;
                 goto restart;
         }
-       mutex_unlock(&ht->mutex);
  }
  EXPORT_SYMBOL_GPL(rhashtable_free_and_destroy);
author	Mikhail Gavrilov <mikhail.v.gavrilov@gmail.com>
	Wed, 22 Apr 2026 21:33:49 +0000 (02:33 +0500)
committer	Herbert Xu <herbert@gondor.apana.org.au>
	Tue, 5 May 2026 08:12:06 +0000 (16:12 +0800)