kernfs: fix xattr race condition with multiple superblocks

author Miklos Szeredi <mszeredi@redhat.com>

Fri, 5 Jun 2026 13:53:16 +0000 (15:53 +0200)

committer Christian Brauner <brauner@kernel.org>

Sat, 6 Jun 2026 13:21:40 +0000 (15:21 +0200)
author Miklos Szeredi <mszeredi@redhat.com>
Fri, 5 Jun 2026 13:53:16 +0000 (15:53 +0200)
committer Christian Brauner <brauner@kernel.org>
Sat, 6 Jun 2026 13:21:40 +0000 (15:21 +0200)
diff --git a/fs/kernfs/file.c b/fs/kernfs/file.c

index 1163aa769738498890cc53ac09ef95d0b06b487e..8e0e90c933720be1a61174d795c41b72d7d77e0b 100644 (file)
--- a/fs/kernfs/file.c
+++ b/fs/kernfs/file.c
@@ -40,22 +40,15 @@ struct kernfs_open_node {
  static DEFINE_SPINLOCK(kernfs_notify_lock);
  static struct kernfs_node *kernfs_notify_list = KERNFS_NOTIFY_EOL;
  
+/* Compatibility wrappers - use the common hashed node lock */
  static inline struct mutex *kernfs_open_file_mutex_ptr(struct kernfs_node *kn)
  {
-       int idx = hash_ptr(kn, NR_KERNFS_LOCK_BITS);
-
-       return &kernfs_locks->open_file_mutex[idx];
+       return kernfs_node_lock_ptr(kn);
  }
  
  static inline struct mutex *kernfs_open_file_mutex_lock(struct kernfs_node *kn)
  {
-       struct mutex *lock;
-
-       lock = kernfs_open_file_mutex_ptr(kn);
-
-       mutex_lock(lock);
-
-       return lock;
+       return kernfs_node_lock(kn);
  }
  
  /**
diff --git a/fs/kernfs/inode.c b/fs/kernfs/inode.c

index 38b28aa7cd023fb891da71d18b3c37798e3ee1b5..e676737d9531a7e031889d2e1559ff9c40f2d5b3 100644 (file)
--- a/fs/kernfs/inode.c
+++ b/fs/kernfs/inode.c
@@ -320,6 +320,15 @@ int kernfs_xattr_set(struct kernfs_node *kn, const char *name,
         if (!attrs)
                 return -ENOMEM;
  
+       /*
+        * Protect xattr modifications with the hashed per-node mutex.
+        * Multiple superblocks (with different namespaces) can share the same
+        * kernfs_node, so inode locking alone is insufficient. The hashed mutex
+        * ensures serialization of concurrent xattr operations on the same node,
+        * including the lazy allocation of the xattrs structure itself.
+        */
+       CLASS(kernfs_node_lock, lock)(kn);
+
         xattrs = simple_xattrs_lazy_alloc(&attrs->xattrs, value, flags);
         if (IS_ERR_OR_NULL(xattrs))
                 return PTR_ERR(xattrs);
@@ -372,6 +381,9 @@ static int kernfs_vfs_user_xattr_set(const struct xattr_handler *handler,
         if (!attrs)
                 return -ENOMEM;
  
+       /* See comment in kernfs_xattr_set() about locking. */
+       CLASS(kernfs_node_lock, lock)(kn);
+
         xattrs = simple_xattrs_lazy_alloc(&attrs->xattrs, value, flags);
         if (IS_ERR_OR_NULL(xattrs))
                 return PTR_ERR(xattrs);
diff --git a/fs/kernfs/kernfs-internal.h b/fs/kernfs/kernfs-internal.h

index 8d8912f50b054de2346dc4bdfc6d63ce8194cae0..1dc6663553d1a572114a632df9e750187cc9e063 100644 (file)
--- a/fs/kernfs/kernfs-internal.h
+++ b/fs/kernfs/kernfs-internal.h
@@ -211,4 +211,24 @@ extern const struct inode_operations kernfs_symlink_iops;
   * kernfs locks
   */
  extern struct kernfs_global_locks *kernfs_locks;
+
+/* Hashed mutex helpers - protect per-node data structures */
+static inline struct mutex *kernfs_node_lock_ptr(struct kernfs_node *kn)
+{
+       int idx = hash_ptr(kn, NR_KERNFS_LOCK_BITS);
+
+       return &kernfs_locks->node_mutex[idx];
+}
+
+static inline struct mutex *kernfs_node_lock(struct kernfs_node *kn)
+{
+       struct mutex *lock = kernfs_node_lock_ptr(kn);
+
+       mutex_lock(lock);
+       return lock;
+}
+
+DEFINE_CLASS(kernfs_node_lock, struct mutex *,
+            mutex_unlock(_T), kernfs_node_lock(kn), struct kernfs_node *kn)
+
  #endif /* __KERNFS_INTERNAL_H */
diff --git a/fs/kernfs/mount.c b/fs/kernfs/mount.c

index 6e3217b6e4811a2d5dce76819c2745b86c873f5a..f183a96778b9a2789a8bf298835c56d3ee288101 100644 (file)
--- a/fs/kernfs/mount.c
+++ b/fs/kernfs/mount.c
@@ -446,7 +446,7 @@ static void __init kernfs_mutex_init(void)
         int count;
  
         for (count = 0; count < NR_KERNFS_LOCKS; count++)
-               mutex_init(&kernfs_locks->open_file_mutex[count]);
+               mutex_init(&kernfs_locks->node_mutex[count]);
  }
  
  static void __init kernfs_lock_init(void)
diff --git a/include/linux/kernfs.h b/include/linux/kernfs.h

index e21b2f7f4159fef9765ee7736855f298a3bc5d92..351a5101c8628771d7c3eb8ce7e48cf334a9ecfc 100644 (file)
--- a/include/linux/kernfs.h
+++ b/include/linux/kernfs.h
@@ -76,20 +76,25 @@ struct kernfs_iattrs;
   * kernfs_open_file.
   *
   * kernfs_open_files are chained at kernfs_open_node->files, which is
- * protected by kernfs_global_locks.open_file_mutex[i].
+ * protected by kernfs_global_locks.node_mutex[i].
   *
   * To reduce possible contention in sysfs access, arising due to single
- * locks, use an array of locks (e.g. open_file_mutex) and use kernfs_node
+ * locks, use an array of locks (e.g. node_mutex) and use kernfs_node
   * object address as hash keys to get the index of these locks.
   *
   * Hashed mutexes are safe to use here because operations using these don't
   * rely on global exclusion.
   *
+ * The hashed mutex array protects per-node data: the kernfs_open_node for
+ * open file management, and kernfs_node xattr operations (necessary because
+ * multiple superblocks with different namespaces can share the same
+ * kernfs_node, making per-inode locking insufficient).
+ *
   * In future we intend to replace other global locks with hashed ones as well.
   * kernfs_global_locks acts as a holder for all such hash tables.
   */
  struct kernfs_global_locks {
-       struct mutex open_file_mutex[NR_KERNFS_LOCKS];
+       struct mutex node_mutex[NR_KERNFS_LOCKS];
  };
  
  enum kernfs_node_type {
author	Miklos Szeredi <mszeredi@redhat.com>
	Fri, 5 Jun 2026 13:53:16 +0000 (15:53 +0200)
committer	Christian Brauner <brauner@kernel.org>
	Sat, 6 Jun 2026 13:21:40 +0000 (15:21 +0200)
fs/kernfs/file.c		patch \| blob \| blame \| history
fs/kernfs/inode.c		patch \| blob \| blame \| history
fs/kernfs/kernfs-internal.h		patch \| blob \| blame \| history
fs/kernfs/mount.c		patch \| blob \| blame \| history
include/linux/kernfs.h		patch \| blob \| blame \| history