btrfs: enable experimental bs > ps support

author Qu Wenruo <wqu@suse.com>

Tue, 9 Sep 2025 03:08:47 +0000 (12:38 +0930)

committer David Sterba <dsterba@suse.com>

Tue, 23 Sep 2025 06:49:25 +0000 (08:49 +0200)
author Qu Wenruo <wqu@suse.com>
Tue, 9 Sep 2025 03:08:47 +0000 (12:38 +0930)
committer David Sterba <dsterba@suse.com>
Tue, 23 Sep 2025 06:49:25 +0000 (08:49 +0200)
diff --git a/fs/btrfs/direct-io.c b/fs/btrfs/direct-io.c

index fe9a4bd7e6e6831b61b7b8f9f4242363e492b2fa..802d4dbe5b381763979f8da7f16ddc9034cd72bd 100644 (file)
--- a/fs/btrfs/direct-io.c
+++ b/fs/btrfs/direct-io.c
@@ -786,6 +786,18 @@ static ssize_t check_direct_IO(struct btrfs_fs_info *fs_info,
         if (iov_iter_alignment(iter) & blocksize_mask)
                 return -EINVAL;
  
+       /*
+        * For bs > ps support, we heavily rely on large folios to make sure no
+        * block will cross large folio boundaries.
+        *
+        * But memory provided by direct IO is only virtually contiguous, not
+        * physically contiguous, which breaks btrfs' large folio requirement.
+        *
+        * So for bs > ps support, all direct IOs should fall back to buffered ones.
+        */
+       if (fs_info->sectorsize > PAGE_SIZE)
+               return -EINVAL;
+
         return 0;
  }
  
diff --git a/fs/btrfs/disk-io.c b/fs/btrfs/disk-io.c

index 5c57f523f4498d2a345c6721b5c47b2aa16c025a..0aee3239518d7694888188aa628b07f6f4bece97 100644 (file)
--- a/fs/btrfs/disk-io.c
+++ b/fs/btrfs/disk-io.c
@@ -3242,18 +3242,24 @@ int btrfs_check_features(struct btrfs_fs_info *fs_info, bool is_rw_mount)
         }
  
         /*
-        * Subpage runtime limitation on v1 cache.
+        * Subpage/bs > ps runtime limitation on v1 cache.
          *
          * V1 space cache still has some hard coded PAGE_SIZE usage, while
          * we're already defaulting to v2 cache, no need to bother v1 as it's
          * going to be deprecated anyway.
          */
-       if (fs_info->sectorsize < PAGE_SIZE && btrfs_test_opt(fs_info, SPACE_CACHE)) {
+       if (fs_info->sectorsize != PAGE_SIZE && btrfs_test_opt(fs_info, SPACE_CACHE)) {
                 btrfs_warn(fs_info,
         "v1 space cache is not supported for page size %lu with sectorsize %u",
                            PAGE_SIZE, fs_info->sectorsize);
                 return -EINVAL;
         }
+       if (fs_info->sectorsize > PAGE_SIZE && btrfs_fs_incompat(fs_info, RAID56)) {
+               btrfs_err(fs_info,
+               "RAID56 is not supported for page size %lu with sectorsize %u",
+                         PAGE_SIZE, fs_info->sectorsize);
+               return -EINVAL;
+       }
  
         /* This can be called by remount, we need to protect the super block. */
         spin_lock(&fs_info->super_lock);
@@ -3388,6 +3394,10 @@ int __cold open_ctree(struct super_block *sb, struct btrfs_fs_devices *fs_device
         fs_info->stripesize = stripesize;
         fs_info->fs_devices->fs_info = fs_info;
  
+       if (fs_info->sectorsize > PAGE_SIZE)
+               btrfs_warn(fs_info,
+                          "support for block size %u with page size %lu is experimental, some features may be missing",
+                          fs_info->sectorsize, PAGE_SIZE);
         /*
          * Handle the space caching options appropriately now that we have the
          * super block loaded and validated.
diff --git a/fs/btrfs/fs.c b/fs/btrfs/fs.c

index 29ad1c8591944b21776b02875c6ac9d471214ad4..feb0a2faa8379b448ba2805ea9d8f6ca9799166b 100644 (file)
--- a/fs/btrfs/fs.c
+++ b/fs/btrfs/fs.c
@@ -97,8 +97,7 @@ bool __attribute_const__ btrfs_supported_blocksize(u32 blocksize)
          */
         if (IS_ENABLED(CONFIG_HIGHMEM) && blocksize > PAGE_SIZE)
                 return false;
-       if (blocksize <= PAGE_SIZE)
-               return true;
+       return true;
  #endif
         return false;
  }
diff --git a/fs/btrfs/ioctl.c b/fs/btrfs/ioctl.c

index 063291519b363b95730b6dc52c66f80e998b9ed2..0e9e2b99939232b7c9547041969a5856531ab06b 100644 (file)
--- a/fs/btrfs/ioctl.c
+++ b/fs/btrfs/ioctl.c
@@ -4418,6 +4418,10 @@ static int btrfs_ioctl_encoded_read(struct file *file, void __user *argp,
                 goto out_acct;
         }
  
+       if (fs_info->sectorsize > PAGE_SIZE) {
+               ret = -ENOTTY;
+               goto out_acct;
+       }
         if (compat) {
  #if defined(CONFIG_64BIT) && defined(CONFIG_COMPAT)
                 struct btrfs_ioctl_encoded_io_args_32 args32;
@@ -4509,6 +4513,7 @@ out_acct:
  
  static int btrfs_ioctl_encoded_write(struct file *file, void __user *argp, bool compat)
  {
+       struct btrfs_fs_info *fs_info = inode_to_fs_info(file->f_inode);
         struct btrfs_ioctl_encoded_io_args args;
         struct iovec iovstack[UIO_FASTIOV];
         struct iovec *iov = iovstack;
@@ -4522,6 +4527,11 @@ static int btrfs_ioctl_encoded_write(struct file *file, void __user *argp, bool
                 goto out_acct;
         }
  
+       if (fs_info->sectorsize > PAGE_SIZE) {
+               ret = -ENOTTY;
+               goto out_acct;
+       }
+
         if (!(file->f_mode & FMODE_WRITE)) {
                 ret = -EBADF;
                 goto out_acct;
@@ -4780,14 +4790,14 @@ out_fail:
  
  static int btrfs_uring_encoded_read(struct io_uring_cmd *cmd, unsigned int issue_flags)
  {
+       struct file *file = cmd->file;
+       struct btrfs_inode *inode = BTRFS_I(file->f_inode);
+       struct extent_io_tree *io_tree = &inode->io_tree;
+       struct btrfs_fs_info *fs_info = inode->root->fs_info;
         size_t copy_end_kernel = offsetofend(struct btrfs_ioctl_encoded_io_args, flags);
         size_t copy_end;
         int ret;
         u64 disk_bytenr, disk_io_size;
-       struct file *file;
-       struct btrfs_inode *inode;
-       struct btrfs_fs_info *fs_info;
-       struct extent_io_tree *io_tree;
         loff_t pos;
         struct kiocb kiocb;
         struct extent_state *cached_state = NULL;
@@ -4803,10 +4813,11 @@ static int btrfs_uring_encoded_read(struct io_uring_cmd *cmd, unsigned int issue
                 ret = -EPERM;
                 goto out_acct;
         }
-       file = cmd->file;
-       inode = BTRFS_I(file->f_inode);
-       fs_info = inode->root->fs_info;
-       io_tree = &inode->io_tree;
+       if (fs_info->sectorsize > PAGE_SIZE) {
+               ret = -ENOTTY;
+               goto out_acct;
+       }
+
         sqe_addr = u64_to_user_ptr(READ_ONCE(cmd->sqe->addr));
  
         if (issue_flags & IO_URING_F_COMPAT) {
@@ -4933,9 +4944,10 @@ out_acct:
  
  static int btrfs_uring_encoded_write(struct io_uring_cmd *cmd, unsigned int issue_flags)
  {
+       struct file *file = cmd->file;
+       struct btrfs_fs_info *fs_info = inode_to_fs_info(file->f_inode);
         loff_t pos;
         struct kiocb kiocb;
-       struct file *file;
         ssize_t ret;
         void __user *sqe_addr;
         struct io_btrfs_cmd *bc = io_uring_cmd_to_pdu(cmd, struct io_btrfs_cmd);
@@ -4948,8 +4960,11 @@ static int btrfs_uring_encoded_write(struct io_uring_cmd *cmd, unsigned int issu
                 ret = -EPERM;
                 goto out_acct;
         }
+       if (fs_info->sectorsize > PAGE_SIZE) {
+               ret = -ENOTTY;
+               goto out_acct;
+       }
  
-       file = cmd->file;
         sqe_addr = u64_to_user_ptr(READ_ONCE(cmd->sqe->addr));
  
         if (!(file->f_mode & FMODE_WRITE)) {
diff --git a/fs/btrfs/send.c b/fs/btrfs/send.c

index 32653fc44a7583f731ef1fb92bd4355e5bc4c0fc..5e073502b9e8e90bafa1a05c8a70ecb455ce2954 100644 (file)
--- a/fs/btrfs/send.c
+++ b/fs/btrfs/send.c
@@ -5654,7 +5654,14 @@ static int send_extent_data(struct send_ctx *sctx, struct btrfs_path *path,
  
         ei = btrfs_item_ptr(leaf, path->slots[0],
                             struct btrfs_file_extent_item);
-       if ((sctx->flags & BTRFS_SEND_FLAG_COMPRESSED) &&
+       /*
+        * Do not go through encoded read for bs > ps cases.
+        *
+        * Encoded send uses vmalloc'ed pages as its buffer, so we can not
+        * ensure every folio is large enough to contain a block.
+        */
+       if (sctx->send_root->fs_info->sectorsize <= PAGE_SIZE &&
+           (sctx->flags & BTRFS_SEND_FLAG_COMPRESSED) &&
             btrfs_file_extent_compression(leaf, ei) != BTRFS_COMPRESS_NONE) {
                 bool is_inline = (btrfs_file_extent_type(leaf, ei) ==
                                   BTRFS_FILE_EXTENT_INLINE);
author	Qu Wenruo <wqu@suse.com>
	Tue, 9 Sep 2025 03:08:47 +0000 (12:38 +0930)
committer	David Sterba <dsterba@suse.com>
	Tue, 23 Sep 2025 06:49:25 +0000 (08:49 +0200)
fs/btrfs/direct-io.c		patch \| blob \| blame \| history
fs/btrfs/disk-io.c		patch \| blob \| blame \| history
fs/btrfs/fs.c		patch \| blob \| blame \| history
fs/btrfs/ioctl.c		patch \| blob \| blame \| history
fs/btrfs/send.c		patch \| blob \| blame \| history