fs/dax: always remove DAX page-cache entries when breaking layouts
author		Alistair Popple <apopple@nvidia.com>
		Fri, 28 Feb 2025 03:31:01 +0000 (14:31 +1100)
committer	Andrew Morton <akpm@linux-foundation.org>
		Tue, 18 Mar 2025 05:06:37 +0000 (22:06 -0700)
Prior to any truncation operation, file systems call dax_break_layout()
to ensure pages in the range are not undergoing DMA.  Later, DAX
page-cache entries are removed by truncate_folio_batch_exceptionals()
in the generic page-cache code.

However, this makes it possible for folios to be removed from the
page-cache even though they are still DMA busy if the file system hasn't
called dax_break_layout().  It also means they can never be waited on in
future because FS DAX will lose track of them once the page-cache entry
has been deleted.

Instead, it is better to delete the FS DAX entry when the file system
calls dax_break_layout() as part of its truncate operation.  This ensures
only idle pages can be removed from the FS DAX page-cache and makes it
easy to detect if a file system hasn't called dax_break_layout() prior to
a truncate operation.
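
For illustration only, the expected calling sequence on a truncate path
looks roughly like the sketch below.  The foofs_* names are hypothetical
and the locking is elided; in practice the wait callback drops and
retakes the file system's mapping lock while sleeping:

	/* Hypothetical FS DAX truncate path (sketch, not from this patch). */
	static int foofs_truncate(struct inode *inode, loff_t newsize)
	{
		int error;

		/*
		 * Unmap the range, wait for any DMA to finish and delete
		 * the DAX page-cache entries before shrinking the file...
		 */
		error = dax_break_layout(inode, newsize, LLONG_MAX,
					 foofs_wait_dax_page);
		if (error)
			return error;

		/*
		 * ...so the generic truncate code finds no DAX entries
		 * left in the range.
		 */
		truncate_setsize(inode, newsize);
		return 0;
	}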

Link: https://lkml.kernel.org/r/3be6115eaaa8d28fee37fcba3287be4f226a7d24.1740713401.git-series.apopple@nvidia.com
Signed-off-by: Alistair Popple <apopple@nvidia.com>
Reviewed-by: Dan Williams <dan.j.williams@intel.com>
Tested-by: Alison Schofield <alison.schofield@intel.com>
Cc: Alexander Gordeev <agordeev@linux.ibm.com>
Cc: Asahi Lina <lina@asahilina.net>
Cc: Balbir Singh <balbirs@nvidia.com>
Cc: Bjorn Helgaas <bhelgaas@google.com>
Cc: Catalin Marinas <catalin.marinas@arm.com>
Cc: Christian Borntraeger <borntraeger@linux.ibm.com>
Cc: Christoph Hellwig <hch@lst.de>
Cc: Chunyan Zhang <zhang.lyra@gmail.com>
Cc: "Darrick J. Wong" <djwong@kernel.org>
Cc: Dave Chinner <david@fromorbit.com>
Cc: Dave Hansen <dave.hansen@linux.intel.com>
Cc: Dave Jiang <dave.jiang@intel.com>
Cc: David Hildenbrand <david@redhat.com>
Cc: Gerald Schaefer <gerald.schaefer@linux.ibm.com>
Cc: Heiko Carstens <hca@linux.ibm.com>
Cc: Huacai Chen <chenhuacai@kernel.org>
Cc: Ira Weiny <ira.weiny@intel.com>
Cc: Jan Kara <jack@suse.cz>
Cc: Jason Gunthorpe <jgg@nvidia.com>
Cc: Jason Gunthorpe <jgg@ziepe.ca>
Cc: John Hubbard <jhubbard@nvidia.com>
Cc: linmiaohe <linmiaohe@huawei.com>
Cc: Logan Gunthorpe <logang@deltatee.com>
Cc: Matthew Wilcox (Oracle) <willy@infradead.org>
Cc: Michael "Camp Drill Sergeant" Ellerman <mpe@ellerman.id.au>
Cc: Nicholas Piggin <npiggin@gmail.com>
Cc: Peter Xu <peterx@redhat.com>
Cc: Sven Schnelle <svens@linux.ibm.com>
Cc: Ted Ts'o <tytso@mit.edu>
Cc: Vasily Gorbik <gor@linux.ibm.com>
Cc: Vishal Verma <vishal.l.verma@intel.com>
Cc: Vivek Goyal <vgoyal@redhat.com>
Cc: WANG Xuerui <kernel@xen0n.name>
Cc: Will Deacon <will@kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
fs/dax.c
fs/xfs/xfs_inode.c
include/linux/dax.h
mm/truncate.c

index f1945aa65eb099216e6d680c699975ef608470b4..14fbe516303713dcae1aeffafbab78f9c6444340 100644
--- a/fs/dax.c
+++ b/fs/dax.c
@@ -846,6 +846,36 @@ int dax_delete_mapping_entry(struct address_space *mapping, pgoff_t index)
        return ret;
 }
 
+void dax_delete_mapping_range(struct address_space *mapping,
+                               loff_t start, loff_t end)
+{
+       void *entry;
+       pgoff_t start_idx = start >> PAGE_SHIFT;
+       pgoff_t end_idx;
+       XA_STATE(xas, &mapping->i_pages, start_idx);
+
+       /* If end == LLONG_MAX, delete all pages from start to the end of file */
+       if (end == LLONG_MAX)
+               end_idx = ULONG_MAX;
+       else
+               end_idx = end >> PAGE_SHIFT;
+
+       xas_lock_irq(&xas);
+       xas_for_each(&xas, entry, end_idx) {
+               if (!xa_is_value(entry))
+                       continue;
+               entry = wait_entry_unlocked_exclusive(&xas, entry);
+               if (!entry)
+                       continue;
+               dax_disassociate_entry(entry, mapping, true);
+               xas_store(&xas, NULL);
+               mapping->nrpages -= 1UL << dax_entry_order(entry);
+               put_unlocked_entry(&xas, entry, WAKE_ALL);
+       }
+       xas_unlock_irq(&xas);
+}
+EXPORT_SYMBOL_GPL(dax_delete_mapping_range);
+
 static int wait_page_idle(struct page *page,
                        void (cb)(struct inode *),
                        struct inode *inode)
@@ -857,6 +887,9 @@ static int wait_page_idle(struct page *page,
 /*
  * Unmaps the inode and waits for any DMA to complete prior to deleting the
  * DAX mapping entries for the range.
+ *
+ * For NOWAIT behavior, pass @cb as NULL to return early on the first
+ * busy page found.
  */
 int dax_break_layout(struct inode *inode, loff_t start, loff_t end,
                void (cb)(struct inode *))
@@ -871,10 +904,17 @@ int dax_break_layout(struct inode *inode, loff_t start, loff_t end,
                page = dax_layout_busy_page_range(inode->i_mapping, start, end);
                if (!page)
                        break;
+               if (!cb) {
+                       error = -ERESTARTSYS;
+                       break;
+               }
 
                error = wait_page_idle(page, cb, inode);
        } while (error == 0);
 
+       if (!page)
+               dax_delete_mapping_range(inode->i_mapping, start, end);
+
        return error;
 }
 EXPORT_SYMBOL_GPL(dax_break_layout);
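
Passing a NULL callback gives callers a non-blocking variant of the
above.  A rough sketch of the two modes, with foofs_wait_dax_page()
hypothetical and the caller's locking assumed:

	/* Blocking: @cb cycles the caller's locks while waiting for DMA. */
	error = dax_break_layout(inode, 0, LLONG_MAX, foofs_wait_dax_page);

	/*
	 * Non-blocking: a NULL @cb makes dax_break_layout() return
	 * -ERESTARTSYS on the first DMA-busy page instead of sleeping,
	 * leaving the caller to drop its locks and retry.
	 */
	error = dax_break_layout(inode, 0, LLONG_MAX, NULL);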
index d4f07e02b28b000cceb08878560feae5abb040c4..80083376a1d057e25c8eef59bad7d3a06f3ea83a 100644
--- a/fs/xfs/xfs_inode.c
+++ b/fs/xfs/xfs_inode.c
@@ -2735,7 +2735,6 @@ xfs_mmaplock_two_inodes_and_break_dax_layout(
        struct xfs_inode        *ip2)
 {
        int                     error;
-       struct page             *page;
 
        if (ip1->i_ino > ip2->i_ino)
                swap(ip1, ip2);
@@ -2759,8 +2758,8 @@ again:
         * need to unlock & lock the XFS_MMAPLOCK_EXCL which is not suitable
         * for this nested lock case.
         */
-       page = dax_layout_busy_page(VFS_I(ip2)->i_mapping);
-       if (!dax_page_is_idle(page)) {
+       error = dax_break_layout(VFS_I(ip2), 0, -1, NULL);
+       if (error) {
                xfs_iunlock(ip2, XFS_MMAPLOCK_EXCL);
                xfs_iunlock(ip1, XFS_MMAPLOCK_EXCL);
                goto again;
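
The two-inode path above cannot sleep in a wait callback, since that
would mean dropping both MMAPLOCKs mid-wait; instead it uses the
non-blocking form and retries the whole locking sequence.  Schematically
(a simplified reading of the surrounding XFS code, not an addition to it):

	again:
		/* take both MMAPLOCKs in inode-number order */
		xfs_ilock(ip1, XFS_MMAPLOCK_EXCL);
		xfs_ilock(ip2, XFS_MMAPLOCK_EXCL);

		/* ip2 must not sleep here, hence the NULL callback */
		error = dax_break_layout(VFS_I(ip2), 0, -1, NULL);
		if (error) {
			/* a DMA-busy page was found: unlock both and retry */
			xfs_iunlock(ip2, XFS_MMAPLOCK_EXCL);
			xfs_iunlock(ip1, XFS_MMAPLOCK_EXCL);
			goto again;
		}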
index a6b277f1e13a09b2ceae711295c7e3f7c449ebcb..2fbb262092caca519c43fc165baf134358663c94 100644
--- a/include/linux/dax.h
+++ b/include/linux/dax.h
@@ -255,6 +255,8 @@ vm_fault_t dax_iomap_fault(struct vm_fault *vmf, unsigned int order,
 vm_fault_t dax_finish_sync_fault(struct vm_fault *vmf,
                unsigned int order, pfn_t pfn);
 int dax_delete_mapping_entry(struct address_space *mapping, pgoff_t index);
+void dax_delete_mapping_range(struct address_space *mapping,
+                               loff_t start, loff_t end);
 int dax_invalidate_mapping_entry_sync(struct address_space *mapping,
                                      pgoff_t index);
 int __must_check dax_break_layout(struct inode *inode, loff_t start,
index 76d8fcd89bd003a6c0a565ec5a023376b1c86fe2..79570045071c07b4857eb8de6b07940a28245438 100644
--- a/mm/truncate.c
+++ b/mm/truncate.c
@@ -78,8 +78,22 @@ static void truncate_folio_batch_exceptionals(struct address_space *mapping,
 
        if (dax_mapping(mapping)) {
                for (i = j; i < nr; i++) {
-                       if (xa_is_value(fbatch->folios[i]))
+                       if (xa_is_value(fbatch->folios[i])) {
+                               /*
+                                * File systems should already have called
+                                * dax_break_layout_entry() to remove all DAX
+                                * entries while holding a lock to prevent
+                                * establishing new entries. Therefore we
+                                * shouldn't find any here.
+                                */
+                               WARN_ON_ONCE(1);
+
+                               /*
+                                * Delete the mapping so truncate_pagecache()
+                                * doesn't loop forever.
+                                */
                                dax_delete_mapping_entry(mapping, indices[i]);
+                       }
                }
                goto out;
        }
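
The defensive dax_delete_mapping_entry() call behind the WARN matters
because the final loop in truncate_inode_pages_range() rescans the range
from the start until nothing is found.  Its simplified shape
(illustrative, taken from the generic truncate code rather than this diff):

	index = start;
	while (index < end) {
		if (!find_get_entries(mapping, &index, end - 1,
				      &fbatch, indices)) {
			if (index == start)
				break;		/* range is empty, done */
			index = start;		/* otherwise rescan from start */
			continue;
		}
		truncate_folio_batch_exceptionals(mapping, &fbatch, indices);
		folio_batch_release(&fbatch);
	}

A DAX value entry that was never deleted would be returned on every
rescan, so truncate_pagecache() would spin forever.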