xfs: pin inode backing buffer to the inode log item

author Dave Chinner <dchinner@redhat.com>
Fri, 4 Sep 2020 19:57:20 +0000 (15:57 -0400)
committer Eric Sandeen <sandeen@sandeen.net>
Fri, 4 Sep 2020 19:57:20 +0000 (15:57 -0400)
diff --git a/include/xfs_trans.h b/include/xfs_trans.h

index 75ca3777b76177080ba6defa229649fda2338a44..84f29418c40c757497743b8834bc7d7fd0189fdc 100644 (file)
--- a/include/xfs_trans.h
+++ b/include/xfs_trans.h
@@ -22,6 +22,7 @@ typedef struct xfs_log_item {
         struct xfs_mount                *li_mountp;     /* ptr to fs mount */
         uint                            li_type;        /* item type */
         unsigned long                   li_flags;       /* misc flags */
+       struct xfs_buf                  *li_buf;        /* real buffer pointer */
  } xfs_log_item_t;
  
  #define XFS_LI_DIRTY   3       /* log item dirty in transaction */
diff --git a/libxfs/libxfs_io.h b/libxfs/libxfs_io.h

index 34462f78a4c2cebf79eb268881d3dfc83ec110ad..8b67a57df9f760980473a57e2e8cf295c4d615d7 100644 (file)
--- a/libxfs/libxfs_io.h
+++ b/libxfs/libxfs_io.h
@@ -243,6 +243,12 @@ xfs_buf_associate_memory(struct xfs_buf *bp, void *mem, size_t len)
         return 0;
  }
  
+static inline void
+xfs_buf_hold(struct xfs_buf *bp)
+{
+       bp->b_node.cn_count++;
+}
+
  int libxfs_buf_get_uncached(struct xfs_buftarg *targ, size_t bblen, int flags,
                 struct xfs_buf **bpp);
  int libxfs_buf_read_uncached(struct xfs_buftarg *targ, xfs_daddr_t daddr,
@@ -253,7 +259,7 @@ int libxfs_buf_read_uncached(struct xfs_buftarg *targ, xfs_daddr_t daddr,
  static inline bool
  xfs_buf_delwri_queue(struct xfs_buf *bp, struct list_head *buffer_list)
  {
-       bp->b_node.cn_count++;
+       xfs_buf_hold(bp);
         list_add_tail(&bp->b_list, buffer_list);
         return true;
  }
diff --git a/libxfs/trans.c b/libxfs/trans.c

index a61f803fe32d80a165b890a739a75773f3001ac6..5b6e5946709a310314239bbd68a91622aa3fde58 100644 (file)
--- a/libxfs/trans.c
+++ b/libxfs/trans.c
@@ -780,6 +780,8 @@ xfs_inode_item_put(
  {
         struct xfs_inode                *ip = iip->ili_inode;
  
+       ASSERT(iip->ili_item.li_buf == NULL);
+
         ip->i_itemp = NULL;
         kmem_cache_free(xfs_ili_zone, iip);
  }
@@ -795,47 +797,35 @@ static void
  inode_item_done(
         struct xfs_inode_log_item       *iip)
  {
-       xfs_dinode_t                    *dip;
-       xfs_inode_t                     *ip;
-       xfs_mount_t                     *mp;
         xfs_buf_t                       *bp;
         int                             error;
  
-       ip = iip->ili_inode;
-       mp = iip->ili_item.li_mountp;
-       ASSERT(ip != NULL);
+       ASSERT(iip->ili_inode != NULL);
  
         if (!(iip->ili_fields & XFS_ILOG_ALL))
-               goto free;
+               goto free_item;
  
-       /*
-        * Get the buffer containing the on-disk inode.
-        */
-       error = xfs_imap_to_bp(mp, NULL, &ip->i_imap, &dip, &bp, 0);
-       if (error) {
-               fprintf(stderr, _("%s: warning - imap_to_bp failed (%d)\n"),
-                       progname, error);
-               goto free;
-       }
+       bp = iip->ili_item.li_buf;
+       iip->ili_item.li_buf = NULL;
  
         /*
          * Flush the inode and disassociate it from the transaction regardless
          * of whether the flush succeed or not. If we fail the flush, make sure
          * we still release the buffer reference we currently hold.
          */
-       error = libxfs_iflush_int(ip, bp);
+       error = libxfs_iflush_int(iip->ili_inode, bp);
         bp->b_transp = NULL;    /* remove xact ptr */
  
         if (error) {
                 fprintf(stderr, _("%s: warning - iflush_int failed (%d)\n"),
                         progname, error);
-               libxfs_buf_relse(bp);
                 goto free;
         }
  
         libxfs_buf_mark_dirty(bp);
-       libxfs_buf_relse(bp);
  free:
+       libxfs_buf_relse(bp);
+free_item:
         xfs_inode_item_put(iip);
  }
  
diff --git a/libxfs/xfs_inode_buf.c b/libxfs/xfs_inode_buf.c

index 6362ee44225903a0b579be88c1377e8ae91f554e..89676440387f7e62cc6a7c539f00cde547497411 100644 (file)
--- a/libxfs/xfs_inode_buf.c
+++ b/libxfs/xfs_inode_buf.c
@@ -173,7 +173,8 @@ xfs_imap_to_bp(
         }
  
         *bpp = bp;
-       *dipp = xfs_buf_offset(bp, imap->im_boffset);
+       if (dipp)
+               *dipp = xfs_buf_offset(bp, imap->im_boffset);
         return 0;
  }
  
diff --git a/libxfs/xfs_trans_inode.c b/libxfs/xfs_trans_inode.c

index aaa310f783414e55cb027681e8b6c274a58142b2..4387660b9e075dd8c455f3972b8c93bb9c7dfdcb 100644 (file)
--- a/libxfs/xfs_trans_inode.c
+++ b/libxfs/xfs_trans_inode.c
@@ -8,6 +8,8 @@
  #include "xfs_shared.h"
  #include "xfs_format.h"
  #include "xfs_log_format.h"
+#include "xfs_trans_resv.h"
+#include "xfs_mount.h"
  #include "xfs_inode.h"
  #include "xfs_trans.h"
  
@@ -69,13 +71,19 @@ xfs_trans_ichgtime(
  }
  
  /*
- * This is called to mark the fields indicated in fieldmask as needing
- * to be logged when the transaction is committed.  The inode must
- * already be associated with the given transaction.
+ * This is called to mark the fields indicated in fieldmask as needing to be
+ * logged when the transaction is committed.  The inode must already be
+ * associated with the given transaction.
   *
- * The values for fieldmask are defined in xfs_inode_item.h.  We always
- * log all of the core inode if any of it has changed, and we always log
- * all of the inline data/extents/b-tree root if any of them has changed.
+ * The values for fieldmask are defined in xfs_inode_item.h.  We always log all
+ * of the core inode if any of it has changed, and we always log all of the
+ * inline data/extents/b-tree root if any of them has changed.
+ *
+ * Grab and pin the cluster buffer associated with this inode to avoid RMW
+ * cycles at inode writeback time. Avoid the need to add error handling to every
+ * xfs_trans_log_inode() call by shutting down on read error.  This will cause
+ * transactions to fail and everything to error out, just like if we return a
+ * read error in a dirty transaction and cancel it.
   */
  void
  xfs_trans_log_inode(
@@ -128,6 +136,39 @@ xfs_trans_log_inode(
         spin_lock(&iip->ili_lock);
         iip->ili_fsync_fields |= flags;
  
+       if (!iip->ili_item.li_buf) {
+               struct xfs_buf  *bp;
+               int             error;
+
+               /*
+                * We hold the ILOCK here, so this inode is not going to be
+                * flushed while we are here. Further, because there is no
+                * buffer attached to the item, we know that there is no IO in
+                * progress, so nothing will clear the ili_fields while we read
+                * in the buffer. Hence we can safely drop the spin lock and
+                * read the buffer knowing that the state will not change from
+                * here.
+                */
+               spin_unlock(&iip->ili_lock);
+               error = xfs_imap_to_bp(ip->i_mount, tp, &ip->i_imap, NULL,
+                                       &bp, 0);
+               if (error) {
+                       xfs_force_shutdown(ip->i_mount, SHUTDOWN_META_IO_ERROR);
+                       return;
+               }
+
+               /*
+                * We need an explicit buffer reference for the log item but
+                * don't want the buffer to remain attached to the transaction.
+                * Hold the buffer but release the transaction reference.
+                */
+               xfs_buf_hold(bp);
+               xfs_trans_brelse(tp, bp);
+
+               spin_lock(&iip->ili_lock);
+               iip->ili_item.li_buf = bp;
+       }
+
         /*
          * Always OR in the bits from the ili_last_fields field.  This is to
          * coordinate with the xfs_iflush() and xfs_iflush_done() routines in
author	Dave Chinner <dchinner@redhat.com>
	Fri, 4 Sep 2020 19:57:20 +0000 (15:57 -0400)
committer	Eric Sandeen <sandeen@sandeen.net>
	Fri, 4 Sep 2020 19:57:20 +0000 (15:57 -0400)
include/xfs_trans.h		patch | blob | blame | history
libxfs/libxfs_io.h		patch | blob | blame | history
libxfs/trans.c		patch | blob | blame | history
libxfs/xfs_inode_buf.c		patch | blob | blame | history
libxfs/xfs_trans_inode.c		patch | blob | blame | history